Upload folder using huggingface_hub
Browse files- onnx/decoder_model_merged.onnx +2 -2
- onnx/decoder_model_merged_bnb4.onnx +2 -2
- onnx/decoder_model_merged_fp16.onnx +2 -2
- onnx/decoder_model_merged_int8.onnx +2 -2
- onnx/decoder_model_merged_q4.onnx +2 -2
- onnx/decoder_model_merged_quantized.onnx +2 -2
- onnx/decoder_model_merged_uint8.onnx +2 -2
- onnx/encoder_model.onnx +2 -2
- onnx/encoder_model_bnb4.onnx +2 -2
- onnx/encoder_model_fp16.onnx +2 -2
- onnx/encoder_model_int8.onnx +2 -2
- onnx/encoder_model_q4.onnx +2 -2
- onnx/encoder_model_quantized.onnx +2 -2
- onnx/encoder_model_uint8.onnx +2 -2
- quantize_config.json +21 -3
onnx/decoder_model_merged.onnx
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:04bafad5115776073a393995b4109a8c2ed7851914ea8a9fc43387efbdba5c9f
|
| 3 |
+
size 615487747
|
onnx/decoder_model_merged_bnb4.onnx
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:624d05ae5f584631b43757360d536034c30a87cb0fa8df81eb6f653fc5b177bf
|
| 3 |
+
size 226236613
|
onnx/decoder_model_merged_fp16.onnx
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:84e805a94d456d27b37658133756b2fd2b41bdee3438c89657da741f7c9251cb
|
| 3 |
+
size 308795465
|
onnx/decoder_model_merged_int8.onnx
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:be2e00c055ade0a37a1554bca42697f8808e78f06dfeec164b9cbc72a0ba30f0
|
| 3 |
+
size 156971214
|
onnx/decoder_model_merged_q4.onnx
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:67687fa2d3b47d2ccfea1371d6841d02b08b58cdd232aa7fa4cba281a127c0ff
|
| 3 |
+
size 233312773
|
onnx/decoder_model_merged_quantized.onnx
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:be2e00c055ade0a37a1554bca42697f8808e78f06dfeec164b9cbc72a0ba30f0
|
| 3 |
+
size 156971214
|
onnx/decoder_model_merged_uint8.onnx
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1ed51acd891ed2157debbe3f128292c4f219dcd012054d54abfdfe2cd7608435
|
| 3 |
+
size 156971275
|
onnx/encoder_model.onnx
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ecc02082c11d78ba3fd49284ea96de9e7f6eb9b6fd3f4346c15d2d58c2749257
|
| 3 |
+
size 352858701
|
onnx/encoder_model_bnb4.onnx
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ffb0f9550ed789467f7bd13cd364a5ee2f15715b5b2066ea227b26c34e28eec3
|
| 3 |
+
size 60907047
|
onnx/encoder_model_fp16.onnx
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b39e25407618b2e92a713b25fe6faab127bde2ac89bf8a4b226321e33b35e6ba
|
| 3 |
+
size 176653325
|
onnx/encoder_model_int8.onnx
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:dbb892ee2e1adcdfb3aa5de0afa03aebacd0b21484187156583a0e27392b0a92
|
| 3 |
+
size 92371696
|
onnx/encoder_model_q4.onnx
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:038cee9c13e3d2da9f5a213e426486a23b841de901cdec4f7bf42af65f0d9275
|
| 3 |
+
size 66214935
|
onnx/encoder_model_quantized.onnx
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:663eb2991673c520b68fad25b48b4cb71e9e9cbc6a675e07cfceba463d20b58a
|
| 3 |
+
size 92371729
|
onnx/encoder_model_uint8.onnx
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:663eb2991673c520b68fad25b48b4cb71e9e9cbc6a675e07cfceba463d20b58a
|
| 3 |
+
size 92371729
|
quantize_config.json
CHANGED
|
@@ -5,18 +5,23 @@
|
|
| 5 |
"encoder_model": {
|
| 6 |
"op_types": [
|
| 7 |
"Add",
|
|
|
|
|
|
|
| 8 |
"Conv",
|
| 9 |
"Div",
|
| 10 |
"Erf",
|
|
|
|
| 11 |
"MatMul",
|
| 12 |
"Mul",
|
| 13 |
"Pow",
|
| 14 |
"ReduceMean",
|
| 15 |
"Reshape",
|
|
|
|
| 16 |
"Softmax",
|
| 17 |
"Sqrt",
|
| 18 |
"Sub",
|
| 19 |
-
"Transpose"
|
|
|
|
| 20 |
],
|
| 21 |
"weight_type": "QUInt8"
|
| 22 |
},
|
|
@@ -77,6 +82,7 @@
|
|
| 77 |
"decoder_model_merged": {
|
| 78 |
"op_types": [
|
| 79 |
"Add",
|
|
|
|
| 80 |
"Concat",
|
| 81 |
"Constant",
|
| 82 |
"ConstantOfShape",
|
|
@@ -114,18 +120,23 @@
|
|
| 114 |
"encoder_model": {
|
| 115 |
"op_types": [
|
| 116 |
"Add",
|
|
|
|
|
|
|
| 117 |
"Conv",
|
| 118 |
"Div",
|
| 119 |
"Erf",
|
|
|
|
| 120 |
"MatMul",
|
| 121 |
"Mul",
|
| 122 |
"Pow",
|
| 123 |
"ReduceMean",
|
| 124 |
"Reshape",
|
|
|
|
| 125 |
"Softmax",
|
| 126 |
"Sqrt",
|
| 127 |
"Sub",
|
| 128 |
-
"Transpose"
|
|
|
|
| 129 |
],
|
| 130 |
"weight_type": "QInt8"
|
| 131 |
},
|
|
@@ -186,6 +197,7 @@
|
|
| 186 |
"decoder_model_merged": {
|
| 187 |
"op_types": [
|
| 188 |
"Add",
|
|
|
|
| 189 |
"Concat",
|
| 190 |
"Constant",
|
| 191 |
"ConstantOfShape",
|
|
@@ -223,18 +235,23 @@
|
|
| 223 |
"encoder_model": {
|
| 224 |
"op_types": [
|
| 225 |
"Add",
|
|
|
|
|
|
|
| 226 |
"Conv",
|
| 227 |
"Div",
|
| 228 |
"Erf",
|
|
|
|
| 229 |
"MatMul",
|
| 230 |
"Mul",
|
| 231 |
"Pow",
|
| 232 |
"ReduceMean",
|
| 233 |
"Reshape",
|
|
|
|
| 234 |
"Softmax",
|
| 235 |
"Sqrt",
|
| 236 |
"Sub",
|
| 237 |
-
"Transpose"
|
|
|
|
| 238 |
],
|
| 239 |
"weight_type": "QUInt8"
|
| 240 |
},
|
|
@@ -295,6 +312,7 @@
|
|
| 295 |
"decoder_model_merged": {
|
| 296 |
"op_types": [
|
| 297 |
"Add",
|
|
|
|
| 298 |
"Concat",
|
| 299 |
"Constant",
|
| 300 |
"ConstantOfShape",
|
|
|
|
| 5 |
"encoder_model": {
|
| 6 |
"op_types": [
|
| 7 |
"Add",
|
| 8 |
+
"Concat",
|
| 9 |
+
"Constant",
|
| 10 |
"Conv",
|
| 11 |
"Div",
|
| 12 |
"Erf",
|
| 13 |
+
"Gather",
|
| 14 |
"MatMul",
|
| 15 |
"Mul",
|
| 16 |
"Pow",
|
| 17 |
"ReduceMean",
|
| 18 |
"Reshape",
|
| 19 |
+
"Shape",
|
| 20 |
"Softmax",
|
| 21 |
"Sqrt",
|
| 22 |
"Sub",
|
| 23 |
+
"Transpose",
|
| 24 |
+
"Unsqueeze"
|
| 25 |
],
|
| 26 |
"weight_type": "QUInt8"
|
| 27 |
},
|
|
|
|
| 82 |
"decoder_model_merged": {
|
| 83 |
"op_types": [
|
| 84 |
"Add",
|
| 85 |
+
"Cast",
|
| 86 |
"Concat",
|
| 87 |
"Constant",
|
| 88 |
"ConstantOfShape",
|
|
|
|
| 120 |
"encoder_model": {
|
| 121 |
"op_types": [
|
| 122 |
"Add",
|
| 123 |
+
"Concat",
|
| 124 |
+
"Constant",
|
| 125 |
"Conv",
|
| 126 |
"Div",
|
| 127 |
"Erf",
|
| 128 |
+
"Gather",
|
| 129 |
"MatMul",
|
| 130 |
"Mul",
|
| 131 |
"Pow",
|
| 132 |
"ReduceMean",
|
| 133 |
"Reshape",
|
| 134 |
+
"Shape",
|
| 135 |
"Softmax",
|
| 136 |
"Sqrt",
|
| 137 |
"Sub",
|
| 138 |
+
"Transpose",
|
| 139 |
+
"Unsqueeze"
|
| 140 |
],
|
| 141 |
"weight_type": "QInt8"
|
| 142 |
},
|
|
|
|
| 197 |
"decoder_model_merged": {
|
| 198 |
"op_types": [
|
| 199 |
"Add",
|
| 200 |
+
"Cast",
|
| 201 |
"Concat",
|
| 202 |
"Constant",
|
| 203 |
"ConstantOfShape",
|
|
|
|
| 235 |
"encoder_model": {
|
| 236 |
"op_types": [
|
| 237 |
"Add",
|
| 238 |
+
"Concat",
|
| 239 |
+
"Constant",
|
| 240 |
"Conv",
|
| 241 |
"Div",
|
| 242 |
"Erf",
|
| 243 |
+
"Gather",
|
| 244 |
"MatMul",
|
| 245 |
"Mul",
|
| 246 |
"Pow",
|
| 247 |
"ReduceMean",
|
| 248 |
"Reshape",
|
| 249 |
+
"Shape",
|
| 250 |
"Softmax",
|
| 251 |
"Sqrt",
|
| 252 |
"Sub",
|
| 253 |
+
"Transpose",
|
| 254 |
+
"Unsqueeze"
|
| 255 |
],
|
| 256 |
"weight_type": "QUInt8"
|
| 257 |
},
|
|
|
|
| 312 |
"decoder_model_merged": {
|
| 313 |
"op_types": [
|
| 314 |
"Add",
|
| 315 |
+
"Cast",
|
| 316 |
"Concat",
|
| 317 |
"Constant",
|
| 318 |
"ConstantOfShape",
|