Upload folder using huggingface_hub

Browse files

Files changed (11)

config.json +2 -1
generation_config.json +27 -2
onnx/decoder_model.onnx +2 -2
onnx/decoder_model_merged.onnx +2 -2
onnx/decoder_model_merged_quantized.onnx +2 -2
onnx/decoder_model_quantized.onnx +2 -2
onnx/decoder_with_past_model.onnx +2 -2
onnx/decoder_with_past_model_quantized.onnx +2 -2
onnx/encoder_model.onnx +2 -2
onnx/encoder_model_quantized.onnx +2 -2
quantize_config.json +115 -0

config.json CHANGED Viewed

@@ -50,6 +50,7 @@
   "max_length": 448,
   "max_source_positions": 1500,
   "max_target_positions": 448,
   "model_type": "whisper",
   "num_hidden_layers": 24,
   "num_mel_bins": 80,
@@ -145,7 +146,7 @@
     50361,
     50362
   ],
-  "transformers_version": "4.30.2",
   "use_cache": true,
   "use_weighted_layer_sum": false,
   "vocab_size": 51865

   "max_length": 448,
   "max_source_positions": 1500,
   "max_target_positions": 448,
+  "median_filter_width": 7,
   "model_type": "whisper",
   "num_hidden_layers": 24,
   "num_mel_bins": 80,
@@ -145,7 +146,7 @@
     50361,
     50362
   ],
+  "transformers_version": "4.33.0.dev0",
   "use_cache": true,
   "use_weighted_layer_sum": false,
   "vocab_size": 51865

generation_config.json CHANGED Viewed

@@ -1,5 +1,30 @@
 {
-  "alignment_heads": [[13, 15], [15, 4], [15, 15], [16, 1], [20, 0], [23, 4]],
   "begin_suppress_tokens": [
     220,
     50257
@@ -217,5 +242,5 @@
     "transcribe": 50359,
     "translate": 50358
   },
-  "transformers_version": "4.30.2"
 }

 {
+  "alignment_heads": [
+    [
+      13,
+      15
+    ],
+    [
+      15,
+      4
+    ],
+    [
+      15,
+      15
+    ],
+    [
+      16,
+      1
+    ],
+    [
+      20,
+      0
+    ],
+    [
+      23,
+      4
+    ]
+  ],
   "begin_suppress_tokens": [
     220,
     50257
@@ -217,5 +242,5 @@
     "transcribe": 50359,
     "translate": 50358
   },
+  "transformers_version": "4.33.0.dev0"
 }

onnx/decoder_model.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0a648963b5554dd3b637976d78be6befa6093f59dbfcb6374c0363acdb953c1a
-size 2040015092

 version https://git-lfs.github.com/spec/v1
+oid sha256:00ea982dc84ad2d2904b46749eab6f27aa56287d523ae4d5dbcd0f2fd5ae902b
+size 1827707405

onnx/decoder_model_merged.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6f82a91e07ab23f138384c1d6aba1f20b3437ccb6beb3eaa21b4ef74cdc292ed
-size 1926573

 version https://git-lfs.github.com/spec/v1
+oid sha256:c3b860eefa7321ea078f00a5d4b821f36dd38362ba3641a579ddfde3df37b45e
+size 1828728265

onnx/decoder_model_merged_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0bdb36b4facd9a224dde4533588f876ab0fb3599001bde4869a39e014594ce13
-size 515407456

 version https://git-lfs.github.com/spec/v1
+oid sha256:2cdd6d06ebdf9d993d21117bfeeb7e9b399521b7766d3df77c54a85d6dcf3c08
+size 462661606

onnx/decoder_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:bf74fbc6d746531b96673d35e8bd455bb049a4f570847b925e9685fe426bc5a0
-size 514019282

 version https://git-lfs.github.com/spec/v1
+oid sha256:8aa8c0ac25486ecb9dc83cf49b08d6abd22d4ef6960f3d21c00a3ab6f1a8a439
+size 461079957

onnx/decoder_with_past_model.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:885893286374cb2cf662a74c0912ff6c47f0caf80964153555a0398cbeca3b86
-size 1838441751

 version https://git-lfs.github.com/spec/v1
+oid sha256:6bd9e6475391368696a8bf1c8ba10d3a0f8c07ea7e3b3545ed7ccedb28526cd4
+size 1626146694

onnx/decoder_with_past_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e81dd3275a51a8fd1a41247b7cfb4bba5df7d10b3814640c7920579bcca19ba6
-size 463340703

 version https://git-lfs.github.com/spec/v1
+oid sha256:d652797726d1662d3fe72daa93fccc814e42e68e119d827795ce712f17a705a8
+size 410418679

onnx/encoder_model.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:70292a0b342decb984585a1dcd93ad204dc9640370af48a2f829220483b2835c
-size 1229258863

 version https://git-lfs.github.com/spec/v1
+oid sha256:2089510b7427f03f3126e35a007b9eaf64bd7497d37d13e763264e9178f4a267
+size 1229312445

onnx/encoder_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:5d01068c82a2d3e963ffe9047b5cb802539a4f26980434c00f844d431a794ff1
-size 313397176

 version https://git-lfs.github.com/spec/v1
+oid sha256:7d6b4a00e441271646327f8a71b6e1bd1a305013cd914b51ddd76919c59ee3af
+size 313468028

quantize_config.json ADDED Viewed

@@ -0,0 +1,115 @@

+{
+    "per_channel": false,
+    "reduce_range": false,
+    "per_model_config": {
+        "decoder_model": {
+            "op_types": [
+                "Expand",
+                "Concat",
+                "Div",
+                "Cast",
+                "Slice",
+                "Mul",
+                "Where",
+                "Transpose",
+                "Erf",
+                "Reshape",
+                "Equal",
+                "ConstantOfShape",
+                "Unsqueeze",
+                "ReduceMean",
+                "Softmax",
+                "Squeeze",
+                "Less",
+                "Range",
+                "MatMul",
+                "Pow",
+                "Sqrt",
+                "Sub",
+                "Add",
+                "Constant",
+                "Gather",
+                "Shape"
+            ],
+            "weight_type": "QInt8"
+        },
+        "decoder_model_merged": {
+            "op_types": [
+                "Expand",
+                "Concat",
+                "Div",
+                "Cast",
+                "Slice",
+                "Mul",
+                "Where",
+                "Transpose",
+                "Erf",
+                "Reshape",
+                "Equal",
+                "ConstantOfShape",
+                "Unsqueeze",
+                "ReduceMean",
+                "Softmax",
+                "Squeeze",
+                "Less",
+                "Range",
+                "MatMul",
+                "Pow",
+                "If",
+                "Sqrt",
+                "Sub",
+                "Add",
+                "Constant",
+                "Gather",
+                "Shape"
+            ],
+            "weight_type": "QInt8"
+        },
+        "decoder_with_past_model": {
+            "op_types": [
+                "ReduceMean",
+                "Div",
+                "Concat",
+                "Sqrt",
+                "Sub",
+                "Softmax",
+                "Add",
+                "Transpose",
+                "Constant",
+                "Gather",
+                "Shape",
+                "Slice",
+                "Erf",
+                "Reshape",
+                "Mul",
+                "MatMul",
+                "Unsqueeze",
+                "Pow"
+            ],
+            "weight_type": "QInt8"
+        },
+        "encoder_model": {
+            "op_types": [
+                "ReduceMean",
+                "Div",
+                "Sqrt",
+                "Concat",
+                "Sub",
+                "Softmax",
+                "Add",
+                "Transpose",
+                "Constant",
+                "Gather",
+                "Shape",
+                "Erf",
+                "Reshape",
+                "Mul",
+                "Conv",
+                "MatMul",
+                "Unsqueeze",
+                "Pow"
+            ],
+            "weight_type": "QUInt8"
+        }
+    }
+}