Upload folder using huggingface_hub

Browse files

Files changed (10) hide show

config.json +1 -1
generation_config.json +1 -1
onnx/decoder_model.onnx +2 -2
onnx/decoder_model_merged.onnx +2 -2
onnx/decoder_model_merged_quantized.onnx +2 -2
onnx/decoder_model_quantized.onnx +2 -2
onnx/decoder_with_past_model.onnx +2 -2
onnx/decoder_with_past_model_quantized.onnx +2 -2
quantize_config.json +66 -65
tokenizer.json +3 -3

config.json CHANGED Viewed

@@ -19,7 +19,7 @@
   "rope_scaling": null,
   "rope_theta": 10000.0,
   "tie_word_embeddings": true,
-  "transformers_version": "4.34.0.dev0",
   "use_cache": true,
   "vocab_size": 32000
 }

   "rope_scaling": null,
   "rope_theta": 10000.0,
   "tie_word_embeddings": true,
+  "transformers_version": "4.33.2",
   "use_cache": true,
   "vocab_size": 32000
 }

generation_config.json CHANGED Viewed

@@ -2,5 +2,5 @@
   "_from_model_config": true,
   "bos_token_id": 1,
   "eos_token_id": 2,
-  "transformers_version": "4.34.0.dev0"
 }

   "_from_model_config": true,
   "bos_token_id": 1,
   "eos_token_id": 2,
+  "transformers_version": "4.33.2"
 }

onnx/decoder_model.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9b4055de40adc6080300cb0a1a8986259c228b2447689651d7ce91ce340380b6
-size 439063717

 version https://git-lfs.github.com/spec/v1
+oid sha256:793dc3c2b6d845a6954eec6c173cf952485e3af5fa80b22a6337a03a921c5606
+size 439064264

onnx/decoder_model_merged.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c27b7753ee0c8f83371ce28ebe01b94cddf93cc1045a9171623dc03d3b561c38
-size 440015873

 version https://git-lfs.github.com/spec/v1
+oid sha256:e899dcfd259d7f983e216fffef3756c7e6f72871790ff9fd9cd1eb16601a94ba
+size 440016914

onnx/decoder_model_merged_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:53a4a3b603720730b5d126fe18fb61f68ca137903881ca3d84db3bb0776d11d8
-size 111933644

 version https://git-lfs.github.com/spec/v1
+oid sha256:ba2a5f1df565916ffeaf95948f9ed9bcf1d5b87c3887cd94a7691fff1458a91c
+size 111935100

onnx/decoder_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b6c5f19b29fc636f5975f964289fc67d23039120b6479969746c7d51d36f2574
-size 110756863

 version https://git-lfs.github.com/spec/v1
+oid sha256:0aedbba316748e1a640f9be5d920497f8c0d9be6ca4e1c37c2e71dfdc3dc5693
+size 110757634

onnx/decoder_with_past_model.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a4194c70db527ebd117f4e530341522136e8c6322c86d9ff9cbff875da26c577
-size 439070831

 version https://git-lfs.github.com/spec/v1
+oid sha256:04f8916b363cd9226c6fc019eb26b181f43572b3a87b4cd564a9e78e597100db
+size 439071283

onnx/decoder_with_past_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:5e4a9d9b0e56de9f578abc299639909b3cca9258b87a55d0ef3ef9ae5ede0a55
-size 110765314

 version https://git-lfs.github.com/spec/v1
+oid sha256:5c7d4a097526bc1b211b8e5c7b4f4004f2b58c9d0076893afa9ca31c65507648
+size 110765955

quantize_config.json CHANGED Viewed

@@ -4,101 +4,102 @@
     "per_model_config": {
         "decoder_with_past_model": {
             "op_types": [
-                "Sub",
-                "Slice",
-                "Constant",
-                "Identity",
-                "Equal",
-                "Sigmoid",
-                "Div",
-                "Mul",
-                "MatMul",
-                "Pow",
                 "Where",
-                "Neg",
-                "ConstantOfShape",
                 "Softmax",
-                "Add",
                 "Sqrt",
-                "Unsqueeze",
-                "Reshape",
-                "Expand",
-                "ReduceMean",
                 "Concat",
-                "Cast",
                 "Gather",
-                "Transpose",
-                "Shape",
                 "If",
-                "Squeeze"
             ],
             "weight_type": "QInt8"
         },
         "decoder_model": {
             "op_types": [
-                "Sub",
-                "Slice",
-                "Constant",
-                "Identity",
-                "Equal",
-                "Sigmoid",
-                "Div",
-                "Mul",
-                "MatMul",
-                "Pow",
                 "Where",
-                "Neg",
-                "ConstantOfShape",
                 "Softmax",
-                "Add",
                 "Sqrt",
-                "Unsqueeze",
-                "Reshape",
-                "Expand",
-                "ReduceMean",
                 "Concat",
                 "Less",
-                "Cast",
                 "Gather",
-                "Range",
-                "Transpose",
-                "Shape",
                 "If",
-                "Squeeze"
             ],
             "weight_type": "QInt8"
         },
         "decoder_model_merged": {
             "op_types": [
-                "Sub",
-                "Slice",
-                "Constant",
-                "Identity",
-                "Equal",
-                "Sigmoid",
-                "Div",
-                "Mul",
-                "MatMul",
-                "Pow",
                 "Where",
-                "Neg",
-                "ConstantOfShape",
                 "Softmax",
-                "Add",
                 "Sqrt",
-                "Unsqueeze",
-                "Reshape",
-                "Expand",
-                "ReduceMean",
                 "Concat",
                 "Less",
-                "Cast",
                 "Gather",
-                "Range",
-                "Transpose",
-                "Shape",
                 "If",
-                "Squeeze"
             ],
             "weight_type": "QInt8"
         }

     "per_model_config": {
         "decoder_with_past_model": {
             "op_types": [
                 "Where",
+                "Cast",
+                "Mul",
+                "Slice",
                 "Softmax",
                 "Sqrt",
+                "Shape",
+                "Add",
+                "Range",
                 "Concat",
+                "ReduceMean",
+                "Sub",
+                "Unsqueeze",
+                "ConstantOfShape",
+                "Squeeze",
+                "Identity",
+                "Constant",
                 "Gather",
+                "Expand",
+                "Sigmoid",
+                "Equal",
                 "If",
+                "Div",
+                "Neg",
+                "Pow",
+                "Transpose",
+                "MatMul",
+                "Reshape"
             ],
             "weight_type": "QInt8"
         },
         "decoder_model": {
             "op_types": [
                 "Where",
+                "Cast",
+                "Mul",
+                "Slice",
                 "Softmax",
                 "Sqrt",
+                "Shape",
+                "Add",
+                "Range",
                 "Concat",
+                "ReduceMean",
+                "Sub",
+                "Unsqueeze",
+                "ConstantOfShape",
                 "Less",
+                "Squeeze",
+                "Identity",
+                "Constant",
                 "Gather",
+                "Expand",
+                "Sigmoid",
+                "Equal",
                 "If",
+                "Div",
+                "Neg",
+                "Pow",
+                "Transpose",
+                "MatMul",
+                "Reshape"
             ],
             "weight_type": "QInt8"
         },
         "decoder_model_merged": {
             "op_types": [
                 "Where",
+                "Cast",
+                "Mul",
+                "Slice",
                 "Softmax",
                 "Sqrt",
+                "Shape",
+                "Add",
+                "Range",
                 "Concat",
+                "ReduceMean",
+                "Sub",
+                "Unsqueeze",
+                "ConstantOfShape",
                 "Less",
+                "Squeeze",
+                "Identity",
+                "Constant",
                 "Gather",
+                "Expand",
+                "Sigmoid",
+                "Equal",
                 "If",
+                "Div",
+                "Neg",
+                "Pow",
+                "Transpose",
+                "MatMul",
+                "Reshape"
             ],
             "weight_type": "QInt8"
         }

tokenizer.json CHANGED Viewed

@@ -9,7 +9,7 @@
       "single_word": false,
       "lstrip": false,
       "rstrip": false,
-      "normalized": true,
       "special": true
     },
     {
@@ -18,7 +18,7 @@
       "single_word": false,
       "lstrip": false,
       "rstrip": false,
-      "normalized": true,
       "special": true
     },
     {
@@ -27,7 +27,7 @@
       "single_word": false,
       "lstrip": false,
       "rstrip": false,
-      "normalized": true,
       "special": true
     }
   ],

       "single_word": false,
       "lstrip": false,
       "rstrip": false,
+      "normalized": false,
       "special": true
     },
     {
       "single_word": false,
       "lstrip": false,
       "rstrip": false,
+      "normalized": false,
       "special": true
     },
     {
       "single_word": false,
       "lstrip": false,
       "rstrip": false,
+      "normalized": false,
       "special": true
     }
   ],