Upload optimized ONNX files

#9
by Xenova HF staff - opened
.gitattributes CHANGED
@@ -38,3 +38,4 @@ onnx/decoder_model_merged.onnx_data filter=lfs diff=lfs merge=lfs -text
38
  onnx/decoder_with_past_model.onnx_data filter=lfs diff=lfs merge=lfs -text
39
  onnx/decoder_model_merged_fp16.onnx_data filter=lfs diff=lfs merge=lfs -text
40
  onnx/model.onnx_data filter=lfs diff=lfs merge=lfs -text
 
 
38
  onnx/decoder_with_past_model.onnx_data filter=lfs diff=lfs merge=lfs -text
39
  onnx/decoder_model_merged_fp16.onnx_data filter=lfs diff=lfs merge=lfs -text
40
  onnx/model.onnx_data filter=lfs diff=lfs merge=lfs -text
41
+ onnx/model_fp16.onnx_data filter=lfs diff=lfs merge=lfs -text
config.json CHANGED
@@ -36,6 +36,13 @@
36
  "vocab_size": 51200
37
  },
38
  "torch_dtype": "float16",
 
 
 
 
 
 
39
  "transformers_version": "4.38.2",
40
- "image_token_index": -200
 
41
  }
 
36
  "vocab_size": 51200
37
  },
38
  "torch_dtype": "float16",
39
+ "transformers.js_config": {
40
+ "kv_cache_dtype": {
41
+ "q4f16": "float16",
42
+ "fp16": "float16"
43
+ }
44
+ },
45
  "transformers_version": "4.38.2",
46
+ "image_token_index": -200,
47
+ "num_image_tokens": 729
48
  }
onnx/decoder_model_merged.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1376e35e61ef3f05be05af99f24a724e08684f900e79bf719e1ce1717bb05e1c
3
- size 3825843
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ed07185e6b33fd5bbfe6c4910d19f16d64dd1a1c6e81c5f383db6d1419939de9
3
+ size 206171
onnx/decoder_model_merged.onnx_data CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1e0f60b6dbd4825a09e4f6a0f1e276d15918f8fcf0283a7d89fc85192034c911
3
- size 5251268608
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8404f2cf7e57b91060649f9a71385ef090ac3756a197fb0a4714c0818bf71ea9
3
+ size 5253914836
onnx/decoder_model_merged_bnb4.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:33a5b77971745a0cd7d926fadf805b18c027d3368a8ba469e3427fb3e45dc43a
3
- size 742293206
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b814079a830ffa6942d9f023c308b97b39a2883f6911cff6c333910ed21d992e
3
+ size 741313259
onnx/decoder_model_merged_fp16.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:eb5f2a9ac6dd26268ff1ec8207d424206f4b198f78afffa8dff0b1e6ed61e0c0
3
- size 203712385
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:91fe49a027c173c2ee620da92291c47cc559a283d642a792b75c1d055d2b042a
3
+ size 546702655
onnx/decoder_model_merged_fp16.onnx_data CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9d42298b7c9ce5d0515fb806bb6b6ac55aad719860c71b8e5adec7e087360938
3
- size 2424307712
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:707a678ab9e378fb739d8574b2668b73e8b7354fb2bc275a34e97b81215c098c
3
+ size 2080374784
onnx/decoder_model_merged_int8.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:14f48eb98ae76a14108d3f45021877131efdafa1ee7644d8adfce7bda09666f1
3
- size 1317092101
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:187df70b79da653768efe78a8e693142357ed8230f3c3c0f418292d3b38f92ba
3
+ size 1315801598
onnx/decoder_model_merged_q4.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6c6c986cb277a8dbafb4d437b6e56717fbe3dab7c0d9efceb77cfde48d081273
3
- size 824343527
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7bc872a71d27ea5846619c1c22d195c30335380e23cb868ef5ec19ea9276849d
3
+ size 823291250
onnx/decoder_model_merged_q4f16.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:614bcbfdf03dea3eb3e04e20716cd9406d87086caf18ca797247d969156a9274
3
- size 740853830
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:76bbee9e65863a1b393a1c406f132164d98aa58fcdc9c983f85b069c13c295f5
3
+ size 739917135
onnx/decoder_model_merged_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:14f48eb98ae76a14108d3f45021877131efdafa1ee7644d8adfce7bda09666f1
3
- size 1317092101
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:187df70b79da653768efe78a8e693142357ed8230f3c3c0f418292d3b38f92ba
3
+ size 1315801598
onnx/decoder_model_merged_uint8.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:477dea38c4c4ebc0a31e4ecce7228476e387f0027d88b745f4621e35494b4273
3
- size 1317092152
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2d59781bbbbe8ba295f17f3c70e06947fb356bf362f8b74a3c3fd4ddf31f3511
3
+ size 1315801678
onnx/embed_tokens.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:61fb6a7100aca7c8af125ce05676451458f6f49d57b7ec7ea388e18223f09b75
3
- size 419430639
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bed90ca8a123893110aa6591564f604e1a7524a5a2be9a91e54d76cfefc8b6f2
3
+ size 419430702
onnx/embed_tokens_bnb4.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e83c0024e7785c5946ecda27729cdb4d32d5e6b72d75bc58a155f3d7247967ef
3
- size 419430658
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:24f112ee0d90dfcfc2790b27ca916fd78f74db775446900163f0396e8b30a5d7
3
+ size 419430721
onnx/embed_tokens_fp16.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ca61d34329494679c8f67f5c0f603e49fe9b71700dc8778a22d7dfeb3b90ce69
3
  size 209715586
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9abce1491a74b16e0f4d65562cca0898e23767ad8d932a6d0fea86fa57863fcc
3
  size 209715586
onnx/embed_tokens_int8.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:22e17babd5aa3ac2793aaa15691b285819be212d1bc959ab5156d32e6dce5c9f
3
- size 104858081
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:45f47b27a322cd2d6d9fde2980753bed787f8067033039b4d7adc7125a72291e
3
+ size 104858144
onnx/embed_tokens_q4.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e83c0024e7785c5946ecda27729cdb4d32d5e6b72d75bc58a155f3d7247967ef
3
- size 419430658
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:24f112ee0d90dfcfc2790b27ca916fd78f74db775446900163f0396e8b30a5d7
3
+ size 419430721
onnx/embed_tokens_q4f16.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9de08bf0ff0fc270f5f2f631df8a048d9fe75c6b26668e3eb34188943028de63
3
+ size 209715605
onnx/embed_tokens_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:22e17babd5aa3ac2793aaa15691b285819be212d1bc959ab5156d32e6dce5c9f
3
- size 104858081
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:45f47b27a322cd2d6d9fde2980753bed787f8067033039b4d7adc7125a72291e
3
+ size 104858144
onnx/embed_tokens_uint8.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:eef70215698d3dc1d820915960a5022479b5276e40e2490fb9c33bf3be11337b
3
- size 104858081
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:41b63b63b8dbba67e81dda6cbbc4754bae9a4edf3339bc3ab3e37037b6ae05e1
3
+ size 104858144
onnx/vision_encoder.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5f0ba31bab9513aaffb2ed83992e46c447dc3d5c37876b741e018de2392823b5
3
- size 1757316914
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2598d0ff22943d32b8de86f4e70c56b49404fe4199ec56fac7e112fa97adbf15
3
+ size 1794812180
onnx/vision_encoder_bnb4.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:16e58e62576028dd79b630744176b870adc455ed145b45a0524b6d45a6bfb048
3
- size 251839217
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ba452a98872aed0aa0d81083f473ae676aa0adfdef5408d8b48596579ba36243
3
+ size 256895150
onnx/vision_encoder_fp16.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:aa79c8ca1b7bc127be6cbcc4776908f7fc499080c52aeaab35e2c3c5ccc00f07
3
- size 879098082
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:481b17a8ee178daf3d3e763e7e98c57c54051fe497d888921269bf57ffd268fb
3
+ size 897514186
onnx/vision_encoder_int8.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3db8a049c57cd67501c72c65925d2d655e7446d57cdf846aeccef7a3a2d80b00
3
- size 443772614
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8e8f87a09e7abbec7ed439914458e30e0e3d891667a310cb4f136d5c5d627b0a
3
+ size 452702446
onnx/vision_encoder_q4.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e2458ab4ab41f43bb24c2b3aa2d68c34318612a6a628237e6c738ddbf5dc2843
3
- size 279536385
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:faf18220478e7df63daaf43722a052a85a6b10037f175f0952d441f961e21b3d
3
+ size 285182144
onnx/vision_encoder_q4f16.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d6e056c6bfd9c4ec7bad2079e8d2f41405a2c916ccfea137107a2a33aa4f5954
3
+ size 254687987
onnx/vision_encoder_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3db8a049c57cd67501c72c65925d2d655e7446d57cdf846aeccef7a3a2d80b00
3
- size 443772614
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8e8f87a09e7abbec7ed439914458e30e0e3d891667a310cb4f136d5c5d627b0a
3
+ size 452702446
onnx/vision_encoder_uint8.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a57444eb16ff2a1ce7ecf3aec849ec1f7870019fa13e77df10a16bc536ca62e2
3
- size 443772672
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:98516d42adba44eb53a3402d7c6a8c1875f9d2dfed14be3cebe3ba165f635a73
3
+ size 452702506