Synchronizing local compiler cache.
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +97 -20
- neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/llama/meta-llama/Llama-2-13b-chat-hf/55d02a833c68f65f88c9.json +1 -0
- neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/llama/meta-llama/Llama-2-13b-chat-hf/a4fb9901e6811328a109.json +1 -0
- neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/llama/meta-llama/Llama-2-13b-chat-hf/a8c0b413e79c91496630.json +1 -0
- neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/llama/meta-llama/Llama-2-13b-chat-hf/d68250e23574798328a7.json +1 -0
- neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/mistral/mistralai/Mistral-7B-Instruct-v0.2/1245bb72b32d75db76f9.json +1 -0
- neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/mistral/mistralai/Mistral-7B-Instruct-v0.2/5e1e1d2ca63370d9d0a0.json +1 -0
- neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/mistral/mistralai/Mistral-7B-Instruct-v0.2/6255cc2875c3d0c5e501.json +1 -0
- neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/mistral/mistralai/Mistral-7B-Instruct-v0.2/64e0d5cd868faca4549f.json +1 -0
- neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/mistral/mistralai/Mistral-7B-Instruct-v0.2/733bc79383c0cc56537e.json +1 -0
- neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/mistral/mistralai/Mistral-7B-Instruct-v0.2/7fd9b858cf45bbf6355f.json +1 -0
- neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/mistral/mistralai/Mistral-7B-Instruct-v0.2/979fce2dd4e4d499c2f0.json +1 -0
- neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/mistral/mistralai/Mistral-7B-Instruct-v0.2/aa1ba12921766e16b7dc.json +1 -0
- neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/mistral/mistralai/Mistral-7B-Instruct-v0.2/ca240a79f952204527fc.json +1 -0
- neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/mistral/mistralai/Mistral-7B-Instruct-v0.2/eec3579b9122a80133a1.json +1 -0
- neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22/inference/llama/meta-llama/Llama-2-7b-chat-hf/06b52fde14a8f28d6a3d.json +1 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_007ddbaadfdea74c4db5+2c2d707e/model.neff +1 -1
- neuronxcc-2.13.66.0+6dfecc895/MODULE_01076e8d78b992483879+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_01076e8d78b992483879+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_01076e8d78b992483879+2c2d707e/model.neff +3 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_023098bfa18bb6b7e093+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_023098bfa18bb6b7e093+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_023098bfa18bb6b7e093+2c2d707e/model.neff +3 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_068011707d27c0821a21+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_068011707d27c0821a21+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_068011707d27c0821a21+2c2d707e/model.neff +3 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_0c9f98ff6f5d2ff116cb+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_0c9f98ff6f5d2ff116cb+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_0c9f98ff6f5d2ff116cb+2c2d707e/model.neff +3 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_104a70223ddf21bd9b47+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_104a70223ddf21bd9b47+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_104a70223ddf21bd9b47+2c2d707e/model.neff +3 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_122e6a965070aa927ca3+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_122e6a965070aa927ca3+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_122e6a965070aa927ca3+2c2d707e/model.neff +3 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_1f1e07d570ee56041d0a+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_1f1e07d570ee56041d0a+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_1f1e07d570ee56041d0a+2c2d707e/model.neff +3 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_20906ae3bb104009b559+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_20906ae3bb104009b559+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_20906ae3bb104009b559+2c2d707e/model.neff +3 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_21b1b0223e4fb6f5af41+2c2d707e/model.neff +1 -1
- neuronxcc-2.13.66.0+6dfecc895/MODULE_21d7ca83fa40eaf22249+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_237d06dbfd8a5be615d7+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_237d06dbfd8a5be615d7+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_237d06dbfd8a5be615d7+2c2d707e/model.neff +3 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_259391de413611a000d7+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_259391de413611a000d7+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_259391de413611a000d7+2c2d707e/model.neff +3 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_298bc643cbb368dd898d+2c2d707e/compile_flags.txt +1 -0
.gitattributes
CHANGED
@@ -2654,37 +2654,114 @@ neuronxcc-2.13.66.0+6dfecc895/MODULE_5f931e8bf304c87202cd+2c2d707e/model.neff fi
|
|
2654 |
neuronxcc-2.13.66.0+6dfecc895/MODULE_a4fe1c700a9abdb20641+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2655 |
neuronxcc-2.13.66.0+6dfecc895/MODULE_b54a08c18ad776940cd0+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2656 |
neuronxcc-2.13.66.0+6dfecc895/MODULE_b59ff3b7e545f85152c8+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2657 |
-
neuronxcc-2.13.66.0+6dfecc895/
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
2658 |
neuronxcc-2.13.66.0+6dfecc895/MODULE_21b1b0223e4fb6f5af41+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
2659 |
neuronxcc-2.13.66.0+6dfecc895/MODULE_3020655465d2e0990c19+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2660 |
-
neuronxcc-2.13.66.0+6dfecc895/
|
2661 |
-
neuronxcc-2.13.66.0+6dfecc895/
|
|
|
|
|
|
|
|
|
|
|
2662 |
neuronxcc-2.13.66.0+6dfecc895/MODULE_426cd9312d26b5e0bf95+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2663 |
-
neuronxcc-2.13.66.0+6dfecc895/
|
2664 |
neuronxcc-2.13.66.0+6dfecc895/MODULE_44563e64a3dddda1db4d+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
|
|
2665 |
neuronxcc-2.13.66.0+6dfecc895/MODULE_47eae16823191f315893+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2666 |
-
neuronxcc-2.13.66.0+6dfecc895/
|
2667 |
-
neuronxcc-2.13.66.0+6dfecc895/
|
2668 |
-
neuronxcc-2.13.66.0+6dfecc895/
|
2669 |
-
neuronxcc-2.13.66.0+6dfecc895/
|
|
|
|
|
|
|
|
|
|
|
|
|
2670 |
neuronxcc-2.13.66.0+6dfecc895/MODULE_62cafa382ec618cff287+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2671 |
-
neuronxcc-2.13.66.0+6dfecc895/
|
2672 |
-
neuronxcc-2.13.66.0+6dfecc895/
|
2673 |
-
neuronxcc-2.13.66.0+6dfecc895/
|
2674 |
-
neuronxcc-2.13.66.0+6dfecc895/
|
2675 |
-
neuronxcc-2.13.66.0+6dfecc895/
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
2676 |
neuronxcc-2.13.66.0+6dfecc895/MODULE_85a47887d4fc41e26097+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
2677 |
neuronxcc-2.13.66.0+6dfecc895/MODULE_8f8b48a08a0c68320dbf+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
2678 |
neuronxcc-2.13.66.0+6dfecc895/MODULE_98b888cee6ab04043987+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2679 |
-
neuronxcc-2.13.66.0+6dfecc895/
|
2680 |
-
neuronxcc-2.13.66.0+6dfecc895/
|
2681 |
-
neuronxcc-2.13.66.0+6dfecc895/
|
2682 |
-
neuronxcc-2.13.66.0+6dfecc895/
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
2683 |
neuronxcc-2.13.66.0+6dfecc895/MODULE_cda75e05b1d55681d8eb+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2684 |
-
neuronxcc-2.13.66.0+6dfecc895/
|
|
|
|
|
|
|
|
|
|
|
|
|
2685 |
neuronxcc-2.13.66.0+6dfecc895/MODULE_d66f5802e5ad890e3919+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2686 |
-
neuronxcc-2.13.66.0+6dfecc895/
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
2687 |
neuronxcc-2.13.66.0+6dfecc895/MODULE_ea017e5effcd92c4e6ff+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2688 |
-
neuronxcc-2.13.66.0+6dfecc895/
|
|
|
|
|
|
|
|
|
2689 |
neuronxcc-2.13.66.0+6dfecc895/MODULE_f2145a17aa8d689f7038+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
|
|
2690 |
neuronxcc-2.13.66.0+6dfecc895/MODULE_f74f07a635721468c2ae+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
2654 |
neuronxcc-2.13.66.0+6dfecc895/MODULE_a4fe1c700a9abdb20641+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2655 |
neuronxcc-2.13.66.0+6dfecc895/MODULE_b54a08c18ad776940cd0+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2656 |
neuronxcc-2.13.66.0+6dfecc895/MODULE_b59ff3b7e545f85152c8+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2657 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_01076e8d78b992483879+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2658 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_023098bfa18bb6b7e093+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2659 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_068011707d27c0821a21+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2660 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_0c9f98ff6f5d2ff116cb+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2661 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_104a70223ddf21bd9b47+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2662 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_122e6a965070aa927ca3+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2663 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_1f1e07d570ee56041d0a+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2664 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_20906ae3bb104009b559+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2665 |
neuronxcc-2.13.66.0+6dfecc895/MODULE_21b1b0223e4fb6f5af41+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2666 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_237d06dbfd8a5be615d7+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2667 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_259391de413611a000d7+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2668 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_2af13ac81b81096c1639+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2669 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_2b8fde7222de84e947e7+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2670 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_2bee1e5c93ed7d1f7e41+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2671 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_2c1ec1a942837fc9dd52+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2672 |
neuronxcc-2.13.66.0+6dfecc895/MODULE_3020655465d2e0990c19+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2673 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_322406123b6432adb6dc+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2674 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_39eb97b1b9533436c683+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2675 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_3b402aecf275deb431f9+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2676 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_3c0c7b7b3d473ebc8a65+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2677 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_3c95e3e5da57364deaaa+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2678 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_3f3330ac017793bff7e9+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2679 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_4254b9adcf600cfbd813+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2680 |
neuronxcc-2.13.66.0+6dfecc895/MODULE_426cd9312d26b5e0bf95+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2681 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_42ebbddc061c448d5837+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2682 |
neuronxcc-2.13.66.0+6dfecc895/MODULE_44563e64a3dddda1db4d+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2683 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_475e56c6ad56c5870fbe+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2684 |
neuronxcc-2.13.66.0+6dfecc895/MODULE_47eae16823191f315893+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2685 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_4b82c477c6cc7a064950+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2686 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_4ff3e786a52274ce1036+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2687 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_52e827b70e965558e166+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2688 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_538f209e64b33d73a48d+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2689 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_583712a6b0541c0cfdd0+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2690 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_5b1656a79ce81111a281+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2691 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_5b4747041cb35db7b730+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2692 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_5ff9a21793629fea6aaf+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2693 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_6265c4a1043ac00bd8ad+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2694 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_62c11966b3a4b6df942f+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2695 |
neuronxcc-2.13.66.0+6dfecc895/MODULE_62cafa382ec618cff287+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2696 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_64e39442db5e247a51cc+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2697 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_69ac5dff199c51754201+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2698 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_6edfc9ee4f2dcc13e351+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2699 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_6f0081dc753efeb38458+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2700 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_6f687780991c4858fa8e+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2701 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_70731d92d305a068cba1+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2702 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_761df4753670d0439b7a+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2703 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_775a72fd321efed8ea24+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2704 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_7828f484ba2832828302+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2705 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_7c12958cee70be03cbf3+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2706 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_7cac27e9135d049acdd7+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2707 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_7e2a3993bbf047863253+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2708 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_7ea40bbcf7d07a3c3ead+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2709 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_83cc94a2f92353b536c9+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2710 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_84290d79205fc78f7b65+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2711 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_84b20d16b60b305cfd59+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2712 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_85336feb2a590ec9a4ad+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2713 |
neuronxcc-2.13.66.0+6dfecc895/MODULE_85a47887d4fc41e26097+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2714 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_87223ed2919e0305fc45+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2715 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_8998739069f9b9438f2f+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2716 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_8b47f33881599fb2f73b+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2717 |
neuronxcc-2.13.66.0+6dfecc895/MODULE_8f8b48a08a0c68320dbf+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2718 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_93630d1069f7d37ea9a9+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2719 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_9486a445d1865f79a2ad+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2720 |
neuronxcc-2.13.66.0+6dfecc895/MODULE_98b888cee6ab04043987+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2721 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_a130605def82b6bc9ff7+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2722 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_a264074c4beb4bfa0769+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2723 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_a2907d828d1fdb092f2e+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2724 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_a3feec44b99a9925e1ff+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2725 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_a9515c34757db218879c+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2726 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_aaef2b3e98127eff8e39+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2727 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_b3601d975fd89ccfc423+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2728 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_b51bb8f50ce5fd56bd66+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2729 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_b79abe9895bfb1cca41c+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2730 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_bcd40c343f7ed90f678c+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2731 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_bd60eb80b95a1932a570+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2732 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_cb3c0c5398c9bf1f33c9+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2733 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_cc4336e144da396deeb6+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2734 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_cc80730ff341e79c3dee+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2735 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_cd6c1f7c99ce035a6c89+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2736 |
neuronxcc-2.13.66.0+6dfecc895/MODULE_cda75e05b1d55681d8eb+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2737 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_cebdcedfc8ecf222048c+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2738 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_cf647d4b6272e9ec7bfa+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2739 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_d0ed4cee650aac0b8a50+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2740 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_d1cae76c5b1ad6358a3b+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2741 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_d1e17083fc706ff1bd04+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2742 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_d56b11b891ba274f9a15+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2743 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_d5708b280f59fe3ad8a4+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2744 |
neuronxcc-2.13.66.0+6dfecc895/MODULE_d66f5802e5ad890e3919+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2745 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_d6fe9b0a8aabbba68c81+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2746 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_d9512ae8a122305821db+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2747 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_d9e5f45d7ef4d847d204+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2748 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_dee9e70fbf34b30e5604+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2749 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_e12bbb76e0fade707575+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2750 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_e2449d2d5a14cd2cadc6+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2751 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_e4399ab0388d19f561ab+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2752 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_e4fd29ccefa49ebbf681+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2753 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_e7572f71621618e422b4+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2754 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_e7e33963f76f02322430+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2755 |
neuronxcc-2.13.66.0+6dfecc895/MODULE_ea017e5effcd92c4e6ff+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2756 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_eaa1070fca3c7e27aa55+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2757 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_ed3e0b1e03de33122200+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2758 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_eddbf1ef02bd12d48612+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2759 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_ee52dc80c1702c4661e4+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2760 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_eee99099cb73269cdc4c+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2761 |
neuronxcc-2.13.66.0+6dfecc895/MODULE_f2145a17aa8d689f7038+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2762 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_f62dd3a630fd90fd0da6+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2763 |
neuronxcc-2.13.66.0+6dfecc895/MODULE_f74f07a635721468c2ae+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2764 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_f85314cf29074baad1bd+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2765 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_f95d4270b8e479b16dbe+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2766 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_f96048bdfffb74fb6409+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2767 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_fb292bd72f57a48a1c63+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/llama/meta-llama/Llama-2-13b-chat-hf/55d02a833c68f65f88c9.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"architectures": ["LlamaForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 1, "eos_token_id": 2, "hidden_act": "silu", "hidden_size": 5120, "initializer_range": 0.02, "intermediate_size": 13824, "max_position_embeddings": 4096, "model_type": "llama", "neuron": {"auto_cast_type": "fp16", "batch_size": 8, "checkpoint_id": "meta-llama/Llama-2-13b-chat-hf", "checkpoint_revision": "a2cb7a712bb6e5e736ca7f8cd98167f81a0b5bd8", "compiler_type": "neuronx-cc", "compiler_version": "2.13.66.0+6dfecc895", "num_cores": 8, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 40, "num_hidden_layers": 40, "num_key_value_heads": 40, "pretraining_tp": 1, "rms_norm_eps": 1e-05, "rope_scaling": null, "rope_theta": 10000.0, "tie_word_embeddings": false, "torch_dtype": "float16", "use_cache": true, "vocab_size": 32000}
|
neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/llama/meta-llama/Llama-2-13b-chat-hf/a4fb9901e6811328a109.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"architectures": ["LlamaForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 1, "eos_token_id": 2, "hidden_act": "silu", "hidden_size": 5120, "initializer_range": 0.02, "intermediate_size": 13824, "max_position_embeddings": 4096, "model_type": "llama", "neuron": {"auto_cast_type": "fp16", "batch_size": 16, "checkpoint_id": "meta-llama/Llama-2-13b-chat-hf", "checkpoint_revision": "a2cb7a712bb6e5e736ca7f8cd98167f81a0b5bd8", "compiler_type": "neuronx-cc", "compiler_version": "2.13.66.0+6dfecc895", "num_cores": 8, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 40, "num_hidden_layers": 40, "num_key_value_heads": 40, "pretraining_tp": 1, "rms_norm_eps": 1e-05, "rope_scaling": null, "rope_theta": 10000.0, "tie_word_embeddings": false, "torch_dtype": "float16", "use_cache": true, "vocab_size": 32000}
|
neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/llama/meta-llama/Llama-2-13b-chat-hf/a8c0b413e79c91496630.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"architectures": ["LlamaForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 1, "eos_token_id": 2, "hidden_act": "silu", "hidden_size": 5120, "initializer_range": 0.02, "intermediate_size": 13824, "max_position_embeddings": 4096, "model_type": "llama", "neuron": {"auto_cast_type": "fp16", "batch_size": 4, "checkpoint_id": "meta-llama/Llama-2-13b-chat-hf", "checkpoint_revision": "a2cb7a712bb6e5e736ca7f8cd98167f81a0b5bd8", "compiler_type": "neuronx-cc", "compiler_version": "2.13.66.0+6dfecc895", "num_cores": 8, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 40, "num_hidden_layers": 40, "num_key_value_heads": 40, "pretraining_tp": 1, "rms_norm_eps": 1e-05, "rope_scaling": null, "rope_theta": 10000.0, "tie_word_embeddings": false, "torch_dtype": "float16", "use_cache": true, "vocab_size": 32000}
|
neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/llama/meta-llama/Llama-2-13b-chat-hf/d68250e23574798328a7.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"architectures": ["LlamaForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 1, "eos_token_id": 2, "hidden_act": "silu", "hidden_size": 5120, "initializer_range": 0.02, "intermediate_size": 13824, "max_position_embeddings": 4096, "model_type": "llama", "neuron": {"auto_cast_type": "fp16", "batch_size": 1, "checkpoint_id": "meta-llama/Llama-2-13b-chat-hf", "checkpoint_revision": "a2cb7a712bb6e5e736ca7f8cd98167f81a0b5bd8", "compiler_type": "neuronx-cc", "compiler_version": "2.13.66.0+6dfecc895", "num_cores": 8, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 40, "num_hidden_layers": 40, "num_key_value_heads": 40, "pretraining_tp": 1, "rms_norm_eps": 1e-05, "rope_scaling": null, "rope_theta": 10000.0, "tie_word_embeddings": false, "torch_dtype": "float16", "use_cache": true, "vocab_size": 32000}
|
neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/mistral/mistralai/Mistral-7B-Instruct-v0.2/1245bb72b32d75db76f9.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"architectures": ["MistralForCausalLM"], "attention_dropout": 0.0, "bos_token_id": 1, "eos_token_id": 2, "hidden_act": "silu", "hidden_size": 4096, "initializer_range": 0.02, "intermediate_size": 14336, "max_position_embeddings": 32768, "model_type": "mistral", "neuron": {"auto_cast_type": "bf16", "batch_size": 4, "checkpoint_id": "mistralai/Mistral-7B-Instruct-v0.2", "checkpoint_revision": "41b61a33a2483885c981aa79e0df6b32407ed873", "compiler_type": "neuronx-cc", "compiler_version": "2.13.66.0+6dfecc895", "num_cores": 8, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 32, "num_key_value_heads": 8, "rms_norm_eps": 1e-05, "rope_theta": 1000000.0, "sliding_window": null, "tie_word_embeddings": false, "torch_dtype": "bfloat16", "use_cache": true, "vocab_size": 32000}
|
neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/mistral/mistralai/Mistral-7B-Instruct-v0.2/5e1e1d2ca63370d9d0a0.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"architectures": ["MistralForCausalLM"], "attention_dropout": 0.0, "bos_token_id": 1, "eos_token_id": 2, "hidden_act": "silu", "hidden_size": 4096, "initializer_range": 0.02, "intermediate_size": 14336, "max_position_embeddings": 32768, "model_type": "mistral", "neuron": {"auto_cast_type": "fp16", "batch_size": 8, "checkpoint_id": "mistralai/Mistral-7B-Instruct-v0.2", "checkpoint_revision": "41b61a33a2483885c981aa79e0df6b32407ed873", "compiler_type": "neuronx-cc", "compiler_version": "2.13.66.0+6dfecc895", "num_cores": 8, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 32, "num_key_value_heads": 8, "rms_norm_eps": 1e-05, "rope_theta": 1000000.0, "sliding_window": null, "tie_word_embeddings": false, "torch_dtype": "bfloat16", "use_cache": true, "vocab_size": 32000}
|
neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/mistral/mistralai/Mistral-7B-Instruct-v0.2/6255cc2875c3d0c5e501.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"architectures": ["MistralForCausalLM"], "attention_dropout": 0.0, "bos_token_id": 1, "eos_token_id": 2, "hidden_act": "silu", "hidden_size": 4096, "initializer_range": 0.02, "intermediate_size": 14336, "max_position_embeddings": 32768, "model_type": "mistral", "neuron": {"auto_cast_type": "fp16", "batch_size": 32, "checkpoint_id": "mistralai/Mistral-7B-Instruct-v0.2", "checkpoint_revision": "41b61a33a2483885c981aa79e0df6b32407ed873", "compiler_type": "neuronx-cc", "compiler_version": "2.13.66.0+6dfecc895", "num_cores": 8, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 32, "num_key_value_heads": 8, "rms_norm_eps": 1e-05, "rope_theta": 1000000.0, "sliding_window": null, "tie_word_embeddings": false, "torch_dtype": "bfloat16", "use_cache": true, "vocab_size": 32000}
|
neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/mistral/mistralai/Mistral-7B-Instruct-v0.2/64e0d5cd868faca4549f.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"architectures": ["MistralForCausalLM"], "attention_dropout": 0.0, "bos_token_id": 1, "eos_token_id": 2, "hidden_act": "silu", "hidden_size": 4096, "initializer_range": 0.02, "intermediate_size": 14336, "max_position_embeddings": 32768, "model_type": "mistral", "neuron": {"auto_cast_type": "bf16", "batch_size": 1, "checkpoint_id": "mistralai/Mistral-7B-Instruct-v0.2", "checkpoint_revision": "41b61a33a2483885c981aa79e0df6b32407ed873", "compiler_type": "neuronx-cc", "compiler_version": "2.13.66.0+6dfecc895", "num_cores": 8, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 32, "num_key_value_heads": 8, "rms_norm_eps": 1e-05, "rope_theta": 1000000.0, "sliding_window": null, "tie_word_embeddings": false, "torch_dtype": "bfloat16", "use_cache": true, "vocab_size": 32000}
|
neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/mistral/mistralai/Mistral-7B-Instruct-v0.2/733bc79383c0cc56537e.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"architectures": ["MistralForCausalLM"], "attention_dropout": 0.0, "bos_token_id": 1, "eos_token_id": 2, "hidden_act": "silu", "hidden_size": 4096, "initializer_range": 0.02, "intermediate_size": 14336, "max_position_embeddings": 32768, "model_type": "mistral", "neuron": {"auto_cast_type": "bf16", "batch_size": 16, "checkpoint_id": "mistralai/Mistral-7B-Instruct-v0.2", "checkpoint_revision": "41b61a33a2483885c981aa79e0df6b32407ed873", "compiler_type": "neuronx-cc", "compiler_version": "2.13.66.0+6dfecc895", "num_cores": 8, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 32, "num_key_value_heads": 8, "rms_norm_eps": 1e-05, "rope_theta": 1000000.0, "sliding_window": null, "tie_word_embeddings": false, "torch_dtype": "bfloat16", "use_cache": true, "vocab_size": 32000}
|
neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/mistral/mistralai/Mistral-7B-Instruct-v0.2/7fd9b858cf45bbf6355f.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"architectures": ["MistralForCausalLM"], "attention_dropout": 0.0, "bos_token_id": 1, "eos_token_id": 2, "hidden_act": "silu", "hidden_size": 4096, "initializer_range": 0.02, "intermediate_size": 14336, "max_position_embeddings": 32768, "model_type": "mistral", "neuron": {"auto_cast_type": "fp16", "batch_size": 16, "checkpoint_id": "mistralai/Mistral-7B-Instruct-v0.2", "checkpoint_revision": "41b61a33a2483885c981aa79e0df6b32407ed873", "compiler_type": "neuronx-cc", "compiler_version": "2.13.66.0+6dfecc895", "num_cores": 8, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 32, "num_key_value_heads": 8, "rms_norm_eps": 1e-05, "rope_theta": 1000000.0, "sliding_window": null, "tie_word_embeddings": false, "torch_dtype": "bfloat16", "use_cache": true, "vocab_size": 32000}
|
neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/mistral/mistralai/Mistral-7B-Instruct-v0.2/979fce2dd4e4d499c2f0.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"architectures": ["MistralForCausalLM"], "attention_dropout": 0.0, "bos_token_id": 1, "eos_token_id": 2, "hidden_act": "silu", "hidden_size": 4096, "initializer_range": 0.02, "intermediate_size": 14336, "max_position_embeddings": 32768, "model_type": "mistral", "neuron": {"auto_cast_type": "fp16", "batch_size": 4, "checkpoint_id": "mistralai/Mistral-7B-Instruct-v0.2", "checkpoint_revision": "41b61a33a2483885c981aa79e0df6b32407ed873", "compiler_type": "neuronx-cc", "compiler_version": "2.13.66.0+6dfecc895", "num_cores": 8, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 32, "num_key_value_heads": 8, "rms_norm_eps": 1e-05, "rope_theta": 1000000.0, "sliding_window": null, "tie_word_embeddings": false, "torch_dtype": "bfloat16", "use_cache": true, "vocab_size": 32000}
|
neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/mistral/mistralai/Mistral-7B-Instruct-v0.2/aa1ba12921766e16b7dc.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"architectures": ["MistralForCausalLM"], "attention_dropout": 0.0, "bos_token_id": 1, "eos_token_id": 2, "hidden_act": "silu", "hidden_size": 4096, "initializer_range": 0.02, "intermediate_size": 14336, "max_position_embeddings": 32768, "model_type": "mistral", "neuron": {"auto_cast_type": "fp16", "batch_size": 1, "checkpoint_id": "mistralai/Mistral-7B-Instruct-v0.2", "checkpoint_revision": "41b61a33a2483885c981aa79e0df6b32407ed873", "compiler_type": "neuronx-cc", "compiler_version": "2.13.66.0+6dfecc895", "num_cores": 8, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 32, "num_key_value_heads": 8, "rms_norm_eps": 1e-05, "rope_theta": 1000000.0, "sliding_window": null, "tie_word_embeddings": false, "torch_dtype": "bfloat16", "use_cache": true, "vocab_size": 32000}
|
neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/mistral/mistralai/Mistral-7B-Instruct-v0.2/ca240a79f952204527fc.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"architectures": ["MistralForCausalLM"], "attention_dropout": 0.0, "bos_token_id": 1, "eos_token_id": 2, "hidden_act": "silu", "hidden_size": 4096, "initializer_range": 0.02, "intermediate_size": 14336, "max_position_embeddings": 32768, "model_type": "mistral", "neuron": {"auto_cast_type": "bf16", "batch_size": 8, "checkpoint_id": "mistralai/Mistral-7B-Instruct-v0.2", "checkpoint_revision": "41b61a33a2483885c981aa79e0df6b32407ed873", "compiler_type": "neuronx-cc", "compiler_version": "2.13.66.0+6dfecc895", "num_cores": 8, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 32, "num_key_value_heads": 8, "rms_norm_eps": 1e-05, "rope_theta": 1000000.0, "sliding_window": null, "tie_word_embeddings": false, "torch_dtype": "bfloat16", "use_cache": true, "vocab_size": 32000}
|
neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/mistral/mistralai/Mistral-7B-Instruct-v0.2/eec3579b9122a80133a1.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"architectures": ["MistralForCausalLM"], "attention_dropout": 0.0, "bos_token_id": 1, "eos_token_id": 2, "hidden_act": "silu", "hidden_size": 4096, "initializer_range": 0.02, "intermediate_size": 14336, "max_position_embeddings": 32768, "model_type": "mistral", "neuron": {"auto_cast_type": "bf16", "batch_size": 32, "checkpoint_id": "mistralai/Mistral-7B-Instruct-v0.2", "checkpoint_revision": "41b61a33a2483885c981aa79e0df6b32407ed873", "compiler_type": "neuronx-cc", "compiler_version": "2.13.66.0+6dfecc895", "num_cores": 8, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 32, "num_key_value_heads": 8, "rms_norm_eps": 1e-05, "rope_theta": 1000000.0, "sliding_window": null, "tie_word_embeddings": false, "torch_dtype": "bfloat16", "use_cache": true, "vocab_size": 32000}
|
neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22/inference/llama/meta-llama/Llama-2-7b-chat-hf/06b52fde14a8f28d6a3d.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"architectures": ["LlamaForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 1, "eos_token_id": 2, "hidden_act": "silu", "hidden_size": 4096, "initializer_range": 0.02, "intermediate_size": 11008, "max_position_embeddings": 4096, "model_type": "llama", "neuron": {"auto_cast_type": "fp16", "batch_size": 1, "checkpoint_id": "meta-llama/Llama-2-7b-chat-hf", "checkpoint_revision": "f5db02db724555f92da89c216ac04704f23d4590", "compiler_type": "neuronx-cc", "compiler_version": "2.13.66.0+6dfecc895", "num_cores": 2, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 32, "num_key_value_heads": 32, "pretraining_tp": 1, "rms_norm_eps": 1e-05, "rope_scaling": null, "rope_theta": 10000.0, "tie_word_embeddings": false, "torch_dtype": "float16", "use_cache": true, "vocab_size": 32000}
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_007ddbaadfdea74c4db5+2c2d707e/model.neff
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 13282304
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8559beec2df842857f647f9921c6ff30f0f3f20a4e17b0e3c7142e24902f7d90
|
3 |
size 13282304
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_01076e8d78b992483879+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_01076e8d78b992483879+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d6c5cb1275fbbfedb3e7c4d72e9f6d73845364943f9acbd07471933811598a8c
|
3 |
+
size 318327
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_01076e8d78b992483879+2c2d707e/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b746795a76c3239b01e328887743aa1ff4f15a53edfd7ce972e87d1d25efc2ae
|
3 |
+
size 2479104
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_023098bfa18bb6b7e093+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_023098bfa18bb6b7e093+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6a6ee9aeae30bd5ffafa657854c5e7fe9f5ee68d40fb5051fa38ddb466ab550a
|
3 |
+
size 380699
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_023098bfa18bb6b7e093+2c2d707e/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fb3f3c7216a6bf0233c0d9a87aa36f17575d8300bb9c386b78fea60e1043a3ba
|
3 |
+
size 18709504
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_068011707d27c0821a21+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_068011707d27c0821a21+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:33455a4af632d1f01d5ba298df3d50b02e3e117471d40338a86b56ff493e59e2
|
3 |
+
size 357616
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_068011707d27c0821a21+2c2d707e/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:45314103ad7921853f53cc774885c2192c599b7317e859ac0e235144b003a7f9
|
3 |
+
size 28959744
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_0c9f98ff6f5d2ff116cb+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_0c9f98ff6f5d2ff116cb+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ac56ab5510f7844416010b4518e04c84a2df0dbae79e033b76c6e731507d9a80
|
3 |
+
size 299226
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_0c9f98ff6f5d2ff116cb+2c2d707e/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:60bd9a4f077016460a5a442a5353e313304939c7752a1a609f0f74a209fc7985
|
3 |
+
size 7814144
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_104a70223ddf21bd9b47+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_104a70223ddf21bd9b47+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1e7047a8a0af3e0426169af64ca17c84415f74416273f08a0bbe78a93e9cd816
|
3 |
+
size 419433
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_104a70223ddf21bd9b47+2c2d707e/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:be52dbcdf1c3a2fe1f2a3185a7e622b1b9a274d2dc3efd3f935b844e8d5a4412
|
3 |
+
size 8530944
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_122e6a965070aa927ca3+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_122e6a965070aa927ca3+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4785aa52c8c855926a7eee940c7db2b1869e6541bd9d0c4a1cb68bc96a4d9a5c
|
3 |
+
size 329721
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_122e6a965070aa927ca3+2c2d707e/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:23e8954ecb98f9debff5025a0118a27ae96c1744abace766ccbc9c98dcab34e5
|
3 |
+
size 2468864
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_1f1e07d570ee56041d0a+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_1f1e07d570ee56041d0a+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:107d39f49881e6d2982ea9d36c22953545de064b0bbae09b7ac4cc2cd8144575
|
3 |
+
size 318327
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_1f1e07d570ee56041d0a+2c2d707e/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:67441fee53b92ca9d81863bb3177306b38c16c873f801b356e1e50e79e3f261f
|
3 |
+
size 2581504
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_20906ae3bb104009b559+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_20906ae3bb104009b559+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:21e40c363503f6a8e7f9909acc1a367f1185440f5a601f63e8e9203264807752
|
3 |
+
size 410810
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_20906ae3bb104009b559+2c2d707e/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f735dd1ca52546b029bf3b6c832291b2dfcfa3498c7e0d16e5da513c27437900
|
3 |
+
size 3216384
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_21b1b0223e4fb6f5af41+2c2d707e/model.neff
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 2161664
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a3f7daaa297382b89110fd4fa0c5bf14ea42e5008640cb0778fa0653ca455b89
|
3 |
size 2161664
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_21d7ca83fa40eaf22249+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3fea25155c53bcf57abee0cb3bc910b63454a0c95fd7b2bb50a36bd2539cf184
|
3 |
+
size 318327
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_237d06dbfd8a5be615d7+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_237d06dbfd8a5be615d7+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:888056ebb363a72225fbd0c21dfc7124667cea21cece58e6de57285793a4a205
|
3 |
+
size 318138
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_237d06dbfd8a5be615d7+2c2d707e/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:22aa3623e3c8ba6578c4ae047aa81b155e31be00f3aa8634f5511e164144588a
|
3 |
+
size 3144704
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_259391de413611a000d7+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_259391de413611a000d7+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:567cf9d49d838ee5bb1e67dcb3d79c00b18972f82e113b396ddfebbd1a41b397
|
3 |
+
size 346060
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_259391de413611a000d7+2c2d707e/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7849f5d2ef765bdf5998b357cc3e1e438f2b0db49c427c2fc62473b8c2af91f7
|
3 |
+
size 30546944
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_298bc643cbb368dd898d+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|