dacorvo HF staff commited on
Commit
94d71a4
1 Parent(s): 5a79963

Synchronizing local compiler cache.

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. .gitattributes +97 -20
  2. neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/llama/meta-llama/Llama-2-13b-chat-hf/55d02a833c68f65f88c9.json +1 -0
  3. neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/llama/meta-llama/Llama-2-13b-chat-hf/a4fb9901e6811328a109.json +1 -0
  4. neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/llama/meta-llama/Llama-2-13b-chat-hf/a8c0b413e79c91496630.json +1 -0
  5. neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/llama/meta-llama/Llama-2-13b-chat-hf/d68250e23574798328a7.json +1 -0
  6. neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/mistral/mistralai/Mistral-7B-Instruct-v0.2/1245bb72b32d75db76f9.json +1 -0
  7. neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/mistral/mistralai/Mistral-7B-Instruct-v0.2/5e1e1d2ca63370d9d0a0.json +1 -0
  8. neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/mistral/mistralai/Mistral-7B-Instruct-v0.2/6255cc2875c3d0c5e501.json +1 -0
  9. neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/mistral/mistralai/Mistral-7B-Instruct-v0.2/64e0d5cd868faca4549f.json +1 -0
  10. neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/mistral/mistralai/Mistral-7B-Instruct-v0.2/733bc79383c0cc56537e.json +1 -0
  11. neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/mistral/mistralai/Mistral-7B-Instruct-v0.2/7fd9b858cf45bbf6355f.json +1 -0
  12. neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/mistral/mistralai/Mistral-7B-Instruct-v0.2/979fce2dd4e4d499c2f0.json +1 -0
  13. neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/mistral/mistralai/Mistral-7B-Instruct-v0.2/aa1ba12921766e16b7dc.json +1 -0
  14. neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/mistral/mistralai/Mistral-7B-Instruct-v0.2/ca240a79f952204527fc.json +1 -0
  15. neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/mistral/mistralai/Mistral-7B-Instruct-v0.2/eec3579b9122a80133a1.json +1 -0
  16. neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22/inference/llama/meta-llama/Llama-2-7b-chat-hf/06b52fde14a8f28d6a3d.json +1 -0
  17. neuronxcc-2.13.66.0+6dfecc895/MODULE_007ddbaadfdea74c4db5+2c2d707e/model.neff +1 -1
  18. neuronxcc-2.13.66.0+6dfecc895/MODULE_01076e8d78b992483879+2c2d707e/compile_flags.txt +1 -0
  19. neuronxcc-2.13.66.0+6dfecc895/MODULE_01076e8d78b992483879+2c2d707e/model.hlo_module.pb +3 -0
  20. neuronxcc-2.13.66.0+6dfecc895/MODULE_01076e8d78b992483879+2c2d707e/model.neff +3 -0
  21. neuronxcc-2.13.66.0+6dfecc895/MODULE_023098bfa18bb6b7e093+2c2d707e/compile_flags.txt +1 -0
  22. neuronxcc-2.13.66.0+6dfecc895/MODULE_023098bfa18bb6b7e093+2c2d707e/model.hlo_module.pb +3 -0
  23. neuronxcc-2.13.66.0+6dfecc895/MODULE_023098bfa18bb6b7e093+2c2d707e/model.neff +3 -0
  24. neuronxcc-2.13.66.0+6dfecc895/MODULE_068011707d27c0821a21+2c2d707e/compile_flags.txt +1 -0
  25. neuronxcc-2.13.66.0+6dfecc895/MODULE_068011707d27c0821a21+2c2d707e/model.hlo_module.pb +3 -0
  26. neuronxcc-2.13.66.0+6dfecc895/MODULE_068011707d27c0821a21+2c2d707e/model.neff +3 -0
  27. neuronxcc-2.13.66.0+6dfecc895/MODULE_0c9f98ff6f5d2ff116cb+2c2d707e/compile_flags.txt +1 -0
  28. neuronxcc-2.13.66.0+6dfecc895/MODULE_0c9f98ff6f5d2ff116cb+2c2d707e/model.hlo_module.pb +3 -0
  29. neuronxcc-2.13.66.0+6dfecc895/MODULE_0c9f98ff6f5d2ff116cb+2c2d707e/model.neff +3 -0
  30. neuronxcc-2.13.66.0+6dfecc895/MODULE_104a70223ddf21bd9b47+2c2d707e/compile_flags.txt +1 -0
  31. neuronxcc-2.13.66.0+6dfecc895/MODULE_104a70223ddf21bd9b47+2c2d707e/model.hlo_module.pb +3 -0
  32. neuronxcc-2.13.66.0+6dfecc895/MODULE_104a70223ddf21bd9b47+2c2d707e/model.neff +3 -0
  33. neuronxcc-2.13.66.0+6dfecc895/MODULE_122e6a965070aa927ca3+2c2d707e/compile_flags.txt +1 -0
  34. neuronxcc-2.13.66.0+6dfecc895/MODULE_122e6a965070aa927ca3+2c2d707e/model.hlo_module.pb +3 -0
  35. neuronxcc-2.13.66.0+6dfecc895/MODULE_122e6a965070aa927ca3+2c2d707e/model.neff +3 -0
  36. neuronxcc-2.13.66.0+6dfecc895/MODULE_1f1e07d570ee56041d0a+2c2d707e/compile_flags.txt +1 -0
  37. neuronxcc-2.13.66.0+6dfecc895/MODULE_1f1e07d570ee56041d0a+2c2d707e/model.hlo_module.pb +3 -0
  38. neuronxcc-2.13.66.0+6dfecc895/MODULE_1f1e07d570ee56041d0a+2c2d707e/model.neff +3 -0
  39. neuronxcc-2.13.66.0+6dfecc895/MODULE_20906ae3bb104009b559+2c2d707e/compile_flags.txt +1 -0
  40. neuronxcc-2.13.66.0+6dfecc895/MODULE_20906ae3bb104009b559+2c2d707e/model.hlo_module.pb +3 -0
  41. neuronxcc-2.13.66.0+6dfecc895/MODULE_20906ae3bb104009b559+2c2d707e/model.neff +3 -0
  42. neuronxcc-2.13.66.0+6dfecc895/MODULE_21b1b0223e4fb6f5af41+2c2d707e/model.neff +1 -1
  43. neuronxcc-2.13.66.0+6dfecc895/MODULE_21d7ca83fa40eaf22249+2c2d707e/model.hlo_module.pb +3 -0
  44. neuronxcc-2.13.66.0+6dfecc895/MODULE_237d06dbfd8a5be615d7+2c2d707e/compile_flags.txt +1 -0
  45. neuronxcc-2.13.66.0+6dfecc895/MODULE_237d06dbfd8a5be615d7+2c2d707e/model.hlo_module.pb +3 -0
  46. neuronxcc-2.13.66.0+6dfecc895/MODULE_237d06dbfd8a5be615d7+2c2d707e/model.neff +3 -0
  47. neuronxcc-2.13.66.0+6dfecc895/MODULE_259391de413611a000d7+2c2d707e/compile_flags.txt +1 -0
  48. neuronxcc-2.13.66.0+6dfecc895/MODULE_259391de413611a000d7+2c2d707e/model.hlo_module.pb +3 -0
  49. neuronxcc-2.13.66.0+6dfecc895/MODULE_259391de413611a000d7+2c2d707e/model.neff +3 -0
  50. neuronxcc-2.13.66.0+6dfecc895/MODULE_298bc643cbb368dd898d+2c2d707e/compile_flags.txt +1 -0
.gitattributes CHANGED
@@ -2654,37 +2654,114 @@ neuronxcc-2.13.66.0+6dfecc895/MODULE_5f931e8bf304c87202cd+2c2d707e/model.neff fi
2654
  neuronxcc-2.13.66.0+6dfecc895/MODULE_a4fe1c700a9abdb20641+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2655
  neuronxcc-2.13.66.0+6dfecc895/MODULE_b54a08c18ad776940cd0+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2656
  neuronxcc-2.13.66.0+6dfecc895/MODULE_b59ff3b7e545f85152c8+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2657
- neuronxcc-2.13.66.0+6dfecc895/MODULE_01fe42b103324d50dd0f+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
2658
  neuronxcc-2.13.66.0+6dfecc895/MODULE_21b1b0223e4fb6f5af41+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
2659
  neuronxcc-2.13.66.0+6dfecc895/MODULE_3020655465d2e0990c19+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2660
- neuronxcc-2.13.66.0+6dfecc895/MODULE_4051477874156d7450fe+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2661
- neuronxcc-2.13.66.0+6dfecc895/MODULE_410c6d6a0c764608be0d+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
2662
  neuronxcc-2.13.66.0+6dfecc895/MODULE_426cd9312d26b5e0bf95+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2663
- neuronxcc-2.13.66.0+6dfecc895/MODULE_443c7de81db84f0f078c+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2664
  neuronxcc-2.13.66.0+6dfecc895/MODULE_44563e64a3dddda1db4d+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
 
2665
  neuronxcc-2.13.66.0+6dfecc895/MODULE_47eae16823191f315893+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2666
- neuronxcc-2.13.66.0+6dfecc895/MODULE_4d18af62746967c79d82+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2667
- neuronxcc-2.13.66.0+6dfecc895/MODULE_539309b68144a4afde0b+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2668
- neuronxcc-2.13.66.0+6dfecc895/MODULE_53f35b4110e7bebbcc45+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2669
- neuronxcc-2.13.66.0+6dfecc895/MODULE_5ab5b6d9ff18b8896d5a+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
2670
  neuronxcc-2.13.66.0+6dfecc895/MODULE_62cafa382ec618cff287+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2671
- neuronxcc-2.13.66.0+6dfecc895/MODULE_639cfa0c302f955a704e+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2672
- neuronxcc-2.13.66.0+6dfecc895/MODULE_64d9d7ab844b064ddcff+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2673
- neuronxcc-2.13.66.0+6dfecc895/MODULE_72f780796470e2d45102+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2674
- neuronxcc-2.13.66.0+6dfecc895/MODULE_7943455ee983f978e58c+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2675
- neuronxcc-2.13.66.0+6dfecc895/MODULE_7c67afcb8bd12bae0123+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
 
2676
  neuronxcc-2.13.66.0+6dfecc895/MODULE_85a47887d4fc41e26097+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
 
 
 
2677
  neuronxcc-2.13.66.0+6dfecc895/MODULE_8f8b48a08a0c68320dbf+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
 
 
2678
  neuronxcc-2.13.66.0+6dfecc895/MODULE_98b888cee6ab04043987+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2679
- neuronxcc-2.13.66.0+6dfecc895/MODULE_9db2a3438f041d4e467e+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2680
- neuronxcc-2.13.66.0+6dfecc895/MODULE_a29e3f3cc47445e1c231+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2681
- neuronxcc-2.13.66.0+6dfecc895/MODULE_a97de47fb0d0f47ea4c0+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2682
- neuronxcc-2.13.66.0+6dfecc895/MODULE_b7517ea4b617cd73f3ad+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
2683
  neuronxcc-2.13.66.0+6dfecc895/MODULE_cda75e05b1d55681d8eb+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2684
- neuronxcc-2.13.66.0+6dfecc895/MODULE_d4cc88cd9d2d907c99f6+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
2685
  neuronxcc-2.13.66.0+6dfecc895/MODULE_d66f5802e5ad890e3919+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2686
- neuronxcc-2.13.66.0+6dfecc895/MODULE_e334ed8a755e5380cbbd+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
2687
  neuronxcc-2.13.66.0+6dfecc895/MODULE_ea017e5effcd92c4e6ff+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2688
- neuronxcc-2.13.66.0+6dfecc895/MODULE_ee55eab3eac6b30f23a0+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
 
 
 
 
2689
  neuronxcc-2.13.66.0+6dfecc895/MODULE_f2145a17aa8d689f7038+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
 
2690
  neuronxcc-2.13.66.0+6dfecc895/MODULE_f74f07a635721468c2ae+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
2654
  neuronxcc-2.13.66.0+6dfecc895/MODULE_a4fe1c700a9abdb20641+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2655
  neuronxcc-2.13.66.0+6dfecc895/MODULE_b54a08c18ad776940cd0+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2656
  neuronxcc-2.13.66.0+6dfecc895/MODULE_b59ff3b7e545f85152c8+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2657
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_01076e8d78b992483879+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2658
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_023098bfa18bb6b7e093+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2659
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_068011707d27c0821a21+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2660
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_0c9f98ff6f5d2ff116cb+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2661
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_104a70223ddf21bd9b47+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2662
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_122e6a965070aa927ca3+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2663
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_1f1e07d570ee56041d0a+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2664
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_20906ae3bb104009b559+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2665
  neuronxcc-2.13.66.0+6dfecc895/MODULE_21b1b0223e4fb6f5af41+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2666
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_237d06dbfd8a5be615d7+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2667
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_259391de413611a000d7+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2668
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_2af13ac81b81096c1639+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2669
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_2b8fde7222de84e947e7+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2670
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_2bee1e5c93ed7d1f7e41+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2671
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_2c1ec1a942837fc9dd52+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2672
  neuronxcc-2.13.66.0+6dfecc895/MODULE_3020655465d2e0990c19+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2673
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_322406123b6432adb6dc+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2674
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_39eb97b1b9533436c683+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2675
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_3b402aecf275deb431f9+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2676
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_3c0c7b7b3d473ebc8a65+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2677
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_3c95e3e5da57364deaaa+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2678
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_3f3330ac017793bff7e9+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2679
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_4254b9adcf600cfbd813+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2680
  neuronxcc-2.13.66.0+6dfecc895/MODULE_426cd9312d26b5e0bf95+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2681
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_42ebbddc061c448d5837+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2682
  neuronxcc-2.13.66.0+6dfecc895/MODULE_44563e64a3dddda1db4d+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2683
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_475e56c6ad56c5870fbe+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2684
  neuronxcc-2.13.66.0+6dfecc895/MODULE_47eae16823191f315893+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2685
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_4b82c477c6cc7a064950+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2686
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_4ff3e786a52274ce1036+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2687
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_52e827b70e965558e166+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2688
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_538f209e64b33d73a48d+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2689
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_583712a6b0541c0cfdd0+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2690
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_5b1656a79ce81111a281+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2691
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_5b4747041cb35db7b730+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2692
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_5ff9a21793629fea6aaf+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2693
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_6265c4a1043ac00bd8ad+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2694
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_62c11966b3a4b6df942f+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2695
  neuronxcc-2.13.66.0+6dfecc895/MODULE_62cafa382ec618cff287+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2696
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_64e39442db5e247a51cc+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2697
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_69ac5dff199c51754201+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2698
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_6edfc9ee4f2dcc13e351+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2699
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_6f0081dc753efeb38458+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2700
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_6f687780991c4858fa8e+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2701
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_70731d92d305a068cba1+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2702
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_761df4753670d0439b7a+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2703
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_775a72fd321efed8ea24+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2704
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_7828f484ba2832828302+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2705
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_7c12958cee70be03cbf3+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2706
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_7cac27e9135d049acdd7+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2707
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_7e2a3993bbf047863253+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2708
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_7ea40bbcf7d07a3c3ead+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2709
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_83cc94a2f92353b536c9+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2710
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_84290d79205fc78f7b65+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2711
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_84b20d16b60b305cfd59+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2712
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_85336feb2a590ec9a4ad+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2713
  neuronxcc-2.13.66.0+6dfecc895/MODULE_85a47887d4fc41e26097+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2714
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_87223ed2919e0305fc45+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2715
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_8998739069f9b9438f2f+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2716
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_8b47f33881599fb2f73b+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2717
  neuronxcc-2.13.66.0+6dfecc895/MODULE_8f8b48a08a0c68320dbf+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2718
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_93630d1069f7d37ea9a9+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2719
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_9486a445d1865f79a2ad+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2720
  neuronxcc-2.13.66.0+6dfecc895/MODULE_98b888cee6ab04043987+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2721
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_a130605def82b6bc9ff7+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2722
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_a264074c4beb4bfa0769+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2723
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_a2907d828d1fdb092f2e+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2724
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_a3feec44b99a9925e1ff+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2725
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_a9515c34757db218879c+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2726
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_aaef2b3e98127eff8e39+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2727
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_b3601d975fd89ccfc423+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2728
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_b51bb8f50ce5fd56bd66+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2729
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_b79abe9895bfb1cca41c+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2730
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_bcd40c343f7ed90f678c+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2731
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_bd60eb80b95a1932a570+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2732
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_cb3c0c5398c9bf1f33c9+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2733
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_cc4336e144da396deeb6+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2734
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_cc80730ff341e79c3dee+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2735
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_cd6c1f7c99ce035a6c89+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2736
  neuronxcc-2.13.66.0+6dfecc895/MODULE_cda75e05b1d55681d8eb+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2737
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_cebdcedfc8ecf222048c+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2738
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_cf647d4b6272e9ec7bfa+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2739
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_d0ed4cee650aac0b8a50+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2740
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_d1cae76c5b1ad6358a3b+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2741
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_d1e17083fc706ff1bd04+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2742
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_d56b11b891ba274f9a15+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2743
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_d5708b280f59fe3ad8a4+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2744
  neuronxcc-2.13.66.0+6dfecc895/MODULE_d66f5802e5ad890e3919+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2745
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_d6fe9b0a8aabbba68c81+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2746
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_d9512ae8a122305821db+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2747
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_d9e5f45d7ef4d847d204+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2748
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_dee9e70fbf34b30e5604+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2749
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_e12bbb76e0fade707575+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2750
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_e2449d2d5a14cd2cadc6+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2751
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_e4399ab0388d19f561ab+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2752
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_e4fd29ccefa49ebbf681+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2753
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_e7572f71621618e422b4+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2754
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_e7e33963f76f02322430+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2755
  neuronxcc-2.13.66.0+6dfecc895/MODULE_ea017e5effcd92c4e6ff+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2756
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_eaa1070fca3c7e27aa55+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2757
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_ed3e0b1e03de33122200+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2758
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_eddbf1ef02bd12d48612+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2759
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_ee52dc80c1702c4661e4+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2760
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_eee99099cb73269cdc4c+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2761
  neuronxcc-2.13.66.0+6dfecc895/MODULE_f2145a17aa8d689f7038+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2762
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_f62dd3a630fd90fd0da6+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2763
  neuronxcc-2.13.66.0+6dfecc895/MODULE_f74f07a635721468c2ae+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2764
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_f85314cf29074baad1bd+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2765
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_f95d4270b8e479b16dbe+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2766
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_f96048bdfffb74fb6409+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
2767
+ neuronxcc-2.13.66.0+6dfecc895/MODULE_fb292bd72f57a48a1c63+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/llama/meta-llama/Llama-2-13b-chat-hf/55d02a833c68f65f88c9.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"architectures": ["LlamaForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 1, "eos_token_id": 2, "hidden_act": "silu", "hidden_size": 5120, "initializer_range": 0.02, "intermediate_size": 13824, "max_position_embeddings": 4096, "model_type": "llama", "neuron": {"auto_cast_type": "fp16", "batch_size": 8, "checkpoint_id": "meta-llama/Llama-2-13b-chat-hf", "checkpoint_revision": "a2cb7a712bb6e5e736ca7f8cd98167f81a0b5bd8", "compiler_type": "neuronx-cc", "compiler_version": "2.13.66.0+6dfecc895", "num_cores": 8, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 40, "num_hidden_layers": 40, "num_key_value_heads": 40, "pretraining_tp": 1, "rms_norm_eps": 1e-05, "rope_scaling": null, "rope_theta": 10000.0, "tie_word_embeddings": false, "torch_dtype": "float16", "use_cache": true, "vocab_size": 32000}
neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/llama/meta-llama/Llama-2-13b-chat-hf/a4fb9901e6811328a109.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"architectures": ["LlamaForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 1, "eos_token_id": 2, "hidden_act": "silu", "hidden_size": 5120, "initializer_range": 0.02, "intermediate_size": 13824, "max_position_embeddings": 4096, "model_type": "llama", "neuron": {"auto_cast_type": "fp16", "batch_size": 16, "checkpoint_id": "meta-llama/Llama-2-13b-chat-hf", "checkpoint_revision": "a2cb7a712bb6e5e736ca7f8cd98167f81a0b5bd8", "compiler_type": "neuronx-cc", "compiler_version": "2.13.66.0+6dfecc895", "num_cores": 8, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 40, "num_hidden_layers": 40, "num_key_value_heads": 40, "pretraining_tp": 1, "rms_norm_eps": 1e-05, "rope_scaling": null, "rope_theta": 10000.0, "tie_word_embeddings": false, "torch_dtype": "float16", "use_cache": true, "vocab_size": 32000}
neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/llama/meta-llama/Llama-2-13b-chat-hf/a8c0b413e79c91496630.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"architectures": ["LlamaForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 1, "eos_token_id": 2, "hidden_act": "silu", "hidden_size": 5120, "initializer_range": 0.02, "intermediate_size": 13824, "max_position_embeddings": 4096, "model_type": "llama", "neuron": {"auto_cast_type": "fp16", "batch_size": 4, "checkpoint_id": "meta-llama/Llama-2-13b-chat-hf", "checkpoint_revision": "a2cb7a712bb6e5e736ca7f8cd98167f81a0b5bd8", "compiler_type": "neuronx-cc", "compiler_version": "2.13.66.0+6dfecc895", "num_cores": 8, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 40, "num_hidden_layers": 40, "num_key_value_heads": 40, "pretraining_tp": 1, "rms_norm_eps": 1e-05, "rope_scaling": null, "rope_theta": 10000.0, "tie_word_embeddings": false, "torch_dtype": "float16", "use_cache": true, "vocab_size": 32000}
neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/llama/meta-llama/Llama-2-13b-chat-hf/d68250e23574798328a7.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"architectures": ["LlamaForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 1, "eos_token_id": 2, "hidden_act": "silu", "hidden_size": 5120, "initializer_range": 0.02, "intermediate_size": 13824, "max_position_embeddings": 4096, "model_type": "llama", "neuron": {"auto_cast_type": "fp16", "batch_size": 1, "checkpoint_id": "meta-llama/Llama-2-13b-chat-hf", "checkpoint_revision": "a2cb7a712bb6e5e736ca7f8cd98167f81a0b5bd8", "compiler_type": "neuronx-cc", "compiler_version": "2.13.66.0+6dfecc895", "num_cores": 8, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 40, "num_hidden_layers": 40, "num_key_value_heads": 40, "pretraining_tp": 1, "rms_norm_eps": 1e-05, "rope_scaling": null, "rope_theta": 10000.0, "tie_word_embeddings": false, "torch_dtype": "float16", "use_cache": true, "vocab_size": 32000}
neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/mistral/mistralai/Mistral-7B-Instruct-v0.2/1245bb72b32d75db76f9.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"architectures": ["MistralForCausalLM"], "attention_dropout": 0.0, "bos_token_id": 1, "eos_token_id": 2, "hidden_act": "silu", "hidden_size": 4096, "initializer_range": 0.02, "intermediate_size": 14336, "max_position_embeddings": 32768, "model_type": "mistral", "neuron": {"auto_cast_type": "bf16", "batch_size": 4, "checkpoint_id": "mistralai/Mistral-7B-Instruct-v0.2", "checkpoint_revision": "41b61a33a2483885c981aa79e0df6b32407ed873", "compiler_type": "neuronx-cc", "compiler_version": "2.13.66.0+6dfecc895", "num_cores": 8, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 32, "num_key_value_heads": 8, "rms_norm_eps": 1e-05, "rope_theta": 1000000.0, "sliding_window": null, "tie_word_embeddings": false, "torch_dtype": "bfloat16", "use_cache": true, "vocab_size": 32000}
neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/mistral/mistralai/Mistral-7B-Instruct-v0.2/5e1e1d2ca63370d9d0a0.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"architectures": ["MistralForCausalLM"], "attention_dropout": 0.0, "bos_token_id": 1, "eos_token_id": 2, "hidden_act": "silu", "hidden_size": 4096, "initializer_range": 0.02, "intermediate_size": 14336, "max_position_embeddings": 32768, "model_type": "mistral", "neuron": {"auto_cast_type": "fp16", "batch_size": 8, "checkpoint_id": "mistralai/Mistral-7B-Instruct-v0.2", "checkpoint_revision": "41b61a33a2483885c981aa79e0df6b32407ed873", "compiler_type": "neuronx-cc", "compiler_version": "2.13.66.0+6dfecc895", "num_cores": 8, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 32, "num_key_value_heads": 8, "rms_norm_eps": 1e-05, "rope_theta": 1000000.0, "sliding_window": null, "tie_word_embeddings": false, "torch_dtype": "bfloat16", "use_cache": true, "vocab_size": 32000}
neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/mistral/mistralai/Mistral-7B-Instruct-v0.2/6255cc2875c3d0c5e501.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"architectures": ["MistralForCausalLM"], "attention_dropout": 0.0, "bos_token_id": 1, "eos_token_id": 2, "hidden_act": "silu", "hidden_size": 4096, "initializer_range": 0.02, "intermediate_size": 14336, "max_position_embeddings": 32768, "model_type": "mistral", "neuron": {"auto_cast_type": "fp16", "batch_size": 32, "checkpoint_id": "mistralai/Mistral-7B-Instruct-v0.2", "checkpoint_revision": "41b61a33a2483885c981aa79e0df6b32407ed873", "compiler_type": "neuronx-cc", "compiler_version": "2.13.66.0+6dfecc895", "num_cores": 8, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 32, "num_key_value_heads": 8, "rms_norm_eps": 1e-05, "rope_theta": 1000000.0, "sliding_window": null, "tie_word_embeddings": false, "torch_dtype": "bfloat16", "use_cache": true, "vocab_size": 32000}
neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/mistral/mistralai/Mistral-7B-Instruct-v0.2/64e0d5cd868faca4549f.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"architectures": ["MistralForCausalLM"], "attention_dropout": 0.0, "bos_token_id": 1, "eos_token_id": 2, "hidden_act": "silu", "hidden_size": 4096, "initializer_range": 0.02, "intermediate_size": 14336, "max_position_embeddings": 32768, "model_type": "mistral", "neuron": {"auto_cast_type": "bf16", "batch_size": 1, "checkpoint_id": "mistralai/Mistral-7B-Instruct-v0.2", "checkpoint_revision": "41b61a33a2483885c981aa79e0df6b32407ed873", "compiler_type": "neuronx-cc", "compiler_version": "2.13.66.0+6dfecc895", "num_cores": 8, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 32, "num_key_value_heads": 8, "rms_norm_eps": 1e-05, "rope_theta": 1000000.0, "sliding_window": null, "tie_word_embeddings": false, "torch_dtype": "bfloat16", "use_cache": true, "vocab_size": 32000}
neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/mistral/mistralai/Mistral-7B-Instruct-v0.2/733bc79383c0cc56537e.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"architectures": ["MistralForCausalLM"], "attention_dropout": 0.0, "bos_token_id": 1, "eos_token_id": 2, "hidden_act": "silu", "hidden_size": 4096, "initializer_range": 0.02, "intermediate_size": 14336, "max_position_embeddings": 32768, "model_type": "mistral", "neuron": {"auto_cast_type": "bf16", "batch_size": 16, "checkpoint_id": "mistralai/Mistral-7B-Instruct-v0.2", "checkpoint_revision": "41b61a33a2483885c981aa79e0df6b32407ed873", "compiler_type": "neuronx-cc", "compiler_version": "2.13.66.0+6dfecc895", "num_cores": 8, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 32, "num_key_value_heads": 8, "rms_norm_eps": 1e-05, "rope_theta": 1000000.0, "sliding_window": null, "tie_word_embeddings": false, "torch_dtype": "bfloat16", "use_cache": true, "vocab_size": 32000}
neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/mistral/mistralai/Mistral-7B-Instruct-v0.2/7fd9b858cf45bbf6355f.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"architectures": ["MistralForCausalLM"], "attention_dropout": 0.0, "bos_token_id": 1, "eos_token_id": 2, "hidden_act": "silu", "hidden_size": 4096, "initializer_range": 0.02, "intermediate_size": 14336, "max_position_embeddings": 32768, "model_type": "mistral", "neuron": {"auto_cast_type": "fp16", "batch_size": 16, "checkpoint_id": "mistralai/Mistral-7B-Instruct-v0.2", "checkpoint_revision": "41b61a33a2483885c981aa79e0df6b32407ed873", "compiler_type": "neuronx-cc", "compiler_version": "2.13.66.0+6dfecc895", "num_cores": 8, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 32, "num_key_value_heads": 8, "rms_norm_eps": 1e-05, "rope_theta": 1000000.0, "sliding_window": null, "tie_word_embeddings": false, "torch_dtype": "bfloat16", "use_cache": true, "vocab_size": 32000}
neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/mistral/mistralai/Mistral-7B-Instruct-v0.2/979fce2dd4e4d499c2f0.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"architectures": ["MistralForCausalLM"], "attention_dropout": 0.0, "bos_token_id": 1, "eos_token_id": 2, "hidden_act": "silu", "hidden_size": 4096, "initializer_range": 0.02, "intermediate_size": 14336, "max_position_embeddings": 32768, "model_type": "mistral", "neuron": {"auto_cast_type": "fp16", "batch_size": 4, "checkpoint_id": "mistralai/Mistral-7B-Instruct-v0.2", "checkpoint_revision": "41b61a33a2483885c981aa79e0df6b32407ed873", "compiler_type": "neuronx-cc", "compiler_version": "2.13.66.0+6dfecc895", "num_cores": 8, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 32, "num_key_value_heads": 8, "rms_norm_eps": 1e-05, "rope_theta": 1000000.0, "sliding_window": null, "tie_word_embeddings": false, "torch_dtype": "bfloat16", "use_cache": true, "vocab_size": 32000}
neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/mistral/mistralai/Mistral-7B-Instruct-v0.2/aa1ba12921766e16b7dc.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"architectures": ["MistralForCausalLM"], "attention_dropout": 0.0, "bos_token_id": 1, "eos_token_id": 2, "hidden_act": "silu", "hidden_size": 4096, "initializer_range": 0.02, "intermediate_size": 14336, "max_position_embeddings": 32768, "model_type": "mistral", "neuron": {"auto_cast_type": "fp16", "batch_size": 1, "checkpoint_id": "mistralai/Mistral-7B-Instruct-v0.2", "checkpoint_revision": "41b61a33a2483885c981aa79e0df6b32407ed873", "compiler_type": "neuronx-cc", "compiler_version": "2.13.66.0+6dfecc895", "num_cores": 8, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 32, "num_key_value_heads": 8, "rms_norm_eps": 1e-05, "rope_theta": 1000000.0, "sliding_window": null, "tie_word_embeddings": false, "torch_dtype": "bfloat16", "use_cache": true, "vocab_size": 32000}
neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/mistral/mistralai/Mistral-7B-Instruct-v0.2/ca240a79f952204527fc.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"architectures": ["MistralForCausalLM"], "attention_dropout": 0.0, "bos_token_id": 1, "eos_token_id": 2, "hidden_act": "silu", "hidden_size": 4096, "initializer_range": 0.02, "intermediate_size": 14336, "max_position_embeddings": 32768, "model_type": "mistral", "neuron": {"auto_cast_type": "bf16", "batch_size": 8, "checkpoint_id": "mistralai/Mistral-7B-Instruct-v0.2", "checkpoint_revision": "41b61a33a2483885c981aa79e0df6b32407ed873", "compiler_type": "neuronx-cc", "compiler_version": "2.13.66.0+6dfecc895", "num_cores": 8, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 32, "num_key_value_heads": 8, "rms_norm_eps": 1e-05, "rope_theta": 1000000.0, "sliding_window": null, "tie_word_embeddings": false, "torch_dtype": "bfloat16", "use_cache": true, "vocab_size": 32000}
neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/mistral/mistralai/Mistral-7B-Instruct-v0.2/eec3579b9122a80133a1.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"architectures": ["MistralForCausalLM"], "attention_dropout": 0.0, "bos_token_id": 1, "eos_token_id": 2, "hidden_act": "silu", "hidden_size": 4096, "initializer_range": 0.02, "intermediate_size": 14336, "max_position_embeddings": 32768, "model_type": "mistral", "neuron": {"auto_cast_type": "bf16", "batch_size": 32, "checkpoint_id": "mistralai/Mistral-7B-Instruct-v0.2", "checkpoint_revision": "41b61a33a2483885c981aa79e0df6b32407ed873", "compiler_type": "neuronx-cc", "compiler_version": "2.13.66.0+6dfecc895", "num_cores": 8, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 32, "num_key_value_heads": 8, "rms_norm_eps": 1e-05, "rope_theta": 1000000.0, "sliding_window": null, "tie_word_embeddings": false, "torch_dtype": "bfloat16", "use_cache": true, "vocab_size": 32000}
neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22/inference/llama/meta-llama/Llama-2-7b-chat-hf/06b52fde14a8f28d6a3d.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"architectures": ["LlamaForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 1, "eos_token_id": 2, "hidden_act": "silu", "hidden_size": 4096, "initializer_range": 0.02, "intermediate_size": 11008, "max_position_embeddings": 4096, "model_type": "llama", "neuron": {"auto_cast_type": "fp16", "batch_size": 1, "checkpoint_id": "meta-llama/Llama-2-7b-chat-hf", "checkpoint_revision": "f5db02db724555f92da89c216ac04704f23d4590", "compiler_type": "neuronx-cc", "compiler_version": "2.13.66.0+6dfecc895", "num_cores": 2, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 32, "num_key_value_heads": 32, "pretraining_tp": 1, "rms_norm_eps": 1e-05, "rope_scaling": null, "rope_theta": 10000.0, "tie_word_embeddings": false, "torch_dtype": "float16", "use_cache": true, "vocab_size": 32000}
neuronxcc-2.13.66.0+6dfecc895/MODULE_007ddbaadfdea74c4db5+2c2d707e/model.neff CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3ad504235ae58759a762486abdfcb61460190608c0d5d68eb7748bef1e742863
3
  size 13282304
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8559beec2df842857f647f9921c6ff30f0f3f20a4e17b0e3c7142e24902f7d90
3
  size 13282304
neuronxcc-2.13.66.0+6dfecc895/MODULE_01076e8d78b992483879+2c2d707e/compile_flags.txt ADDED
@@ -0,0 +1 @@
 
 
1
+ --model-type=transformer --auto-cast=none
neuronxcc-2.13.66.0+6dfecc895/MODULE_01076e8d78b992483879+2c2d707e/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d6c5cb1275fbbfedb3e7c4d72e9f6d73845364943f9acbd07471933811598a8c
3
+ size 318327
neuronxcc-2.13.66.0+6dfecc895/MODULE_01076e8d78b992483879+2c2d707e/model.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b746795a76c3239b01e328887743aa1ff4f15a53edfd7ce972e87d1d25efc2ae
3
+ size 2479104
neuronxcc-2.13.66.0+6dfecc895/MODULE_023098bfa18bb6b7e093+2c2d707e/compile_flags.txt ADDED
@@ -0,0 +1 @@
 
 
1
+ --model-type=transformer --auto-cast=none
neuronxcc-2.13.66.0+6dfecc895/MODULE_023098bfa18bb6b7e093+2c2d707e/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6a6ee9aeae30bd5ffafa657854c5e7fe9f5ee68d40fb5051fa38ddb466ab550a
3
+ size 380699
neuronxcc-2.13.66.0+6dfecc895/MODULE_023098bfa18bb6b7e093+2c2d707e/model.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fb3f3c7216a6bf0233c0d9a87aa36f17575d8300bb9c386b78fea60e1043a3ba
3
+ size 18709504
neuronxcc-2.13.66.0+6dfecc895/MODULE_068011707d27c0821a21+2c2d707e/compile_flags.txt ADDED
@@ -0,0 +1 @@
 
 
1
+ --model-type=transformer --auto-cast=none
neuronxcc-2.13.66.0+6dfecc895/MODULE_068011707d27c0821a21+2c2d707e/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:33455a4af632d1f01d5ba298df3d50b02e3e117471d40338a86b56ff493e59e2
3
+ size 357616
neuronxcc-2.13.66.0+6dfecc895/MODULE_068011707d27c0821a21+2c2d707e/model.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:45314103ad7921853f53cc774885c2192c599b7317e859ac0e235144b003a7f9
3
+ size 28959744
neuronxcc-2.13.66.0+6dfecc895/MODULE_0c9f98ff6f5d2ff116cb+2c2d707e/compile_flags.txt ADDED
@@ -0,0 +1 @@
 
 
1
+ --model-type=transformer --auto-cast=none
neuronxcc-2.13.66.0+6dfecc895/MODULE_0c9f98ff6f5d2ff116cb+2c2d707e/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ac56ab5510f7844416010b4518e04c84a2df0dbae79e033b76c6e731507d9a80
3
+ size 299226
neuronxcc-2.13.66.0+6dfecc895/MODULE_0c9f98ff6f5d2ff116cb+2c2d707e/model.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:60bd9a4f077016460a5a442a5353e313304939c7752a1a609f0f74a209fc7985
3
+ size 7814144
neuronxcc-2.13.66.0+6dfecc895/MODULE_104a70223ddf21bd9b47+2c2d707e/compile_flags.txt ADDED
@@ -0,0 +1 @@
 
 
1
+ --model-type=transformer --auto-cast=none
neuronxcc-2.13.66.0+6dfecc895/MODULE_104a70223ddf21bd9b47+2c2d707e/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1e7047a8a0af3e0426169af64ca17c84415f74416273f08a0bbe78a93e9cd816
3
+ size 419433
neuronxcc-2.13.66.0+6dfecc895/MODULE_104a70223ddf21bd9b47+2c2d707e/model.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be52dbcdf1c3a2fe1f2a3185a7e622b1b9a274d2dc3efd3f935b844e8d5a4412
3
+ size 8530944
neuronxcc-2.13.66.0+6dfecc895/MODULE_122e6a965070aa927ca3+2c2d707e/compile_flags.txt ADDED
@@ -0,0 +1 @@
 
 
1
+ --model-type=transformer --auto-cast=none
neuronxcc-2.13.66.0+6dfecc895/MODULE_122e6a965070aa927ca3+2c2d707e/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4785aa52c8c855926a7eee940c7db2b1869e6541bd9d0c4a1cb68bc96a4d9a5c
3
+ size 329721
neuronxcc-2.13.66.0+6dfecc895/MODULE_122e6a965070aa927ca3+2c2d707e/model.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:23e8954ecb98f9debff5025a0118a27ae96c1744abace766ccbc9c98dcab34e5
3
+ size 2468864
neuronxcc-2.13.66.0+6dfecc895/MODULE_1f1e07d570ee56041d0a+2c2d707e/compile_flags.txt ADDED
@@ -0,0 +1 @@
 
 
1
+ --model-type=transformer --auto-cast=none
neuronxcc-2.13.66.0+6dfecc895/MODULE_1f1e07d570ee56041d0a+2c2d707e/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:107d39f49881e6d2982ea9d36c22953545de064b0bbae09b7ac4cc2cd8144575
3
+ size 318327
neuronxcc-2.13.66.0+6dfecc895/MODULE_1f1e07d570ee56041d0a+2c2d707e/model.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:67441fee53b92ca9d81863bb3177306b38c16c873f801b356e1e50e79e3f261f
3
+ size 2581504
neuronxcc-2.13.66.0+6dfecc895/MODULE_20906ae3bb104009b559+2c2d707e/compile_flags.txt ADDED
@@ -0,0 +1 @@
 
 
1
+ --model-type=transformer --auto-cast=none
neuronxcc-2.13.66.0+6dfecc895/MODULE_20906ae3bb104009b559+2c2d707e/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:21e40c363503f6a8e7f9909acc1a367f1185440f5a601f63e8e9203264807752
3
+ size 410810
neuronxcc-2.13.66.0+6dfecc895/MODULE_20906ae3bb104009b559+2c2d707e/model.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f735dd1ca52546b029bf3b6c832291b2dfcfa3498c7e0d16e5da513c27437900
3
+ size 3216384
neuronxcc-2.13.66.0+6dfecc895/MODULE_21b1b0223e4fb6f5af41+2c2d707e/model.neff CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:647d4971554b115074a5d1efb73a71b547215bc89bc5ac3af9683f91af042454
3
  size 2161664
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a3f7daaa297382b89110fd4fa0c5bf14ea42e5008640cb0778fa0653ca455b89
3
  size 2161664
neuronxcc-2.13.66.0+6dfecc895/MODULE_21d7ca83fa40eaf22249+2c2d707e/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3fea25155c53bcf57abee0cb3bc910b63454a0c95fd7b2bb50a36bd2539cf184
3
+ size 318327
neuronxcc-2.13.66.0+6dfecc895/MODULE_237d06dbfd8a5be615d7+2c2d707e/compile_flags.txt ADDED
@@ -0,0 +1 @@
 
 
1
+ --model-type=transformer --auto-cast=none
neuronxcc-2.13.66.0+6dfecc895/MODULE_237d06dbfd8a5be615d7+2c2d707e/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:888056ebb363a72225fbd0c21dfc7124667cea21cece58e6de57285793a4a205
3
+ size 318138
neuronxcc-2.13.66.0+6dfecc895/MODULE_237d06dbfd8a5be615d7+2c2d707e/model.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:22aa3623e3c8ba6578c4ae047aa81b155e31be00f3aa8634f5511e164144588a
3
+ size 3144704
neuronxcc-2.13.66.0+6dfecc895/MODULE_259391de413611a000d7+2c2d707e/compile_flags.txt ADDED
@@ -0,0 +1 @@
 
 
1
+ --model-type=transformer --auto-cast=none
neuronxcc-2.13.66.0+6dfecc895/MODULE_259391de413611a000d7+2c2d707e/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:567cf9d49d838ee5bb1e67dcb3d79c00b18972f82e113b396ddfebbd1a41b397
3
+ size 346060
neuronxcc-2.13.66.0+6dfecc895/MODULE_259391de413611a000d7+2c2d707e/model.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7849f5d2ef765bdf5998b357cc3e1e438f2b0db49c427c2fc62473b8c2af91f7
3
+ size 30546944
neuronxcc-2.13.66.0+6dfecc895/MODULE_298bc643cbb368dd898d+2c2d707e/compile_flags.txt ADDED
@@ -0,0 +1 @@
 
 
1
+ --model-type=transformer --auto-cast=none