Synchronizing local compiler cache.
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +48 -0
- neuronxcc-2.14.213.0+013d129b/0_REGISTRY/0.0.24.dev0/inference/llama/NousResearch/Hermes-2-Theta-Llama-3-8B/7560e48b8ccab7f8e283.json +1 -0
- neuronxcc-2.14.213.0+013d129b/0_REGISTRY/0.0.24.dev0/inference/llama/NousResearch/Hermes-2-Theta-Llama-3-8B/7bedca11d8eef0f022b7.json +1 -0
- neuronxcc-2.14.213.0+013d129b/0_REGISTRY/0.0.24.dev0/inference/llama/meta-llama/Meta-Llama-3-8B/17c656c7abb64c7466dd.json +1 -0
- neuronxcc-2.14.213.0+013d129b/0_REGISTRY/0.0.24.dev0/inference/llama/meta-llama/Meta-Llama-3-8B/57089b23be0910d8cbc8.json +1 -0
- neuronxcc-2.14.213.0+013d129b/0_REGISTRY/0.0.24.dev0/inference/llama/meta-llama/Meta-Llama-3-8B/6767790cca5f811d84f5.json +1 -0
- neuronxcc-2.14.213.0+013d129b/0_REGISTRY/0.0.24.dev0/inference/llama/meta-llama/Meta-Llama-3-8B/740ed7b654b7c18270dd.json +1 -0
- neuronxcc-2.14.213.0+013d129b/0_REGISTRY/0.0.24.dev0/inference/llama/meta-llama/Meta-Llama-3-8B/91b57a8edda1c1c3a3ce.json +1 -0
- neuronxcc-2.14.213.0+013d129b/0_REGISTRY/0.0.24.dev0/inference/llama/meta-llama/Meta-Llama-3-8B/d93f0bb3e47016036365.json +1 -0
- neuronxcc-2.14.213.0+013d129b/0_REGISTRY/0.0.24.dev0/inference/llama/princeton-nlp/Sheared-LLaMA-1.3B/f69d881a5f54838a96cb.json +1 -0
- neuronxcc-2.14.213.0+013d129b/0_REGISTRY/0.0.24.dev0/inference/llama/princeton-nlp/Sheared-LLaMA-2.7B/65af25a07a9af664c36d.json +1 -0
- neuronxcc-2.14.213.0+013d129b/MODULE_0157f35eb303445e190f+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.14.213.0+013d129b/MODULE_0157f35eb303445e190f+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.14.213.0+013d129b/MODULE_0157f35eb303445e190f+2c2d707e/model.neff +3 -0
- neuronxcc-2.14.213.0+013d129b/MODULE_0176fb35e78494db681c+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.14.213.0+013d129b/MODULE_0176fb35e78494db681c+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.14.213.0+013d129b/MODULE_0176fb35e78494db681c+2c2d707e/model.neff +3 -0
- neuronxcc-2.14.213.0+013d129b/MODULE_01cc804175cc5fb0e309+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.14.213.0+013d129b/MODULE_01cc804175cc5fb0e309+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.14.213.0+013d129b/MODULE_01cc804175cc5fb0e309+2c2d707e/model.neff +3 -0
- neuronxcc-2.14.213.0+013d129b/MODULE_146077388d26b5450bf4+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.14.213.0+013d129b/MODULE_146077388d26b5450bf4+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.14.213.0+013d129b/MODULE_146077388d26b5450bf4+2c2d707e/model.neff +3 -0
- neuronxcc-2.14.213.0+013d129b/MODULE_1d5c76706b604a934e43+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.14.213.0+013d129b/MODULE_1d5c76706b604a934e43+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.14.213.0+013d129b/MODULE_1d5c76706b604a934e43+2c2d707e/model.neff +3 -0
- neuronxcc-2.14.213.0+013d129b/MODULE_1e7a2f7302fa2bde6e72+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.14.213.0+013d129b/MODULE_1e7a2f7302fa2bde6e72+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.14.213.0+013d129b/MODULE_1e7a2f7302fa2bde6e72+2c2d707e/model.neff +3 -0
- neuronxcc-2.14.213.0+013d129b/MODULE_21e3dcaee19883fe287e+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.14.213.0+013d129b/MODULE_21e3dcaee19883fe287e+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.14.213.0+013d129b/MODULE_21e3dcaee19883fe287e+2c2d707e/model.neff +3 -0
- neuronxcc-2.14.213.0+013d129b/MODULE_298c803bdff39c3d92ed+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.14.213.0+013d129b/MODULE_298c803bdff39c3d92ed+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.14.213.0+013d129b/MODULE_298c803bdff39c3d92ed+2c2d707e/model.neff +3 -0
- neuronxcc-2.14.213.0+013d129b/MODULE_29fb2a5ae4896a78c559+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.14.213.0+013d129b/MODULE_29fb2a5ae4896a78c559+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.14.213.0+013d129b/MODULE_29fb2a5ae4896a78c559+2c2d707e/model.neff +3 -0
- neuronxcc-2.14.213.0+013d129b/MODULE_2b55711d93e1566cdd78+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.14.213.0+013d129b/MODULE_2b55711d93e1566cdd78+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.14.213.0+013d129b/MODULE_2b55711d93e1566cdd78+2c2d707e/model.neff +0 -0
- neuronxcc-2.14.213.0+013d129b/MODULE_2f46e3e3a9cc37a9f386+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.14.213.0+013d129b/MODULE_2f46e3e3a9cc37a9f386+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.14.213.0+013d129b/MODULE_2f46e3e3a9cc37a9f386+2c2d707e/model.neff +3 -0
- neuronxcc-2.14.213.0+013d129b/MODULE_33719efab65aba8971de+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.14.213.0+013d129b/MODULE_33719efab65aba8971de+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.14.213.0+013d129b/MODULE_33719efab65aba8971de+2c2d707e/model.neff +3 -0
- neuronxcc-2.14.213.0+013d129b/MODULE_345116edd09879b7ebe4+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.14.213.0+013d129b/MODULE_345116edd09879b7ebe4+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.14.213.0+013d129b/MODULE_345116edd09879b7ebe4+2c2d707e/model.neff +3 -0
.gitattributes
CHANGED
@@ -401,3 +401,51 @@ neuronxcc-2.14.213.0+013d129b/MODULE_b56a2aeda0f893ae933e+2c2d707e/model.neff fi
|
|
401 |
neuronxcc-2.14.213.0+013d129b/MODULE_7651246321963ddd5906+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
402 |
neuronxcc-2.14.213.0+013d129b/MODULE_ade80a2b19e816657dab+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
403 |
neuronxcc-2.14.213.0+013d129b/MODULE_3ee79106ae9bfc013100+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
401 |
neuronxcc-2.14.213.0+013d129b/MODULE_7651246321963ddd5906+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
402 |
neuronxcc-2.14.213.0+013d129b/MODULE_ade80a2b19e816657dab+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
403 |
neuronxcc-2.14.213.0+013d129b/MODULE_3ee79106ae9bfc013100+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
404 |
+
neuronxcc-2.14.213.0+013d129b/MODULE_0157f35eb303445e190f+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
405 |
+
neuronxcc-2.14.213.0+013d129b/MODULE_0176fb35e78494db681c+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
406 |
+
neuronxcc-2.14.213.0+013d129b/MODULE_01cc804175cc5fb0e309+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
407 |
+
neuronxcc-2.14.213.0+013d129b/MODULE_146077388d26b5450bf4+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
408 |
+
neuronxcc-2.14.213.0+013d129b/MODULE_1d5c76706b604a934e43+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
409 |
+
neuronxcc-2.14.213.0+013d129b/MODULE_1e7a2f7302fa2bde6e72+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
410 |
+
neuronxcc-2.14.213.0+013d129b/MODULE_21e3dcaee19883fe287e+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
411 |
+
neuronxcc-2.14.213.0+013d129b/MODULE_298c803bdff39c3d92ed+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
412 |
+
neuronxcc-2.14.213.0+013d129b/MODULE_29fb2a5ae4896a78c559+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
413 |
+
neuronxcc-2.14.213.0+013d129b/MODULE_2f46e3e3a9cc37a9f386+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
414 |
+
neuronxcc-2.14.213.0+013d129b/MODULE_33719efab65aba8971de+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
415 |
+
neuronxcc-2.14.213.0+013d129b/MODULE_345116edd09879b7ebe4+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
416 |
+
neuronxcc-2.14.213.0+013d129b/MODULE_35628e0e7065fd39f1c5+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
417 |
+
neuronxcc-2.14.213.0+013d129b/MODULE_35d96999ee4913118e5e+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
418 |
+
neuronxcc-2.14.213.0+013d129b/MODULE_37baed5161817467e45e+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
419 |
+
neuronxcc-2.14.213.0+013d129b/MODULE_392abcf826a8895949c4+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
420 |
+
neuronxcc-2.14.213.0+013d129b/MODULE_4db722886dbd5a0e90d3+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
421 |
+
neuronxcc-2.14.213.0+013d129b/MODULE_4f822640d7fcf1269c2a+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
422 |
+
neuronxcc-2.14.213.0+013d129b/MODULE_5ddb9c233d7c07c4b83e+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
423 |
+
neuronxcc-2.14.213.0+013d129b/MODULE_697621df8336098e9fb7+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
424 |
+
neuronxcc-2.14.213.0+013d129b/MODULE_712f16088b92ce1552a7+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
425 |
+
neuronxcc-2.14.213.0+013d129b/MODULE_7e1a306b8f44990e78be+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
426 |
+
neuronxcc-2.14.213.0+013d129b/MODULE_822bf0763f23d1cc785a+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
427 |
+
neuronxcc-2.14.213.0+013d129b/MODULE_88bb293cbec6b542e9b1+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
428 |
+
neuronxcc-2.14.213.0+013d129b/MODULE_8a2412619fc03f78847e+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
429 |
+
neuronxcc-2.14.213.0+013d129b/MODULE_8ae58871e7bd6db4281f+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
430 |
+
neuronxcc-2.14.213.0+013d129b/MODULE_941adcb49c0b0f9430a7+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
431 |
+
neuronxcc-2.14.213.0+013d129b/MODULE_9434d1e41373f6a0341d+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
432 |
+
neuronxcc-2.14.213.0+013d129b/MODULE_981bf151b4d4d1bfaba6+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
433 |
+
neuronxcc-2.14.213.0+013d129b/MODULE_99e853ec7bc39799a1f7+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
434 |
+
neuronxcc-2.14.213.0+013d129b/MODULE_a5ebe619cd15ee115b6b+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
435 |
+
neuronxcc-2.14.213.0+013d129b/MODULE_b79befd674e052c44c9f+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
436 |
+
neuronxcc-2.14.213.0+013d129b/MODULE_b90aa3def33709e0aece+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
437 |
+
neuronxcc-2.14.213.0+013d129b/MODULE_bc64d40e1427eab85ba8+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
438 |
+
neuronxcc-2.14.213.0+013d129b/MODULE_bc9b64a5de7b4f5eae3a+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
439 |
+
neuronxcc-2.14.213.0+013d129b/MODULE_ce4004e47d7f9259e48d+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
440 |
+
neuronxcc-2.14.213.0+013d129b/MODULE_cebc0d79dffdb4b073d7+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
441 |
+
neuronxcc-2.14.213.0+013d129b/MODULE_cf27c4eb2bcac29fb7ec+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
442 |
+
neuronxcc-2.14.213.0+013d129b/MODULE_d11a14fe0d09008357f2+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
443 |
+
neuronxcc-2.14.213.0+013d129b/MODULE_d37372bb65f76ac89b24+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
444 |
+
neuronxcc-2.14.213.0+013d129b/MODULE_d3c1fe65e3a050366815+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
445 |
+
neuronxcc-2.14.213.0+013d129b/MODULE_dde109d51980e5534145+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
446 |
+
neuronxcc-2.14.213.0+013d129b/MODULE_ddff37e03914d1e4cc1a+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
447 |
+
neuronxcc-2.14.213.0+013d129b/MODULE_eae40350bbf4ea1569ad+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
448 |
+
neuronxcc-2.14.213.0+013d129b/MODULE_ec7ce1cb59fb29fdc73b+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
449 |
+
neuronxcc-2.14.213.0+013d129b/MODULE_ed56de1578306228c0e9+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
450 |
+
neuronxcc-2.14.213.0+013d129b/MODULE_f3c3e815bc8fb3c7b0a3+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
451 |
+
neuronxcc-2.14.213.0+013d129b/MODULE_f5819d12264aac7692e2+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
neuronxcc-2.14.213.0+013d129b/0_REGISTRY/0.0.24.dev0/inference/llama/NousResearch/Hermes-2-Theta-Llama-3-8B/7560e48b8ccab7f8e283.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"architectures": ["LlamaForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 128000, "eos_token_id": 128003, "hidden_act": "silu", "hidden_size": 4096, "initializer_range": 0.02, "intermediate_size": 14336, "max_position_embeddings": 8192, "mlp_bias": false, "model_type": "llama", "neuron": {"auto_cast_type": "fp16", "batch_size": 4, "checkpoint_id": "NousResearch/Hermes-2-Theta-Llama-3-8B", "checkpoint_revision": "885173e97ab8572b444f7db1290d5d0386e26816", "compiler_type": "neuronx-cc", "compiler_version": "2.14.213.0+013d129b", "num_cores": 2, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 32, "num_key_value_heads": 8, "pretraining_tp": 1, "rms_norm_eps": 1e-05, "rope_scaling": null, "rope_theta": 500000.0, "tie_word_embeddings": false, "torch_dtype": "bfloat16", "use_cache": true, "vocab_size": 128256}
|
neuronxcc-2.14.213.0+013d129b/0_REGISTRY/0.0.24.dev0/inference/llama/NousResearch/Hermes-2-Theta-Llama-3-8B/7bedca11d8eef0f022b7.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"architectures": ["LlamaForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 128000, "eos_token_id": 128003, "hidden_act": "silu", "hidden_size": 4096, "initializer_range": 0.02, "intermediate_size": 14336, "max_position_embeddings": 8192, "mlp_bias": false, "model_type": "llama", "neuron": {"auto_cast_type": "fp16", "batch_size": 4, "checkpoint_id": "NousResearch/Hermes-2-Theta-Llama-3-8B", "checkpoint_revision": "81fc25d402859151f907ad479b18070a3c5a3c11", "compiler_type": "neuronx-cc", "compiler_version": "2.14.213.0+013d129b", "num_cores": 2, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 32, "num_key_value_heads": 8, "pretraining_tp": 1, "rms_norm_eps": 1e-05, "rope_scaling": null, "rope_theta": 500000.0, "tie_word_embeddings": false, "torch_dtype": "bfloat16", "use_cache": true, "vocab_size": 128256}
|
neuronxcc-2.14.213.0+013d129b/0_REGISTRY/0.0.24.dev0/inference/llama/meta-llama/Meta-Llama-3-8B/17c656c7abb64c7466dd.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"architectures": ["LlamaForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 128000, "eos_token_id": 128001, "hidden_act": "silu", "hidden_size": 4096, "initializer_range": 0.02, "intermediate_size": 14336, "max_position_embeddings": 8192, "mlp_bias": false, "model_type": "llama", "neuron": {"auto_cast_type": "fp16", "batch_size": 16, "checkpoint_id": "meta-llama/Meta-Llama-3-8B", "checkpoint_revision": "62bd457b6fe961a42a631306577e622c83876cb6", "compiler_type": "neuronx-cc", "compiler_version": "2.14.213.0+013d129b", "num_cores": 8, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 32, "num_key_value_heads": 8, "pretraining_tp": 1, "rms_norm_eps": 1e-05, "rope_scaling": null, "rope_theta": 500000.0, "tie_word_embeddings": false, "torch_dtype": "bfloat16", "use_cache": true, "vocab_size": 128256}
|
neuronxcc-2.14.213.0+013d129b/0_REGISTRY/0.0.24.dev0/inference/llama/meta-llama/Meta-Llama-3-8B/57089b23be0910d8cbc8.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"architectures": ["LlamaForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 128000, "eos_token_id": 128001, "hidden_act": "silu", "hidden_size": 4096, "initializer_range": 0.02, "intermediate_size": 14336, "max_position_embeddings": 8192, "mlp_bias": false, "model_type": "llama", "neuron": {"auto_cast_type": "fp16", "batch_size": 1, "checkpoint_id": "meta-llama/Meta-Llama-3-8B", "checkpoint_revision": "62bd457b6fe961a42a631306577e622c83876cb6", "compiler_type": "neuronx-cc", "compiler_version": "2.14.213.0+013d129b", "num_cores": 8, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 32, "num_key_value_heads": 8, "pretraining_tp": 1, "rms_norm_eps": 1e-05, "rope_scaling": null, "rope_theta": 500000.0, "tie_word_embeddings": false, "torch_dtype": "bfloat16", "use_cache": true, "vocab_size": 128256}
|
neuronxcc-2.14.213.0+013d129b/0_REGISTRY/0.0.24.dev0/inference/llama/meta-llama/Meta-Llama-3-8B/6767790cca5f811d84f5.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"architectures": ["LlamaForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 128000, "eos_token_id": 128001, "hidden_act": "silu", "hidden_size": 4096, "initializer_range": 0.02, "intermediate_size": 14336, "max_position_embeddings": 8192, "mlp_bias": false, "model_type": "llama", "neuron": {"auto_cast_type": "fp16", "batch_size": 4, "checkpoint_id": "meta-llama/Meta-Llama-3-8B", "checkpoint_revision": "62bd457b6fe961a42a631306577e622c83876cb6", "compiler_type": "neuronx-cc", "compiler_version": "2.14.213.0+013d129b", "num_cores": 2, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 32, "num_key_value_heads": 8, "pretraining_tp": 1, "rms_norm_eps": 1e-05, "rope_scaling": null, "rope_theta": 500000.0, "tie_word_embeddings": false, "torch_dtype": "bfloat16", "use_cache": true, "vocab_size": 128256}
|
neuronxcc-2.14.213.0+013d129b/0_REGISTRY/0.0.24.dev0/inference/llama/meta-llama/Meta-Llama-3-8B/740ed7b654b7c18270dd.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"architectures": ["LlamaForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 128000, "eos_token_id": 128001, "hidden_act": "silu", "hidden_size": 4096, "initializer_range": 0.02, "intermediate_size": 14336, "max_position_embeddings": 8192, "mlp_bias": false, "model_type": "llama", "neuron": {"auto_cast_type": "fp16", "batch_size": 32, "checkpoint_id": "meta-llama/Meta-Llama-3-8B", "checkpoint_revision": "62bd457b6fe961a42a631306577e622c83876cb6", "compiler_type": "neuronx-cc", "compiler_version": "2.14.213.0+013d129b", "num_cores": 8, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 32, "num_key_value_heads": 8, "pretraining_tp": 1, "rms_norm_eps": 1e-05, "rope_scaling": null, "rope_theta": 500000.0, "tie_word_embeddings": false, "torch_dtype": "bfloat16", "use_cache": true, "vocab_size": 128256}
|
neuronxcc-2.14.213.0+013d129b/0_REGISTRY/0.0.24.dev0/inference/llama/meta-llama/Meta-Llama-3-8B/91b57a8edda1c1c3a3ce.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"architectures": ["LlamaForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 128000, "eos_token_id": 128001, "hidden_act": "silu", "hidden_size": 4096, "initializer_range": 0.02, "intermediate_size": 14336, "max_position_embeddings": 8192, "mlp_bias": false, "model_type": "llama", "neuron": {"auto_cast_type": "fp16", "batch_size": 4, "checkpoint_id": "meta-llama/Meta-Llama-3-8B", "checkpoint_revision": "62bd457b6fe961a42a631306577e622c83876cb6", "compiler_type": "neuronx-cc", "compiler_version": "2.14.213.0+013d129b", "num_cores": 8, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 32, "num_key_value_heads": 8, "pretraining_tp": 1, "rms_norm_eps": 1e-05, "rope_scaling": null, "rope_theta": 500000.0, "tie_word_embeddings": false, "torch_dtype": "bfloat16", "use_cache": true, "vocab_size": 128256}
|
neuronxcc-2.14.213.0+013d129b/0_REGISTRY/0.0.24.dev0/inference/llama/meta-llama/Meta-Llama-3-8B/d93f0bb3e47016036365.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"architectures": ["LlamaForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 128000, "eos_token_id": 128001, "hidden_act": "silu", "hidden_size": 4096, "initializer_range": 0.02, "intermediate_size": 14336, "max_position_embeddings": 8192, "mlp_bias": false, "model_type": "llama", "neuron": {"auto_cast_type": "fp16", "batch_size": 8, "checkpoint_id": "meta-llama/Meta-Llama-3-8B", "checkpoint_revision": "62bd457b6fe961a42a631306577e622c83876cb6", "compiler_type": "neuronx-cc", "compiler_version": "2.14.213.0+013d129b", "num_cores": 8, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 32, "num_key_value_heads": 8, "pretraining_tp": 1, "rms_norm_eps": 1e-05, "rope_scaling": null, "rope_theta": 500000.0, "tie_word_embeddings": false, "torch_dtype": "bfloat16", "use_cache": true, "vocab_size": 128256}
|
neuronxcc-2.14.213.0+013d129b/0_REGISTRY/0.0.24.dev0/inference/llama/princeton-nlp/Sheared-LLaMA-1.3B/f69d881a5f54838a96cb.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"architectures": ["LlamaForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 1, "eos_token_id": 2, "hidden_act": "silu", "hidden_size": 2048, "initializer_range": 0.02, "intermediate_size": 5504, "max_position_embeddings": 4096, "mlp_bias": false, "model_type": "llama", "neuron": {"auto_cast_type": "fp32", "batch_size": 4, "checkpoint_id": "princeton-nlp/Sheared-LLaMA-1.3B", "checkpoint_revision": "a4b76938edbf571ea7d7d9904861cbdca08809b4", "compiler_type": "neuronx-cc", "compiler_version": "2.14.213.0+013d129b", "num_cores": 2, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 16, "num_hidden_layers": 24, "num_key_value_heads": 16, "pad_token_id": 0, "pretraining_tp": 1, "rms_norm_eps": 1e-05, "rope_scaling": null, "rope_theta": 10000.0, "tie_word_embeddings": false, "torch_dtype": "float32", "use_cache": true, "vocab_size": 32000}
|
neuronxcc-2.14.213.0+013d129b/0_REGISTRY/0.0.24.dev0/inference/llama/princeton-nlp/Sheared-LLaMA-2.7B/65af25a07a9af664c36d.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"architectures": ["LlamaForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 1, "eos_token_id": 2, "hidden_act": "silu", "hidden_size": 2560, "initializer_range": 0.02, "intermediate_size": 6912, "max_position_embeddings": 4096, "mlp_bias": false, "model_type": "llama", "neuron": {"auto_cast_type": "fp16", "batch_size": 4, "checkpoint_id": "princeton-nlp/Sheared-LLaMA-2.7B", "checkpoint_revision": "2f157a0306b75d37694ae05f6a4067220254d540", "compiler_type": "neuronx-cc", "compiler_version": "2.14.213.0+013d129b", "num_cores": 2, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 20, "num_hidden_layers": 32, "num_key_value_heads": 20, "pad_token_id": 0, "pretraining_tp": 1, "rms_norm_eps": 1e-05, "rope_scaling": null, "rope_theta": 10000.0, "tie_word_embeddings": false, "torch_dtype": "float32", "use_cache": true, "vocab_size": 32000}
|
neuronxcc-2.14.213.0+013d129b/MODULE_0157f35eb303445e190f+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.14.213.0+013d129b/MODULE_0157f35eb303445e190f+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:78bda1c787c58a7c91b56f5c7bc8cffba94e94affe25ed93afd5e75f1b41e5ef
|
3 |
+
size 263042
|
neuronxcc-2.14.213.0+013d129b/MODULE_0157f35eb303445e190f+2c2d707e/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8707aff7a4548a17e4b1a9cdc0f731909a6f9661fc8c021aff486e777f6d012a
|
3 |
+
size 2950144
|
neuronxcc-2.14.213.0+013d129b/MODULE_0176fb35e78494db681c+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.14.213.0+013d129b/MODULE_0176fb35e78494db681c+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5178ed4ecb814449145b310b3b7c5f60238d21270b2cedd6725f9ebb17cc80aa
|
3 |
+
size 256609
|
neuronxcc-2.14.213.0+013d129b/MODULE_0176fb35e78494db681c+2c2d707e/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c5d72b028aa844df5430ef1e00dd6958aca2a52986f19fe1c3f23090c3116b9a
|
3 |
+
size 3748864
|
neuronxcc-2.14.213.0+013d129b/MODULE_01cc804175cc5fb0e309+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.14.213.0+013d129b/MODULE_01cc804175cc5fb0e309+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d1f9c7e6febf4b6937cf831c6ec7659ef5b065859fc687e36653a12472a9a257
|
3 |
+
size 360581
|
neuronxcc-2.14.213.0+013d129b/MODULE_01cc804175cc5fb0e309+2c2d707e/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d73bdb0e4ba255c5efad14cd2396f9ec9e61cf8e80c3c9f028bee75885525917
|
3 |
+
size 3963904
|
neuronxcc-2.14.213.0+013d129b/MODULE_146077388d26b5450bf4+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.14.213.0+013d129b/MODULE_146077388d26b5450bf4+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:069b6db549c78b0645211b900002a69c5a791edfeac2f850bb6b4544d10f6535
|
3 |
+
size 323888
|
neuronxcc-2.14.213.0+013d129b/MODULE_146077388d26b5450bf4+2c2d707e/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3399c960a5b7e3d5c77ee10c6474ae1729bc462a9969d33541632e7751d2909c
|
3 |
+
size 2653184
|
neuronxcc-2.14.213.0+013d129b/MODULE_1d5c76706b604a934e43+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.14.213.0+013d129b/MODULE_1d5c76706b604a934e43+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:75ddd0fa36baa1ffccb172c1a5e0c2af3a9aec90cf1a79ecbef7a9e747040e4a
|
3 |
+
size 333872
|
neuronxcc-2.14.213.0+013d129b/MODULE_1d5c76706b604a934e43+2c2d707e/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:adb3389f28222e26edd1e762ecc770c7b09aeb038f831c6b845429bbf25045f1
|
3 |
+
size 2386944
|
neuronxcc-2.14.213.0+013d129b/MODULE_1e7a2f7302fa2bde6e72+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.14.213.0+013d129b/MODULE_1e7a2f7302fa2bde6e72+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:12d0cae17db1f3f34e3982dff35139cf4d2ce78c855cfa280486263850234f5f
|
3 |
+
size 350595
|
neuronxcc-2.14.213.0+013d129b/MODULE_1e7a2f7302fa2bde6e72+2c2d707e/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e51a18e1517e5810b1214528cb2547af00043d3313f42cd61a82e779a23784f2
|
3 |
+
size 3585024
|
neuronxcc-2.14.213.0+013d129b/MODULE_21e3dcaee19883fe287e+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.14.213.0+013d129b/MODULE_21e3dcaee19883fe287e+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c13b522ad45166c5df2d2864c1eb75df2e240879c6db4533b22fec098ee634cf
|
3 |
+
size 266465
|
neuronxcc-2.14.213.0+013d129b/MODULE_21e3dcaee19883fe287e+2c2d707e/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ac3da95930a4625d028e4223d1acf870ecf01483fee18d7b12c0d0dd20a4e703
|
3 |
+
size 13579264
|
neuronxcc-2.14.213.0+013d129b/MODULE_298c803bdff39c3d92ed+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.14.213.0+013d129b/MODULE_298c803bdff39c3d92ed+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ea4765221484edc95f6b892f58d320d4640f81b80c34a882c4e96efab5208b14
|
3 |
+
size 325426
|
neuronxcc-2.14.213.0+013d129b/MODULE_298c803bdff39c3d92ed+2c2d707e/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:188c4e77e56f8578f751fe2819c365c94bf9782f40e3b5a282b73a68808861ce
|
3 |
+
size 34233344
|
neuronxcc-2.14.213.0+013d129b/MODULE_29fb2a5ae4896a78c559+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.14.213.0+013d129b/MODULE_29fb2a5ae4896a78c559+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4f8ee595e96ede06e08a1ff8f0fb0a8fa92f20c3e0b69a1c1e07452f872475b8
|
3 |
+
size 350595
|
neuronxcc-2.14.213.0+013d129b/MODULE_29fb2a5ae4896a78c559+2c2d707e/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5038d968469d32789fb84f57eebc1a9a42d281fc03662548566a0d220cfb6228
|
3 |
+
size 6145024
|
neuronxcc-2.14.213.0+013d129b/MODULE_2b55711d93e1566cdd78+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.14.213.0+013d129b/MODULE_2b55711d93e1566cdd78+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:65c9163db0fcabd8c5baaa381b64b90b7cb9a63aa5a497c6666801bced2b885e
|
3 |
+
size 44451
|
neuronxcc-2.14.213.0+013d129b/MODULE_2b55711d93e1566cdd78+2c2d707e/model.neff
ADDED
Binary file (400 kB). View file
|
|
neuronxcc-2.14.213.0+013d129b/MODULE_2f46e3e3a9cc37a9f386+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.14.213.0+013d129b/MODULE_2f46e3e3a9cc37a9f386+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2e2ab921c34bb717a4691d89c6ce8dd6964f182097f6a0ea187df455e3f62a5c
|
3 |
+
size 323888
|
neuronxcc-2.14.213.0+013d129b/MODULE_2f46e3e3a9cc37a9f386+2c2d707e/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1cc63b96da126818f2442e0505ee541c3ce21fa1eee53458cc273db24ef8e943
|
3 |
+
size 2448384
|
neuronxcc-2.14.213.0+013d129b/MODULE_33719efab65aba8971de+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.14.213.0+013d129b/MODULE_33719efab65aba8971de+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:79f9714a849abc7a81c860cd24be5de76ad7c037cc74d9c2a225804e0c55e069
|
3 |
+
size 266465
|
neuronxcc-2.14.213.0+013d129b/MODULE_33719efab65aba8971de+2c2d707e/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dcc2d5e4d5e98e43f31d9dd1d7ce01fbca9e7858994f586e81669cba0094a10a
|
3 |
+
size 3830784
|
neuronxcc-2.14.213.0+013d129b/MODULE_345116edd09879b7ebe4+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.14.213.0+013d129b/MODULE_345116edd09879b7ebe4+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2ae6fb8fd3c66e17e30fe2e19e2f8b2a8ae8f85d02519fb10b586606a9587c83
|
3 |
+
size 360718
|
neuronxcc-2.14.213.0+013d129b/MODULE_345116edd09879b7ebe4+2c2d707e/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a8b44ab0897f8d69f01746b53dac24042f0a1d2ef8ae347618dd722c0b23b1e1
|
3 |
+
size 10875904
|