Synchronizing local compiler cache.
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +40 -0
- neuronxcc-2.15.143.0+e39249ad/0_REGISTRY/0.0.27.dev0/inference/qwen2/Qwen/Qwen2.5-0.5B/6d0af0ea85413b9a8bc4.json +1 -0
- neuronxcc-2.15.143.0+e39249ad/0_REGISTRY/0.0.27.dev0/inference/qwen2/Qwen/Qwen2.5-0.5B/f404b6bcd5e4c946681b.json +1 -0
- neuronxcc-2.15.143.0+e39249ad/0_REGISTRY/0.0.27.dev0/inference/qwen2/Qwen/Qwen2.5-72B-Instruct/058a352bb7d4c0e8af68.json +1 -0
- neuronxcc-2.15.143.0+e39249ad/0_REGISTRY/0.0.27.dev0/inference/qwen2/Qwen/Qwen2.5-72B-Instruct/090bc30b9eaa90b56de8.json +1 -0
- neuronxcc-2.15.143.0+e39249ad/0_REGISTRY/0.0.27.dev0/inference/qwen2/Qwen/Qwen2.5-72B-Instruct/355ef61d7e21c9ca4dfd.json +1 -0
- neuronxcc-2.15.143.0+e39249ad/0_REGISTRY/0.0.27.dev0/inference/qwen2/Qwen/Qwen2.5-72B-Instruct/5feb3df570ed48ce4ef9.json +1 -0
- neuronxcc-2.15.143.0+e39249ad/0_REGISTRY/0.0.27.dev0/inference/qwen2/Qwen/Qwen2.5-72B-Instruct/62d648e67c1df9861c81.json +1 -0
- neuronxcc-2.15.143.0+e39249ad/0_REGISTRY/0.0.27.dev0/inference/qwen2/Qwen/Qwen2.5-72B-Instruct/b0090f8c5a66f58c402e.json +1 -0
- neuronxcc-2.15.143.0+e39249ad/0_REGISTRY/0.0.27.dev0/inference/qwen2/Qwen/Qwen2.5-Math-7B-Instruct/73abe935a165dd5a8d7d.json +1 -0
- neuronxcc-2.15.143.0+e39249ad/MODULE_025073d88f6dec21a13d+39f12043/compile_flags.json +1 -0
- neuronxcc-2.15.143.0+e39249ad/MODULE_025073d88f6dec21a13d+39f12043/model.done +0 -0
- neuronxcc-2.15.143.0+e39249ad/MODULE_025073d88f6dec21a13d+39f12043/model.hlo_module.pb +3 -0
- neuronxcc-2.15.143.0+e39249ad/MODULE_025073d88f6dec21a13d+39f12043/model.neff +0 -0
- neuronxcc-2.15.143.0+e39249ad/MODULE_10d128cdbda38f2dd83b+39f12043/compile_flags.json +1 -0
- neuronxcc-2.15.143.0+e39249ad/MODULE_10d128cdbda38f2dd83b+39f12043/model.done +0 -0
- neuronxcc-2.15.143.0+e39249ad/MODULE_10d128cdbda38f2dd83b+39f12043/model.hlo_module.pb +3 -0
- neuronxcc-2.15.143.0+e39249ad/MODULE_10d128cdbda38f2dd83b+39f12043/model.neff +0 -0
- neuronxcc-2.15.143.0+e39249ad/MODULE_19508710902bacc178f4+39f12043/compile_flags.json +1 -0
- neuronxcc-2.15.143.0+e39249ad/MODULE_19508710902bacc178f4+39f12043/model.done +0 -0
- neuronxcc-2.15.143.0+e39249ad/MODULE_19508710902bacc178f4+39f12043/model.hlo_module.pb +3 -0
- neuronxcc-2.15.143.0+e39249ad/MODULE_19508710902bacc178f4+39f12043/model.neff +3 -0
- neuronxcc-2.15.143.0+e39249ad/MODULE_26a5181917a99c6440c2+39f12043/compile_flags.json +1 -0
- neuronxcc-2.15.143.0+e39249ad/MODULE_26a5181917a99c6440c2+39f12043/model.done +0 -0
- neuronxcc-2.15.143.0+e39249ad/MODULE_26a5181917a99c6440c2+39f12043/model.hlo_module.pb +3 -0
- neuronxcc-2.15.143.0+e39249ad/MODULE_26a5181917a99c6440c2+39f12043/model.neff +3 -0
- neuronxcc-2.15.143.0+e39249ad/MODULE_348cd8119f4a5353ee24+39f12043/compile_flags.json +1 -0
- neuronxcc-2.15.143.0+e39249ad/MODULE_348cd8119f4a5353ee24+39f12043/model.done +0 -0
- neuronxcc-2.15.143.0+e39249ad/MODULE_348cd8119f4a5353ee24+39f12043/model.hlo_module.pb +3 -0
- neuronxcc-2.15.143.0+e39249ad/MODULE_348cd8119f4a5353ee24+39f12043/model.neff +3 -0
- neuronxcc-2.15.143.0+e39249ad/MODULE_38e952fa2492adf691ff+39f12043/compile_flags.json +1 -0
- neuronxcc-2.15.143.0+e39249ad/MODULE_38e952fa2492adf691ff+39f12043/model.done +0 -0
- neuronxcc-2.15.143.0+e39249ad/MODULE_38e952fa2492adf691ff+39f12043/model.hlo_module.pb +3 -0
- neuronxcc-2.15.143.0+e39249ad/MODULE_38e952fa2492adf691ff+39f12043/model.neff +3 -0
- neuronxcc-2.15.143.0+e39249ad/MODULE_445d572321d7551de96d+39f12043/compile_flags.json +1 -0
- neuronxcc-2.15.143.0+e39249ad/MODULE_445d572321d7551de96d+39f12043/model.done +0 -0
- neuronxcc-2.15.143.0+e39249ad/MODULE_445d572321d7551de96d+39f12043/model.hlo_module.pb +3 -0
- neuronxcc-2.15.143.0+e39249ad/MODULE_445d572321d7551de96d+39f12043/model.neff +3 -0
- neuronxcc-2.15.143.0+e39249ad/MODULE_4d076c0c56a5768c4069+39f12043/compile_flags.json +1 -0
- neuronxcc-2.15.143.0+e39249ad/MODULE_4d076c0c56a5768c4069+39f12043/model.done +0 -0
- neuronxcc-2.15.143.0+e39249ad/MODULE_4d076c0c56a5768c4069+39f12043/model.hlo_module.pb +3 -0
- neuronxcc-2.15.143.0+e39249ad/MODULE_4d076c0c56a5768c4069+39f12043/model.neff +3 -0
- neuronxcc-2.15.143.0+e39249ad/MODULE_5263f71385ed4e05d605+39f12043/compile_flags.json +1 -0
- neuronxcc-2.15.143.0+e39249ad/MODULE_5263f71385ed4e05d605+39f12043/model.done +0 -0
- neuronxcc-2.15.143.0+e39249ad/MODULE_5263f71385ed4e05d605+39f12043/model.hlo_module.pb +3 -0
- neuronxcc-2.15.143.0+e39249ad/MODULE_5263f71385ed4e05d605+39f12043/model.neff +3 -0
- neuronxcc-2.15.143.0+e39249ad/MODULE_5425d7325a97f7a4932e+39f12043/compile_flags.json +1 -0
- neuronxcc-2.15.143.0+e39249ad/MODULE_5425d7325a97f7a4932e+39f12043/model.done +0 -0
- neuronxcc-2.15.143.0+e39249ad/MODULE_5425d7325a97f7a4932e+39f12043/model.hlo_module.pb +3 -0
- neuronxcc-2.15.143.0+e39249ad/MODULE_5425d7325a97f7a4932e+39f12043/model.neff +3 -0
.gitattributes
CHANGED
@@ -6328,3 +6328,43 @@ neuronxcc-2.15.143.0+e39249ad/MODULE_05d8ecae48e91ee8980d/text_encoder_2/model.n
|
|
6328 |
neuronxcc-2.15.143.0+e39249ad/MODULE_05d8ecae48e91ee8980d/unet/model.neuron filter=lfs diff=lfs merge=lfs -text
|
6329 |
neuronxcc-2.15.143.0+e39249ad/MODULE_05d8ecae48e91ee8980d/vae_decoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
6330 |
neuronxcc-2.15.143.0+e39249ad/MODULE_05d8ecae48e91ee8980d/vae_encoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
6328 |
neuronxcc-2.15.143.0+e39249ad/MODULE_05d8ecae48e91ee8980d/unet/model.neuron filter=lfs diff=lfs merge=lfs -text
|
6329 |
neuronxcc-2.15.143.0+e39249ad/MODULE_05d8ecae48e91ee8980d/vae_decoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
6330 |
neuronxcc-2.15.143.0+e39249ad/MODULE_05d8ecae48e91ee8980d/vae_encoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
6331 |
+
neuronxcc-2.15.143.0+e39249ad/MODULE_19508710902bacc178f4+39f12043/model.neff filter=lfs diff=lfs merge=lfs -text
|
6332 |
+
neuronxcc-2.15.143.0+e39249ad/MODULE_26a5181917a99c6440c2+39f12043/model.neff filter=lfs diff=lfs merge=lfs -text
|
6333 |
+
neuronxcc-2.15.143.0+e39249ad/MODULE_348cd8119f4a5353ee24+39f12043/model.neff filter=lfs diff=lfs merge=lfs -text
|
6334 |
+
neuronxcc-2.15.143.0+e39249ad/MODULE_38e952fa2492adf691ff+39f12043/model.neff filter=lfs diff=lfs merge=lfs -text
|
6335 |
+
neuronxcc-2.15.143.0+e39249ad/MODULE_445d572321d7551de96d+39f12043/model.neff filter=lfs diff=lfs merge=lfs -text
|
6336 |
+
neuronxcc-2.15.143.0+e39249ad/MODULE_4d076c0c56a5768c4069+39f12043/model.neff filter=lfs diff=lfs merge=lfs -text
|
6337 |
+
neuronxcc-2.15.143.0+e39249ad/MODULE_5263f71385ed4e05d605+39f12043/model.neff filter=lfs diff=lfs merge=lfs -text
|
6338 |
+
neuronxcc-2.15.143.0+e39249ad/MODULE_5425d7325a97f7a4932e+39f12043/model.neff filter=lfs diff=lfs merge=lfs -text
|
6339 |
+
neuronxcc-2.15.143.0+e39249ad/MODULE_577ca4a419d665365921+39f12043/model.neff filter=lfs diff=lfs merge=lfs -text
|
6340 |
+
neuronxcc-2.15.143.0+e39249ad/MODULE_5bba44dbf59b43b3d1f0+39f12043/model.neff filter=lfs diff=lfs merge=lfs -text
|
6341 |
+
neuronxcc-2.15.143.0+e39249ad/MODULE_5c88ac7fb93085af9c2b+39f12043/model.neff filter=lfs diff=lfs merge=lfs -text
|
6342 |
+
neuronxcc-2.15.143.0+e39249ad/MODULE_6158c090f65032e00f74+39f12043/model.neff filter=lfs diff=lfs merge=lfs -text
|
6343 |
+
neuronxcc-2.15.143.0+e39249ad/MODULE_62d7bdfdb721536bb071+39f12043/model.neff filter=lfs diff=lfs merge=lfs -text
|
6344 |
+
neuronxcc-2.15.143.0+e39249ad/MODULE_6402a35ae65f70f2e6b3+39f12043/model.neff filter=lfs diff=lfs merge=lfs -text
|
6345 |
+
neuronxcc-2.15.143.0+e39249ad/MODULE_66477408e960f0ab49ba+39f12043/model.neff filter=lfs diff=lfs merge=lfs -text
|
6346 |
+
neuronxcc-2.15.143.0+e39249ad/MODULE_6e446bc9fb621acf17ec+39f12043/model.neff filter=lfs diff=lfs merge=lfs -text
|
6347 |
+
neuronxcc-2.15.143.0+e39249ad/MODULE_7df64ced3de7c4dfd196+39f12043/model.neff filter=lfs diff=lfs merge=lfs -text
|
6348 |
+
neuronxcc-2.15.143.0+e39249ad/MODULE_7dff79b209c4936eccf6+39f12043/model.neff filter=lfs diff=lfs merge=lfs -text
|
6349 |
+
neuronxcc-2.15.143.0+e39249ad/MODULE_7f495f1e5eab37e231f8+39f12043/model.neff filter=lfs diff=lfs merge=lfs -text
|
6350 |
+
neuronxcc-2.15.143.0+e39249ad/MODULE_822748c7e4759c0698fc+39f12043/model.neff filter=lfs diff=lfs merge=lfs -text
|
6351 |
+
neuronxcc-2.15.143.0+e39249ad/MODULE_8568ef054dcab0a881e6+39f12043/model.neff filter=lfs diff=lfs merge=lfs -text
|
6352 |
+
neuronxcc-2.15.143.0+e39249ad/MODULE_8d073502ce4185d60215+39f12043/model.neff filter=lfs diff=lfs merge=lfs -text
|
6353 |
+
neuronxcc-2.15.143.0+e39249ad/MODULE_8eb7c7f43b1ddb9995d7+39f12043/model.neff filter=lfs diff=lfs merge=lfs -text
|
6354 |
+
neuronxcc-2.15.143.0+e39249ad/MODULE_98773a4d5b572f0b4e19+39f12043/model.neff filter=lfs diff=lfs merge=lfs -text
|
6355 |
+
neuronxcc-2.15.143.0+e39249ad/MODULE_9bf7d4560f134fd504aa+39f12043/model.neff filter=lfs diff=lfs merge=lfs -text
|
6356 |
+
neuronxcc-2.15.143.0+e39249ad/MODULE_9c3a05bace15af5d38e1+39f12043/model.neff filter=lfs diff=lfs merge=lfs -text
|
6357 |
+
neuronxcc-2.15.143.0+e39249ad/MODULE_aa16542849c94822cf60+39f12043/model.neff filter=lfs diff=lfs merge=lfs -text
|
6358 |
+
neuronxcc-2.15.143.0+e39249ad/MODULE_addf3ee88910c0f4f81e+39f12043/model.neff filter=lfs diff=lfs merge=lfs -text
|
6359 |
+
neuronxcc-2.15.143.0+e39249ad/MODULE_b6d1e63d522c57afb5b8+39f12043/model.neff filter=lfs diff=lfs merge=lfs -text
|
6360 |
+
neuronxcc-2.15.143.0+e39249ad/MODULE_bcd777280ee4ee0105a8+39f12043/model.neff filter=lfs diff=lfs merge=lfs -text
|
6361 |
+
neuronxcc-2.15.143.0+e39249ad/MODULE_c59ef31c53c35de18bfa+39f12043/model.neff filter=lfs diff=lfs merge=lfs -text
|
6362 |
+
neuronxcc-2.15.143.0+e39249ad/MODULE_d3c5967570c46d6191a9+39f12043/model.neff filter=lfs diff=lfs merge=lfs -text
|
6363 |
+
neuronxcc-2.15.143.0+e39249ad/MODULE_d71ff4a9a47bb2779232+39f12043/model.neff filter=lfs diff=lfs merge=lfs -text
|
6364 |
+
neuronxcc-2.15.143.0+e39249ad/MODULE_e00e29076f606df4175f+39f12043/model.neff filter=lfs diff=lfs merge=lfs -text
|
6365 |
+
neuronxcc-2.15.143.0+e39249ad/MODULE_e02f71073a5bbd82b90b+39f12043/model.neff filter=lfs diff=lfs merge=lfs -text
|
6366 |
+
neuronxcc-2.15.143.0+e39249ad/MODULE_e63ec966f940f9aac5ed+39f12043/model.neff filter=lfs diff=lfs merge=lfs -text
|
6367 |
+
neuronxcc-2.15.143.0+e39249ad/MODULE_eae3a509248ee092e093+39f12043/model.neff filter=lfs diff=lfs merge=lfs -text
|
6368 |
+
neuronxcc-2.15.143.0+e39249ad/MODULE_f4cf938415821e326a97+39f12043/model.neff filter=lfs diff=lfs merge=lfs -text
|
6369 |
+
neuronxcc-2.15.143.0+e39249ad/MODULE_f7f5761cfc68a7c66eb3+39f12043/model.neff filter=lfs diff=lfs merge=lfs -text
|
6370 |
+
neuronxcc-2.15.143.0+e39249ad/MODULE_fbc0c1dcbdfb5e889d3e+39f12043/model.neff filter=lfs diff=lfs merge=lfs -text
|
neuronxcc-2.15.143.0+e39249ad/0_REGISTRY/0.0.27.dev0/inference/qwen2/Qwen/Qwen2.5-0.5B/6d0af0ea85413b9a8bc4.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"architectures": ["Qwen2ForCausalLM"], "attention_dropout": 0.0, "bos_token_id": 151643, "eos_token_id": 151643, "hidden_act": "silu", "hidden_size": 896, "initializer_range": 0.02, "intermediate_size": 4864, "max_position_embeddings": 32768, "max_window_layers": 24, "model_type": "qwen2", "neuron": {"auto_cast_type": "fp16", "batch_size": 1, "checkpoint_id": "Qwen/Qwen2.5-0.5B", "checkpoint_revision": "060db6499f32faf8b98477b0a26969ef7d8b9987", "compiler_type": "neuronx-cc", "compiler_version": "2.15.143.0+e39249ad", "num_cores": 2, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 14, "num_hidden_layers": 24, "num_key_value_heads": 2, "rms_norm_eps": 1e-06, "rope_theta": 1000000.0, "sliding_window": null, "tie_word_embeddings": true, "torch_dtype": "bfloat16", "use_cache": true, "use_mrope": false, "use_sliding_window": false, "vocab_size": 151936}
|
neuronxcc-2.15.143.0+e39249ad/0_REGISTRY/0.0.27.dev0/inference/qwen2/Qwen/Qwen2.5-0.5B/f404b6bcd5e4c946681b.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"architectures": ["Qwen2ForCausalLM"], "attention_dropout": 0.0, "bos_token_id": 151643, "eos_token_id": 151643, "hidden_act": "silu", "hidden_size": 896, "initializer_range": 0.02, "intermediate_size": 4864, "max_position_embeddings": 32768, "max_window_layers": 24, "model_type": "qwen2", "neuron": {"auto_cast_type": "fp16", "batch_size": 4, "checkpoint_id": "Qwen/Qwen2.5-0.5B", "checkpoint_revision": "060db6499f32faf8b98477b0a26969ef7d8b9987", "compiler_type": "neuronx-cc", "compiler_version": "2.15.143.0+e39249ad", "num_cores": 2, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 14, "num_hidden_layers": 24, "num_key_value_heads": 2, "rms_norm_eps": 1e-06, "rope_theta": 1000000.0, "sliding_window": null, "tie_word_embeddings": true, "torch_dtype": "bfloat16", "use_cache": true, "use_mrope": false, "use_sliding_window": false, "vocab_size": 151936}
|
neuronxcc-2.15.143.0+e39249ad/0_REGISTRY/0.0.27.dev0/inference/qwen2/Qwen/Qwen2.5-72B-Instruct/058a352bb7d4c0e8af68.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"architectures": ["Qwen2ForCausalLM"], "attention_dropout": 0.0, "bos_token_id": 151643, "eos_token_id": 151645, "hidden_act": "silu", "hidden_size": 8192, "initializer_range": 0.02, "intermediate_size": 29568, "max_position_embeddings": 32768, "max_window_layers": 70, "model_type": "qwen2", "neuron": {"auto_cast_type": "bf16", "batch_size": 1, "checkpoint_id": "Qwen/Qwen2.5-72B-Instruct", "checkpoint_revision": "d3d951150c1e5848237cd6a7ad11df4836aee842", "compiler_type": "neuronx-cc", "compiler_version": "2.15.143.0+e39249ad", "num_cores": 24, "sequence_length": 32768, "task": "text-generation"}, "num_attention_heads": 64, "num_hidden_layers": 80, "num_key_value_heads": 8, "rms_norm_eps": 1e-06, "rope_theta": 1000000.0, "sliding_window": null, "tie_word_embeddings": false, "torch_dtype": "bfloat16", "use_cache": true, "use_sliding_window": false, "vocab_size": 152064}
|
neuronxcc-2.15.143.0+e39249ad/0_REGISTRY/0.0.27.dev0/inference/qwen2/Qwen/Qwen2.5-72B-Instruct/090bc30b9eaa90b56de8.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"architectures": ["Qwen2ForCausalLM"], "attention_dropout": 0.0, "bos_token_id": 151643, "eos_token_id": 151645, "hidden_act": "silu", "hidden_size": 8192, "initializer_range": 0.02, "intermediate_size": 29568, "max_position_embeddings": 32768, "max_window_layers": 70, "model_type": "qwen2", "neuron": {"auto_cast_type": "bf16", "batch_size": 4, "checkpoint_id": "Qwen/Qwen2.5-72B-Instruct", "checkpoint_revision": "d3d951150c1e5848237cd6a7ad11df4836aee842", "compiler_type": "neuronx-cc", "compiler_version": "2.15.143.0+e39249ad", "num_cores": 24, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 64, "num_hidden_layers": 80, "num_key_value_heads": 8, "rms_norm_eps": 1e-06, "rope_theta": 1000000.0, "sliding_window": null, "tie_word_embeddings": false, "torch_dtype": "bfloat16", "use_cache": true, "use_sliding_window": false, "vocab_size": 152064}
|
neuronxcc-2.15.143.0+e39249ad/0_REGISTRY/0.0.27.dev0/inference/qwen2/Qwen/Qwen2.5-72B-Instruct/355ef61d7e21c9ca4dfd.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"architectures": ["Qwen2ForCausalLM"], "attention_dropout": 0.0, "bos_token_id": 151643, "eos_token_id": 151645, "hidden_act": "silu", "hidden_size": 8192, "initializer_range": 0.02, "intermediate_size": 29568, "max_position_embeddings": 32768, "max_window_layers": 70, "model_type": "qwen2", "neuron": {"auto_cast_type": "bf16", "batch_size": 4, "checkpoint_id": "Qwen/Qwen2.5-72B-Instruct", "checkpoint_revision": "d3d951150c1e5848237cd6a7ad11df4836aee842", "compiler_type": "neuronx-cc", "compiler_version": "2.15.143.0+e39249ad", "num_cores": 24, "sequence_length": 32768, "task": "text-generation"}, "num_attention_heads": 64, "num_hidden_layers": 80, "num_key_value_heads": 8, "rms_norm_eps": 1e-06, "rope_theta": 1000000.0, "sliding_window": null, "tie_word_embeddings": false, "torch_dtype": "bfloat16", "use_cache": true, "use_sliding_window": false, "vocab_size": 152064}
|
neuronxcc-2.15.143.0+e39249ad/0_REGISTRY/0.0.27.dev0/inference/qwen2/Qwen/Qwen2.5-72B-Instruct/5feb3df570ed48ce4ef9.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"architectures": ["Qwen2ForCausalLM"], "attention_dropout": 0.0, "bos_token_id": 151643, "eos_token_id": 151645, "hidden_act": "silu", "hidden_size": 8192, "initializer_range": 0.02, "intermediate_size": 29568, "max_position_embeddings": 32768, "max_window_layers": 70, "model_type": "qwen2", "neuron": {"auto_cast_type": "bf16", "batch_size": 1, "checkpoint_id": "Qwen/Qwen2.5-72B-Instruct", "checkpoint_revision": "d3d951150c1e5848237cd6a7ad11df4836aee842", "compiler_type": "neuronx-cc", "compiler_version": "2.15.143.0+e39249ad", "num_cores": 24, "sequence_length": 2048, "task": "text-generation"}, "num_attention_heads": 64, "num_hidden_layers": 80, "num_key_value_heads": 8, "rms_norm_eps": 1e-06, "rope_theta": 1000000.0, "sliding_window": null, "tie_word_embeddings": false, "torch_dtype": "bfloat16", "use_cache": true, "use_sliding_window": false, "vocab_size": 152064}
|
neuronxcc-2.15.143.0+e39249ad/0_REGISTRY/0.0.27.dev0/inference/qwen2/Qwen/Qwen2.5-72B-Instruct/62d648e67c1df9861c81.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"architectures": ["Qwen2ForCausalLM"], "attention_dropout": 0.0, "bos_token_id": 151643, "eos_token_id": 151645, "hidden_act": "silu", "hidden_size": 8192, "initializer_range": 0.02, "intermediate_size": 29568, "max_position_embeddings": 32768, "max_window_layers": 70, "model_type": "qwen2", "neuron": {"auto_cast_type": "bf16", "batch_size": 1, "checkpoint_id": "Qwen/Qwen2.5-72B-Instruct", "checkpoint_revision": "d3d951150c1e5848237cd6a7ad11df4836aee842", "compiler_type": "neuronx-cc", "compiler_version": "2.15.143.0+e39249ad", "num_cores": 24, "sequence_length": 3072, "task": "text-generation"}, "num_attention_heads": 64, "num_hidden_layers": 80, "num_key_value_heads": 8, "rms_norm_eps": 1e-06, "rope_theta": 1000000.0, "sliding_window": null, "tie_word_embeddings": false, "torch_dtype": "bfloat16", "use_cache": true, "use_sliding_window": false, "vocab_size": 152064}
|
neuronxcc-2.15.143.0+e39249ad/0_REGISTRY/0.0.27.dev0/inference/qwen2/Qwen/Qwen2.5-72B-Instruct/b0090f8c5a66f58c402e.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"architectures": ["Qwen2ForCausalLM"], "attention_dropout": 0.0, "bos_token_id": 151643, "eos_token_id": 151645, "hidden_act": "silu", "hidden_size": 8192, "initializer_range": 0.02, "intermediate_size": 29568, "max_position_embeddings": 32768, "max_window_layers": 70, "model_type": "qwen2", "neuron": {"auto_cast_type": "bf16", "batch_size": 4, "checkpoint_id": "Qwen/Qwen2.5-72B-Instruct", "checkpoint_revision": "d3d951150c1e5848237cd6a7ad11df4836aee842", "compiler_type": "neuronx-cc", "compiler_version": "2.15.143.0+e39249ad", "num_cores": 24, "sequence_length": 3072, "task": "text-generation"}, "num_attention_heads": 64, "num_hidden_layers": 80, "num_key_value_heads": 8, "rms_norm_eps": 1e-06, "rope_theta": 1000000.0, "sliding_window": null, "tie_word_embeddings": false, "torch_dtype": "bfloat16", "use_cache": true, "use_sliding_window": false, "vocab_size": 152064}
|
neuronxcc-2.15.143.0+e39249ad/0_REGISTRY/0.0.27.dev0/inference/qwen2/Qwen/Qwen2.5-Math-7B-Instruct/73abe935a165dd5a8d7d.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"architectures": ["Qwen2ForCausalLM"], "attention_dropout": 0.0, "bos_token_id": 151643, "eos_token_id": 151645, "hidden_act": "silu", "hidden_size": 3584, "initializer_range": 0.02, "intermediate_size": 18944, "max_position_embeddings": 4096, "max_window_layers": 28, "model_type": "qwen2", "neuron": {"auto_cast_type": "bf16", "batch_size": 32, "checkpoint_id": "Qwen/Qwen2.5-Math-7B-Instruct", "checkpoint_revision": "ef9926d75ab1d54532f6a30dd5e760355eb9aa4d", "compiler_type": "neuronx-cc", "compiler_version": "2.15.143.0+e39249ad", "num_cores": 24, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 28, "num_hidden_layers": 28, "num_key_value_heads": 4, "rms_norm_eps": 1e-06, "rope_theta": 10000.0, "sliding_window": null, "tie_word_embeddings": false, "torch_dtype": "bfloat16", "use_cache": true, "use_sliding_window": false, "vocab_size": 152064}
|
neuronxcc-2.15.143.0+e39249ad/MODULE_025073d88f6dec21a13d+39f12043/compile_flags.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
["--model-type=transformer", "--auto-cast=none", "--execute-repetition=1"]
|
neuronxcc-2.15.143.0+e39249ad/MODULE_025073d88f6dec21a13d+39f12043/model.done
ADDED
File without changes
|
neuronxcc-2.15.143.0+e39249ad/MODULE_025073d88f6dec21a13d+39f12043/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5f38e8a8f69d59558c745da4a1098dd0e0deba005bf77c0c86dbdfea6d57d2fc
|
3 |
+
size 278705
|
neuronxcc-2.15.143.0+e39249ad/MODULE_025073d88f6dec21a13d+39f12043/model.neff
ADDED
Binary file (933 kB). View file
|
|
neuronxcc-2.15.143.0+e39249ad/MODULE_10d128cdbda38f2dd83b+39f12043/compile_flags.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
["--model-type=transformer", "--auto-cast=none", "--execute-repetition=1"]
|
neuronxcc-2.15.143.0+e39249ad/MODULE_10d128cdbda38f2dd83b+39f12043/model.done
ADDED
File without changes
|
neuronxcc-2.15.143.0+e39249ad/MODULE_10d128cdbda38f2dd83b+39f12043/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:87def0ac88d7df6d6719764216a6a002a9018794b5ac82665fe9246a4a235da3
|
3 |
+
size 278705
|
neuronxcc-2.15.143.0+e39249ad/MODULE_10d128cdbda38f2dd83b+39f12043/model.neff
ADDED
Binary file (871 kB). View file
|
|
neuronxcc-2.15.143.0+e39249ad/MODULE_19508710902bacc178f4+39f12043/compile_flags.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
["--model-type=transformer", "--auto-cast=none", "--execute-repetition=1"]
|
neuronxcc-2.15.143.0+e39249ad/MODULE_19508710902bacc178f4+39f12043/model.done
ADDED
File without changes
|
neuronxcc-2.15.143.0+e39249ad/MODULE_19508710902bacc178f4+39f12043/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5042d5b8fa959d76f07f22ee5b51e4f24a4aac185d8c50bc69d5b5353ef72ed8
|
3 |
+
size 941713
|
neuronxcc-2.15.143.0+e39249ad/MODULE_19508710902bacc178f4+39f12043/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:247762813c5117bec51730858c274d65c69391e160996400fa08775ab24e1a52
|
3 |
+
size 8193024
|
neuronxcc-2.15.143.0+e39249ad/MODULE_26a5181917a99c6440c2+39f12043/compile_flags.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
["--model-type=transformer", "--auto-cast=none", "--execute-repetition=1"]
|
neuronxcc-2.15.143.0+e39249ad/MODULE_26a5181917a99c6440c2+39f12043/model.done
ADDED
File without changes
|
neuronxcc-2.15.143.0+e39249ad/MODULE_26a5181917a99c6440c2+39f12043/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:62c3aa4f33a1233cb66b53cbaaf2f048c2ef4eaf7f6463ed72ce465fd541f904
|
3 |
+
size 750092
|
neuronxcc-2.15.143.0+e39249ad/MODULE_26a5181917a99c6440c2+39f12043/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a572f08d4c78811520f290a62842fd48fb4a48c7aab513acbe9ccbce735fa791
|
3 |
+
size 1035264
|
neuronxcc-2.15.143.0+e39249ad/MODULE_348cd8119f4a5353ee24+39f12043/compile_flags.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
["--model-type=transformer", "--auto-cast=none", "--execute-repetition=1"]
|
neuronxcc-2.15.143.0+e39249ad/MODULE_348cd8119f4a5353ee24+39f12043/model.done
ADDED
File without changes
|
neuronxcc-2.15.143.0+e39249ad/MODULE_348cd8119f4a5353ee24+39f12043/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d3e114cec205798df7ef944feb91491edd02bb78dd79a897634586c0f9331bda
|
3 |
+
size 222784
|
neuronxcc-2.15.143.0+e39249ad/MODULE_348cd8119f4a5353ee24+39f12043/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:53c9b579b20763b43eec1672b0fbbb7342c9f7d2e9f1e222d8a852da03edddd8
|
3 |
+
size 1065984
|
neuronxcc-2.15.143.0+e39249ad/MODULE_38e952fa2492adf691ff+39f12043/compile_flags.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
["--model-type=transformer", "--auto-cast=none", "--execute-repetition=1"]
|
neuronxcc-2.15.143.0+e39249ad/MODULE_38e952fa2492adf691ff+39f12043/model.done
ADDED
File without changes
|
neuronxcc-2.15.143.0+e39249ad/MODULE_38e952fa2492adf691ff+39f12043/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a5a832ec2310116b1861f678414c4e5aba7f8fa047b95948989bdf0a8360841d
|
3 |
+
size 941713
|
neuronxcc-2.15.143.0+e39249ad/MODULE_38e952fa2492adf691ff+39f12043/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:53b3f3f60a02b5e71983eca5219119523d804fd87ebe0ae094e50f381cc4007c
|
3 |
+
size 8295424
|
neuronxcc-2.15.143.0+e39249ad/MODULE_445d572321d7551de96d+39f12043/compile_flags.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
["--model-type=transformer", "--auto-cast=none", "--execute-repetition=1"]
|
neuronxcc-2.15.143.0+e39249ad/MODULE_445d572321d7551de96d+39f12043/model.done
ADDED
File without changes
|
neuronxcc-2.15.143.0+e39249ad/MODULE_445d572321d7551de96d+39f12043/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:457905e0cb64161cbcae2504ca770c64ae2922a38ff31fd31df5eb0220c6963a
|
3 |
+
size 750092
|
neuronxcc-2.15.143.0+e39249ad/MODULE_445d572321d7551de96d+39f12043/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:67ccd6801d7df38b0454752e6a6b96e0a197714123d6b6ade61c7aac511a69c4
|
3 |
+
size 9227264
|
neuronxcc-2.15.143.0+e39249ad/MODULE_4d076c0c56a5768c4069+39f12043/compile_flags.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
["--model-type=transformer", "--auto-cast=none", "--execute-repetition=1"]
|
neuronxcc-2.15.143.0+e39249ad/MODULE_4d076c0c56a5768c4069+39f12043/model.done
ADDED
File without changes
|
neuronxcc-2.15.143.0+e39249ad/MODULE_4d076c0c56a5768c4069+39f12043/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f72711846367f071f3aad88c865e284b58148912b47602dc2ccbf4d249e5fdbf
|
3 |
+
size 750092
|
neuronxcc-2.15.143.0+e39249ad/MODULE_4d076c0c56a5768c4069+39f12043/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d19c5c00fc234b52105480c9094e53c8612e9fe0f6da06cc015e124d49029705
|
3 |
+
size 10589184
|
neuronxcc-2.15.143.0+e39249ad/MODULE_5263f71385ed4e05d605+39f12043/compile_flags.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
["--model-type=transformer", "--auto-cast=none", "--execute-repetition=1"]
|
neuronxcc-2.15.143.0+e39249ad/MODULE_5263f71385ed4e05d605+39f12043/model.done
ADDED
File without changes
|
neuronxcc-2.15.143.0+e39249ad/MODULE_5263f71385ed4e05d605+39f12043/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:928c2207ec03af54038c3456aaecda6fe647be9f7cd2d1d2b63be8a5c55069cb
|
3 |
+
size 1103969
|
neuronxcc-2.15.143.0+e39249ad/MODULE_5263f71385ed4e05d605+39f12043/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3b16e17c52195e71e68e8f5711d5ca933f9a414410d4d3b60d79a1916ec3e46c
|
3 |
+
size 5479424
|
neuronxcc-2.15.143.0+e39249ad/MODULE_5425d7325a97f7a4932e+39f12043/compile_flags.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
["--model-type=transformer", "--auto-cast=none", "--execute-repetition=1"]
|
neuronxcc-2.15.143.0+e39249ad/MODULE_5425d7325a97f7a4932e+39f12043/model.done
ADDED
File without changes
|
neuronxcc-2.15.143.0+e39249ad/MODULE_5425d7325a97f7a4932e+39f12043/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fd49b5e7ee2ad050dc5217983f71e0f327853c563ac71e4712822c4a471f1488
|
3 |
+
size 941713
|
neuronxcc-2.15.143.0+e39249ad/MODULE_5425d7325a97f7a4932e+39f12043/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:73f4dca6c5b0d30e15da1037f4cf8723f83549722deee4ed9d86b853e719559c
|
3 |
+
size 7957504
|