dacorvo HF Staff committed on
Commit
ba566e9
·
verified ·
1 Parent(s): 36e3909

Synchronizing local compiler cache.

Browse files
Files changed (31) hide show
  1. .gitattributes +3 -0
  2. neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.6.dev2/929b02754a13cbfdf657d863c3fc6f3bce672879bc6ae48ab45be21e881e9ec2/a28e46704c048d210631.json +88 -0
  3. neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.6.dev2/qwen3/Qwen/Qwen3-0.6B/a28e46704c048d210631.json +88 -0
  4. neuronxcc-2.21.33363.0+82129205/MODULE_17476209562158013765+e30acd3a/model.neff +0 -0
  5. neuronxcc-2.21.33363.0+82129205/MODULE_5006ac810070ead7ed92+24129607/compile_flags.json +1 -0
  6. neuronxcc-2.21.33363.0+82129205/MODULE_5006ac810070ead7ed92+24129607/model.done +0 -0
  7. neuronxcc-2.21.33363.0+82129205/MODULE_5006ac810070ead7ed92+24129607/model.hlo_module.pb +3 -0
  8. neuronxcc-2.21.33363.0+82129205/MODULE_5006ac810070ead7ed92+24129607/model.neff +3 -0
  9. neuronxcc-2.21.33363.0+82129205/MODULE_9e22b55ec8c0b02cf4ef+28fcbe05/compile_flags.json +1 -0
  10. neuronxcc-2.21.33363.0+82129205/MODULE_9e22b55ec8c0b02cf4ef+28fcbe05/model.done +0 -0
  11. neuronxcc-2.21.33363.0+82129205/MODULE_9e22b55ec8c0b02cf4ef+28fcbe05/model.hlo_module.pb +3 -0
  12. neuronxcc-2.21.33363.0+82129205/MODULE_9e22b55ec8c0b02cf4ef+28fcbe05/model.neff +0 -0
  13. neuronxcc-2.21.33363.0+82129205/MODULE_a1d5b9d5676277a73661+a02c3a36/compile_flags.json +1 -0
  14. neuronxcc-2.21.33363.0+82129205/MODULE_a1d5b9d5676277a73661+a02c3a36/model.done +0 -0
  15. neuronxcc-2.21.33363.0+82129205/MODULE_a1d5b9d5676277a73661+a02c3a36/model.hlo_module.pb +3 -0
  16. neuronxcc-2.21.33363.0+82129205/MODULE_a1d5b9d5676277a73661+a02c3a36/model.neff +3 -0
  17. neuronxcc-2.21.33363.0+82129205/MODULE_a1d5b9d5676277a73661+a02c3a36/wrapped_neff.hlo +3 -0
  18. neuronxcc-2.21.33363.0+82129205/MODULE_ad16674dd3fc5a51c226+a02c3a36/model.neff +1 -1
  19. neuronxcc-2.21.33363.0+82129205/MODULE_ad16674dd3fc5a51c226+a02c3a36/wrapped_neff.hlo +1 -1
  20. neuronxcc-2.21.33363.0+82129205/MODULE_b54a5aa9a7bb0faeb6b1+940786cd/compile_flags.json +1 -0
  21. neuronxcc-2.21.33363.0+82129205/MODULE_b54a5aa9a7bb0faeb6b1+940786cd/model.done +0 -0
  22. neuronxcc-2.21.33363.0+82129205/MODULE_b54a5aa9a7bb0faeb6b1+940786cd/model.hlo_module.pb +3 -0
  23. neuronxcc-2.21.33363.0+82129205/MODULE_b54a5aa9a7bb0faeb6b1+940786cd/model.neff +0 -0
  24. neuronxcc-2.21.33363.0+82129205/MODULE_e79d2ef691b5cd91e631+d4248311/compile_flags.json +1 -0
  25. neuronxcc-2.21.33363.0+82129205/MODULE_e79d2ef691b5cd91e631+d4248311/model.done +0 -0
  26. neuronxcc-2.21.33363.0+82129205/MODULE_e79d2ef691b5cd91e631+d4248311/model.hlo_module.pb +3 -0
  27. neuronxcc-2.21.33363.0+82129205/MODULE_e79d2ef691b5cd91e631+d4248311/model.neff +0 -0
  28. neuronxcc-2.21.33363.0+82129205/MODULE_f1638265f2796bf1b8b8+81944ebb/compile_flags.json +1 -0
  29. neuronxcc-2.21.33363.0+82129205/MODULE_f1638265f2796bf1b8b8+81944ebb/model.done +0 -0
  30. neuronxcc-2.21.33363.0+82129205/MODULE_f1638265f2796bf1b8b8+81944ebb/model.hlo_module.pb +3 -0
  31. neuronxcc-2.21.33363.0+82129205/MODULE_f1638265f2796bf1b8b8+81944ebb/model.neff +0 -0
.gitattributes CHANGED
@@ -7126,3 +7126,6 @@ neuronxcc-2.21.33363.0+82129205/MODULE_5620f0d58954f88c2890+24129607/model.neff
7126
  neuronxcc-2.21.33363.0+82129205/MODULE_4ff804c2533da46e613e+24129607/model.neff filter=lfs diff=lfs merge=lfs -text
7127
  neuronxcc-2.21.33363.0+82129205/MODULE_5742ef8f5910f4e17377+a02c3a36/model.neff filter=lfs diff=lfs merge=lfs -text
7128
  neuronxcc-2.21.33363.0+82129205/MODULE_5742ef8f5910f4e17377+a02c3a36/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text
 
 
 
 
7126
  neuronxcc-2.21.33363.0+82129205/MODULE_4ff804c2533da46e613e+24129607/model.neff filter=lfs diff=lfs merge=lfs -text
7127
  neuronxcc-2.21.33363.0+82129205/MODULE_5742ef8f5910f4e17377+a02c3a36/model.neff filter=lfs diff=lfs merge=lfs -text
7128
  neuronxcc-2.21.33363.0+82129205/MODULE_5742ef8f5910f4e17377+a02c3a36/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text
7129
+ neuronxcc-2.21.33363.0+82129205/MODULE_5006ac810070ead7ed92+24129607/model.neff filter=lfs diff=lfs merge=lfs -text
7130
+ neuronxcc-2.21.33363.0+82129205/MODULE_a1d5b9d5676277a73661+a02c3a36/model.neff filter=lfs diff=lfs merge=lfs -text
7131
+ neuronxcc-2.21.33363.0+82129205/MODULE_a1d5b9d5676277a73661+a02c3a36/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text
neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.6.dev2/929b02754a13cbfdf657d863c3fc6f3bce672879bc6ae48ab45be21e881e9ec2/a28e46704c048d210631.json ADDED
@@ -0,0 +1,88 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_entry_class": "SingleModelCacheEntry",
3
+ "_model_id": "Qwen/Qwen3-0.6B",
4
+ "_task": "text-generation",
5
+ "architectures": [
6
+ "Qwen3ForCausalLM"
7
+ ],
8
+ "attention_bias": false,
9
+ "attention_dropout": 0.0,
10
+ "dtype": "bfloat16",
11
+ "head_dim": 128,
12
+ "hidden_act": "silu",
13
+ "hidden_size": 1024,
14
+ "initializer_range": 0.02,
15
+ "intermediate_size": 3072,
16
+ "layer_types": [
17
+ "full_attention",
18
+ "full_attention",
19
+ "full_attention",
20
+ "full_attention",
21
+ "full_attention",
22
+ "full_attention",
23
+ "full_attention",
24
+ "full_attention",
25
+ "full_attention",
26
+ "full_attention",
27
+ "full_attention",
28
+ "full_attention",
29
+ "full_attention",
30
+ "full_attention",
31
+ "full_attention",
32
+ "full_attention",
33
+ "full_attention",
34
+ "full_attention",
35
+ "full_attention",
36
+ "full_attention",
37
+ "full_attention",
38
+ "full_attention",
39
+ "full_attention",
40
+ "full_attention",
41
+ "full_attention",
42
+ "full_attention",
43
+ "full_attention",
44
+ "full_attention"
45
+ ],
46
+ "max_position_embeddings": 40960,
47
+ "max_window_layers": 28,
48
+ "model_type": "qwen3",
49
+ "neuron": {
50
+ "_serialized_key": "NxDNeuronConfig",
51
+ "batch_size": 4,
52
+ "capacity_factor": null,
53
+ "checkpoint_id": "Qwen/Qwen3-0.6B",
54
+ "checkpoint_revision": "c1899de289a04d12100db370d81485cdf75e47ca",
55
+ "continuous_batching": true,
56
+ "ep_degree": 1,
57
+ "fused_qkv": true,
58
+ "glu_mlp": true,
59
+ "local_ranks_size": 2,
60
+ "max_batch_size": 4,
61
+ "max_context_length": 1024,
62
+ "max_topk": 256,
63
+ "n_active_tokens": 1024,
64
+ "neuronxcc_version": "2.21.33363.0+82129205",
65
+ "on_device_sampling": false,
66
+ "optimum_neuron_version": "0.4.6.dev2",
67
+ "output_logits": false,
68
+ "pp_degree": 1,
69
+ "prefill_chunk_size": 0,
70
+ "sequence_length": 1024,
71
+ "speculation_length": 0,
72
+ "start_rank_id": 0,
73
+ "target": "trn1",
74
+ "torch_dtype": "bfloat16",
75
+ "tp_degree": 2
76
+ },
77
+ "num_attention_heads": 16,
78
+ "num_hidden_layers": 28,
79
+ "num_key_value_heads": 8,
80
+ "rms_norm_eps": 1e-06,
81
+ "rope_scaling": null,
82
+ "rope_theta": 1000000,
83
+ "sliding_window": null,
84
+ "tie_word_embeddings": true,
85
+ "use_cache": true,
86
+ "use_sliding_window": false,
87
+ "vocab_size": 151936
88
+ }
neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.6.dev2/qwen3/Qwen/Qwen3-0.6B/a28e46704c048d210631.json ADDED
@@ -0,0 +1,88 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_entry_class": "SingleModelCacheEntry",
3
+ "_model_id": "Qwen/Qwen3-0.6B",
4
+ "_task": "text-generation",
5
+ "architectures": [
6
+ "Qwen3ForCausalLM"
7
+ ],
8
+ "attention_bias": false,
9
+ "attention_dropout": 0.0,
10
+ "dtype": "bfloat16",
11
+ "head_dim": 128,
12
+ "hidden_act": "silu",
13
+ "hidden_size": 1024,
14
+ "initializer_range": 0.02,
15
+ "intermediate_size": 3072,
16
+ "layer_types": [
17
+ "full_attention",
18
+ "full_attention",
19
+ "full_attention",
20
+ "full_attention",
21
+ "full_attention",
22
+ "full_attention",
23
+ "full_attention",
24
+ "full_attention",
25
+ "full_attention",
26
+ "full_attention",
27
+ "full_attention",
28
+ "full_attention",
29
+ "full_attention",
30
+ "full_attention",
31
+ "full_attention",
32
+ "full_attention",
33
+ "full_attention",
34
+ "full_attention",
35
+ "full_attention",
36
+ "full_attention",
37
+ "full_attention",
38
+ "full_attention",
39
+ "full_attention",
40
+ "full_attention",
41
+ "full_attention",
42
+ "full_attention",
43
+ "full_attention",
44
+ "full_attention"
45
+ ],
46
+ "max_position_embeddings": 40960,
47
+ "max_window_layers": 28,
48
+ "model_type": "qwen3",
49
+ "neuron": {
50
+ "_serialized_key": "NxDNeuronConfig",
51
+ "batch_size": 4,
52
+ "capacity_factor": null,
53
+ "checkpoint_id": "Qwen/Qwen3-0.6B",
54
+ "checkpoint_revision": "c1899de289a04d12100db370d81485cdf75e47ca",
55
+ "continuous_batching": true,
56
+ "ep_degree": 1,
57
+ "fused_qkv": true,
58
+ "glu_mlp": true,
59
+ "local_ranks_size": 2,
60
+ "max_batch_size": 4,
61
+ "max_context_length": 1024,
62
+ "max_topk": 256,
63
+ "n_active_tokens": 1024,
64
+ "neuronxcc_version": "2.21.33363.0+82129205",
65
+ "on_device_sampling": false,
66
+ "optimum_neuron_version": "0.4.6.dev2",
67
+ "output_logits": false,
68
+ "pp_degree": 1,
69
+ "prefill_chunk_size": 0,
70
+ "sequence_length": 1024,
71
+ "speculation_length": 0,
72
+ "start_rank_id": 0,
73
+ "target": "trn1",
74
+ "torch_dtype": "bfloat16",
75
+ "tp_degree": 2
76
+ },
77
+ "num_attention_heads": 16,
78
+ "num_hidden_layers": 28,
79
+ "num_key_value_heads": 8,
80
+ "rms_norm_eps": 1e-06,
81
+ "rope_scaling": null,
82
+ "rope_theta": 1000000,
83
+ "sliding_window": null,
84
+ "tie_word_embeddings": true,
85
+ "use_cache": true,
86
+ "use_sliding_window": false,
87
+ "vocab_size": 151936
88
+ }
neuronxcc-2.21.33363.0+82129205/MODULE_17476209562158013765+e30acd3a/model.neff CHANGED
Binary files a/neuronxcc-2.21.33363.0+82129205/MODULE_17476209562158013765+e30acd3a/model.neff and b/neuronxcc-2.21.33363.0+82129205/MODULE_17476209562158013765+e30acd3a/model.neff differ
 
neuronxcc-2.21.33363.0+82129205/MODULE_5006ac810070ead7ed92+24129607/compile_flags.json ADDED
@@ -0,0 +1 @@
 
 
1
+ ["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding/_tp0_bk0/log-neuron-cc.txt"]
neuronxcc-2.21.33363.0+82129205/MODULE_5006ac810070ead7ed92+24129607/model.done ADDED
File without changes
neuronxcc-2.21.33363.0+82129205/MODULE_5006ac810070ead7ed92+24129607/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:db2a056d98b98672d37a1e08b48bf6f37953aba9b4c616720de52a80dbeeabfb
3
+ size 693532
neuronxcc-2.21.33363.0+82129205/MODULE_5006ac810070ead7ed92+24129607/model.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8a605026a3de07a515ce0814ecd12488cf6cb11c72ed4113ad5cdde2ebdf566e
3
+ size 5039104
neuronxcc-2.21.33363.0+82129205/MODULE_9e22b55ec8c0b02cf4ef+28fcbe05/compile_flags.json ADDED
@@ -0,0 +1 @@
 
 
1
+ ["--target=trn1", "--enable-saturate-infinity", "--auto-cast=none", "--model-type=transformer", "-O1", "--logfile=/tmp/nxdi_test_69445d02-1e2d-4f77-9ed8-c9029402b637/compiler_workdir/SoftmaxWithMask/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"]
neuronxcc-2.21.33363.0+82129205/MODULE_9e22b55ec8c0b02cf4ef+28fcbe05/model.done ADDED
File without changes
neuronxcc-2.21.33363.0+82129205/MODULE_9e22b55ec8c0b02cf4ef+28fcbe05/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:70f96487dad4bb02b98bf2c955fe59650a5fdbcf1d763fdf56ec412b62b5774c
3
+ size 5596
neuronxcc-2.21.33363.0+82129205/MODULE_9e22b55ec8c0b02cf4ef+28fcbe05/model.neff ADDED
Binary file (31.7 kB). View file
 
neuronxcc-2.21.33363.0+82129205/MODULE_a1d5b9d5676277a73661+a02c3a36/compile_flags.json ADDED
@@ -0,0 +1 @@
 
 
1
+ ["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"]
neuronxcc-2.21.33363.0+82129205/MODULE_a1d5b9d5676277a73661+a02c3a36/model.done ADDED
File without changes
neuronxcc-2.21.33363.0+82129205/MODULE_a1d5b9d5676277a73661+a02c3a36/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1eefc21dfba0ef82c19273eba57dd5a0bf0554faaa2d39d11cd99f0c330170b5
3
+ size 735532
neuronxcc-2.21.33363.0+82129205/MODULE_a1d5b9d5676277a73661+a02c3a36/model.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:120cbfa9f71dd5236635bc11c0b1e835fb832b9c0ec11ab84e350f086e92b1f7
3
+ size 2305024
neuronxcc-2.21.33363.0+82129205/MODULE_a1d5b9d5676277a73661+a02c3a36/wrapped_neff.hlo ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:842619c244312132fec3c4e8bc1ad737c011b8de21b6e4a28657d07f6e0b5dc3
3
+ size 2442081
neuronxcc-2.21.33363.0+82129205/MODULE_ad16674dd3fc5a51c226+a02c3a36/model.neff CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2b8be74d754d3877ff4c9586c81611124a2989d55ff021b4915372155a27fe1a
3
  size 3073024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2f7ccb3c563a4c0fdae234892df68dcd6c60cd41674bf983c7a5693709d2af9c
3
  size 3073024
neuronxcc-2.21.33363.0+82129205/MODULE_ad16674dd3fc5a51c226+a02c3a36/wrapped_neff.hlo CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a1a2dfe758abc52214d97cbae6fd8bfe738893d16164557e687784ac1c1a80a9
3
  size 3147125
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1a6ac7c0556c0e218f9e95cabc999fa5d73cb79aabcc96ccbc57e3c5325e36e9
3
  size 3147125
neuronxcc-2.21.33363.0+82129205/MODULE_b54a5aa9a7bb0faeb6b1+940786cd/compile_flags.json ADDED
@@ -0,0 +1 @@
 
 
1
+ ["--target=trn1", "--enable-saturate-infinity", "--auto-cast=none", "--model-type=transformer", "-O1", "--logfile=/tmp/nxdi_test_4e549635-b641-407e-bfcf-0de9fb256e44/compiler_workdir/SoftmaxWithMask/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"]
neuronxcc-2.21.33363.0+82129205/MODULE_b54a5aa9a7bb0faeb6b1+940786cd/model.done ADDED
File without changes
neuronxcc-2.21.33363.0+82129205/MODULE_b54a5aa9a7bb0faeb6b1+940786cd/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f9a258ce111db27dc5ba46ec4f9f6877c56b0777a5534c0eba14488ff9eaf298
3
+ size 5596
neuronxcc-2.21.33363.0+82129205/MODULE_b54a5aa9a7bb0faeb6b1+940786cd/model.neff ADDED
Binary file (31.7 kB). View file
 
neuronxcc-2.21.33363.0+82129205/MODULE_e79d2ef691b5cd91e631+d4248311/compile_flags.json ADDED
@@ -0,0 +1 @@
 
 
1
+ ["--target=trn1", "--enable-saturate-infinity", "--auto-cast=none", "--model-type=transformer", "-O1", "--logfile=/tmp/nxdi_test_de4f3c0b-dec2-4039-854c-30a1f038d511/compiler_workdir/SoftmaxNoMask/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"]
neuronxcc-2.21.33363.0+82129205/MODULE_e79d2ef691b5cd91e631+d4248311/model.done ADDED
File without changes
neuronxcc-2.21.33363.0+82129205/MODULE_e79d2ef691b5cd91e631+d4248311/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8e542c76cf27c3f807feac47dd3f58fd4c308e8d9e932f0732774bee19d640d8
3
+ size 3881
neuronxcc-2.21.33363.0+82129205/MODULE_e79d2ef691b5cd91e631+d4248311/model.neff ADDED
Binary file (31.7 kB). View file
 
neuronxcc-2.21.33363.0+82129205/MODULE_f1638265f2796bf1b8b8+81944ebb/compile_flags.json ADDED
@@ -0,0 +1 @@
 
 
1
+ ["--target=trn1", "--enable-saturate-infinity", "--auto-cast=none", "--model-type=transformer", "-O1", "--logfile=/tmp/nxdi_test_1a5ee6fa-840a-4fa0-b1c4-3b83c44912b0/compiler_workdir/SoftmaxNoMask/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"]
neuronxcc-2.21.33363.0+82129205/MODULE_f1638265f2796bf1b8b8+81944ebb/model.done ADDED
File without changes
neuronxcc-2.21.33363.0+82129205/MODULE_f1638265f2796bf1b8b8+81944ebb/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5efb0ea01dc0241314f91e19cbd9be551d1a66e7dbadd7cd4d6473d6b7d4b99a
3
+ size 3881
neuronxcc-2.21.33363.0+82129205/MODULE_f1638265f2796bf1b8b8+81944ebb/model.neff ADDED
Binary file (31.7 kB). View file