tengomucho HF Staff commited on
Commit
f405660
·
verified ·
1 Parent(s): 206019f

Synchronizing local compiler cache.

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. .gitattributes +24 -0
  2. neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3/llama/llamafactory/tiny-random-Llama-3/e16b019c51f845891789.json +62 -0
  3. neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3/llama4_text/tiny-random/llama-4/06fe21b7c35243f4bba9.json +81 -0
  4. neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.4.dev0/llama/meta-llama/Llama-3.2-1B-Instruct/534b7169afd0669cb851.json +62 -0
  5. neuronxcc-2.21.33363.0+82129205/MODULE_03def246761e956f7a81+a02c3a36/compile_flags.json +1 -0
  6. neuronxcc-2.21.33363.0+82129205/MODULE_03def246761e956f7a81+a02c3a36/model.done +0 -0
  7. neuronxcc-2.21.33363.0+82129205/MODULE_03def246761e956f7a81+a02c3a36/model.hlo_module.pb +3 -0
  8. neuronxcc-2.21.33363.0+82129205/MODULE_03def246761e956f7a81+a02c3a36/model.neff +3 -0
  9. neuronxcc-2.21.33363.0+82129205/MODULE_03def246761e956f7a81+a02c3a36/wrapped_neff.hlo +3 -0
  10. neuronxcc-2.21.33363.0+82129205/MODULE_306829ff9e3811933fe7+a02c3a36/compile_flags.json +1 -0
  11. neuronxcc-2.21.33363.0+82129205/MODULE_306829ff9e3811933fe7+a02c3a36/model.done +0 -0
  12. neuronxcc-2.21.33363.0+82129205/MODULE_306829ff9e3811933fe7+a02c3a36/model.hlo_module.pb +3 -0
  13. neuronxcc-2.21.33363.0+82129205/MODULE_306829ff9e3811933fe7+a02c3a36/model.neff +3 -0
  14. neuronxcc-2.21.33363.0+82129205/MODULE_306829ff9e3811933fe7+a02c3a36/wrapped_neff.hlo +3 -0
  15. neuronxcc-2.21.33363.0+82129205/MODULE_574e9a764503b48fbba9+24129607/compile_flags.json +1 -0
  16. neuronxcc-2.21.33363.0+82129205/MODULE_574e9a764503b48fbba9+24129607/model.done +0 -0
  17. neuronxcc-2.21.33363.0+82129205/MODULE_574e9a764503b48fbba9+24129607/model.hlo_module.pb +3 -0
  18. neuronxcc-2.21.33363.0+82129205/MODULE_574e9a764503b48fbba9+24129607/model.neff +3 -0
  19. neuronxcc-2.21.33363.0+82129205/MODULE_5f6f4f62aba29e11d946+24129607/compile_flags.json +1 -0
  20. neuronxcc-2.21.33363.0+82129205/MODULE_5f6f4f62aba29e11d946+24129607/model.done +0 -0
  21. neuronxcc-2.21.33363.0+82129205/MODULE_5f6f4f62aba29e11d946+24129607/model.hlo_module.pb +3 -0
  22. neuronxcc-2.21.33363.0+82129205/MODULE_5f6f4f62aba29e11d946+24129607/model.neff +3 -0
  23. neuronxcc-2.21.33363.0+82129205/MODULE_8414d37eab328896acb7+a02c3a36/compile_flags.json +1 -0
  24. neuronxcc-2.21.33363.0+82129205/MODULE_8414d37eab328896acb7+a02c3a36/model.done +0 -0
  25. neuronxcc-2.21.33363.0+82129205/MODULE_8414d37eab328896acb7+a02c3a36/model.hlo_module.pb +3 -0
  26. neuronxcc-2.21.33363.0+82129205/MODULE_8414d37eab328896acb7+a02c3a36/model.neff +3 -0
  27. neuronxcc-2.21.33363.0+82129205/MODULE_8414d37eab328896acb7+a02c3a36/wrapped_neff.hlo +3 -0
  28. neuronxcc-2.21.33363.0+82129205/MODULE_9d35248a93d4142a3cf1+24129607/compile_flags.json +1 -0
  29. neuronxcc-2.21.33363.0+82129205/MODULE_9d35248a93d4142a3cf1+24129607/model.done +0 -0
  30. neuronxcc-2.21.33363.0+82129205/MODULE_9d35248a93d4142a3cf1+24129607/model.hlo_module.pb +3 -0
  31. neuronxcc-2.21.33363.0+82129205/MODULE_9d35248a93d4142a3cf1+24129607/model.neff +3 -0
  32. neuronxcc-2.21.33363.0+82129205/MODULE_9e174a0ad6384712cfa5+24129607/compile_flags.json +1 -0
  33. neuronxcc-2.21.33363.0+82129205/MODULE_9e174a0ad6384712cfa5+24129607/model.done +0 -0
  34. neuronxcc-2.21.33363.0+82129205/MODULE_9e174a0ad6384712cfa5+24129607/model.hlo_module.pb +3 -0
  35. neuronxcc-2.21.33363.0+82129205/MODULE_9e174a0ad6384712cfa5+24129607/model.neff +3 -0
  36. neuronxcc-2.21.33363.0+82129205/MODULE_a38bf2241a80d200aa33+a02c3a36/compile_flags.json +1 -0
  37. neuronxcc-2.21.33363.0+82129205/MODULE_a38bf2241a80d200aa33+a02c3a36/model.done +0 -0
  38. neuronxcc-2.21.33363.0+82129205/MODULE_a38bf2241a80d200aa33+a02c3a36/model.hlo_module.pb +3 -0
  39. neuronxcc-2.21.33363.0+82129205/MODULE_a38bf2241a80d200aa33+a02c3a36/model.neff +3 -0
  40. neuronxcc-2.21.33363.0+82129205/MODULE_a38bf2241a80d200aa33+a02c3a36/wrapped_neff.hlo +3 -0
  41. neuronxcc-2.21.33363.0+82129205/MODULE_c0808787f3555a6627cc+24129607/compile_flags.json +1 -0
  42. neuronxcc-2.21.33363.0+82129205/MODULE_c0808787f3555a6627cc+24129607/model.done +0 -0
  43. neuronxcc-2.21.33363.0+82129205/MODULE_c0808787f3555a6627cc+24129607/model.hlo_module.pb +3 -0
  44. neuronxcc-2.21.33363.0+82129205/MODULE_c0808787f3555a6627cc+24129607/model.neff +3 -0
  45. neuronxcc-2.21.33363.0+82129205/MODULE_c2b3afa51c57d431a332+a02c3a36/compile_flags.json +1 -0
  46. neuronxcc-2.21.33363.0+82129205/MODULE_c2b3afa51c57d431a332+a02c3a36/model.done +0 -0
  47. neuronxcc-2.21.33363.0+82129205/MODULE_c2b3afa51c57d431a332+a02c3a36/model.hlo_module.pb +3 -0
  48. neuronxcc-2.21.33363.0+82129205/MODULE_c2b3afa51c57d431a332+a02c3a36/model.neff +3 -0
  49. neuronxcc-2.21.33363.0+82129205/MODULE_c2b3afa51c57d431a332+a02c3a36/wrapped_neff.hlo +3 -0
  50. neuronxcc-2.21.33363.0+82129205/MODULE_cedace9d3d693aab8d35+a02c3a36/compile_flags.json +1 -0
.gitattributes CHANGED
@@ -6168,3 +6168,27 @@ neuronxcc-2.21.33363.0+82129205/MODULE_ecf84edc7dafa7cf47bc+6e4949b4/model.neff
6168
  neuronxcc-2.21.33363.0+82129205/MODULE_f0c0b96c282628d572b0+a02c3a36/model.neff filter=lfs diff=lfs merge=lfs -text
6169
  neuronxcc-2.21.33363.0+82129205/MODULE_f0c0b96c282628d572b0+a02c3a36/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text
6170
  neuronxcc-2.21.33363.0+82129205/MODULE_728ea12fa65b10279163+24129607/model.neff filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
6168
  neuronxcc-2.21.33363.0+82129205/MODULE_f0c0b96c282628d572b0+a02c3a36/model.neff filter=lfs diff=lfs merge=lfs -text
6169
  neuronxcc-2.21.33363.0+82129205/MODULE_f0c0b96c282628d572b0+a02c3a36/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text
6170
  neuronxcc-2.21.33363.0+82129205/MODULE_728ea12fa65b10279163+24129607/model.neff filter=lfs diff=lfs merge=lfs -text
6171
+ neuronxcc-2.21.33363.0+82129205/MODULE_03def246761e956f7a81+a02c3a36/model.neff filter=lfs diff=lfs merge=lfs -text
6172
+ neuronxcc-2.21.33363.0+82129205/MODULE_03def246761e956f7a81+a02c3a36/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text
6173
+ neuronxcc-2.21.33363.0+82129205/MODULE_306829ff9e3811933fe7+a02c3a36/model.neff filter=lfs diff=lfs merge=lfs -text
6174
+ neuronxcc-2.21.33363.0+82129205/MODULE_306829ff9e3811933fe7+a02c3a36/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text
6175
+ neuronxcc-2.21.33363.0+82129205/MODULE_574e9a764503b48fbba9+24129607/model.neff filter=lfs diff=lfs merge=lfs -text
6176
+ neuronxcc-2.21.33363.0+82129205/MODULE_5f6f4f62aba29e11d946+24129607/model.neff filter=lfs diff=lfs merge=lfs -text
6177
+ neuronxcc-2.21.33363.0+82129205/MODULE_8414d37eab328896acb7+a02c3a36/model.neff filter=lfs diff=lfs merge=lfs -text
6178
+ neuronxcc-2.21.33363.0+82129205/MODULE_8414d37eab328896acb7+a02c3a36/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text
6179
+ neuronxcc-2.21.33363.0+82129205/MODULE_9d35248a93d4142a3cf1+24129607/model.neff filter=lfs diff=lfs merge=lfs -text
6180
+ neuronxcc-2.21.33363.0+82129205/MODULE_9e174a0ad6384712cfa5+24129607/model.neff filter=lfs diff=lfs merge=lfs -text
6181
+ neuronxcc-2.21.33363.0+82129205/MODULE_a38bf2241a80d200aa33+a02c3a36/model.neff filter=lfs diff=lfs merge=lfs -text
6182
+ neuronxcc-2.21.33363.0+82129205/MODULE_a38bf2241a80d200aa33+a02c3a36/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text
6183
+ neuronxcc-2.21.33363.0+82129205/MODULE_c0808787f3555a6627cc+24129607/model.neff filter=lfs diff=lfs merge=lfs -text
6184
+ neuronxcc-2.21.33363.0+82129205/MODULE_c2b3afa51c57d431a332+a02c3a36/model.neff filter=lfs diff=lfs merge=lfs -text
6185
+ neuronxcc-2.21.33363.0+82129205/MODULE_c2b3afa51c57d431a332+a02c3a36/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text
6186
+ neuronxcc-2.21.33363.0+82129205/MODULE_cedace9d3d693aab8d35+a02c3a36/model.neff filter=lfs diff=lfs merge=lfs -text
6187
+ neuronxcc-2.21.33363.0+82129205/MODULE_cedace9d3d693aab8d35+a02c3a36/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text
6188
+ neuronxcc-2.21.33363.0+82129205/MODULE_d5ada2fae774253484ca+24129607/model.neff filter=lfs diff=lfs merge=lfs -text
6189
+ neuronxcc-2.21.33363.0+82129205/MODULE_e973fc6fe6bd9c3d7c03+a02c3a36/model.neff filter=lfs diff=lfs merge=lfs -text
6190
+ neuronxcc-2.21.33363.0+82129205/MODULE_e973fc6fe6bd9c3d7c03+a02c3a36/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text
6191
+ neuronxcc-2.21.33363.0+82129205/MODULE_f81f36ad8e744c8da4f2+24129607/model.neff filter=lfs diff=lfs merge=lfs -text
6192
+ neuronxcc-2.22.12471.0+b4a00d10/MODULE_ab3e50332a1f49feba2d+84337dd9/model.neff filter=lfs diff=lfs merge=lfs -text
6193
+ neuronxcc-2.22.12471.0+b4a00d10/MODULE_ab3e50332a1f49feba2d+84337dd9/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text
6194
+ neuronxcc-2.22.12471.0+b4a00d10/MODULE_ba94bd052390e13a7dc4+519f203d/model.neff filter=lfs diff=lfs merge=lfs -text
neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3/llama/llamafactory/tiny-random-Llama-3/e16b019c51f845891789.json ADDED
@@ -0,0 +1,62 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_entry_class": "SingleModelCacheEntry",
3
+ "_model_id": "llamafactory/tiny-random-Llama-3",
4
+ "_task": "text-generation",
5
+ "architectures": [
6
+ "LlamaForCausalLM"
7
+ ],
8
+ "attention_bias": false,
9
+ "attention_dropout": 0.0,
10
+ "dtype": "float16",
11
+ "head_dim": 4,
12
+ "hidden_act": "silu",
13
+ "hidden_size": 16,
14
+ "initializer_range": 0.02,
15
+ "intermediate_size": 64,
16
+ "max_position_embeddings": 131072,
17
+ "mlp_bias": false,
18
+ "model_type": "llama",
19
+ "neuron": {
20
+ "_serialized_key": "NxDNeuronConfig",
21
+ "batch_size": 1,
22
+ "capacity_factor": null,
23
+ "checkpoint_id": "llamafactory/tiny-random-Llama-3",
24
+ "checkpoint_revision": "bf2a2e3bf199ad2ee96f02a3c00246c608db22a8",
25
+ "continuous_batching": false,
26
+ "ep_degree": 1,
27
+ "fused_qkv": true,
28
+ "glu_mlp": true,
29
+ "local_ranks_size": 2,
30
+ "max_batch_size": 1,
31
+ "max_context_length": 1024,
32
+ "max_topk": 256,
33
+ "n_active_tokens": 1024,
34
+ "neuronxcc_version": "2.21.33363.0+82129205",
35
+ "on_device_sampling": true,
36
+ "optimum_neuron_version": "0.4.3",
37
+ "output_logits": false,
38
+ "pp_degree": 1,
39
+ "sequence_length": 1024,
40
+ "speculation_length": 0,
41
+ "start_rank_id": 0,
42
+ "target": "trn1",
43
+ "torch_dtype": "float16",
44
+ "tp_degree": 2
45
+ },
46
+ "num_attention_heads": 4,
47
+ "num_hidden_layers": 2,
48
+ "num_key_value_heads": 4,
49
+ "pretraining_tp": 1,
50
+ "rms_norm_eps": 1e-05,
51
+ "rope_scaling": {
52
+ "factor": 8.0,
53
+ "high_freq_factor": 4.0,
54
+ "low_freq_factor": 1.0,
55
+ "original_max_position_embeddings": 8192,
56
+ "rope_type": "llama3"
57
+ },
58
+ "rope_theta": 500000.0,
59
+ "tie_word_embeddings": false,
60
+ "use_cache": true,
61
+ "vocab_size": 128256
62
+ }
neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3/llama4_text/tiny-random/llama-4/06fe21b7c35243f4bba9.json ADDED
@@ -0,0 +1,81 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_entry_class": "SingleModelCacheEntry",
3
+ "_model_id": "tiny-random/llama-4",
4
+ "_task": "text-generation",
5
+ "attention_bias": false,
6
+ "attention_chunk_size": 128,
7
+ "attention_dropout": 0.0,
8
+ "attn_scale": 0.1,
9
+ "attn_temperature_tuning": 4,
10
+ "cache_implementation": "hybrid",
11
+ "dtype": "bfloat16",
12
+ "floor_scale": 8192,
13
+ "for_llm_compressor": false,
14
+ "head_dim": 32,
15
+ "hidden_act": "silu",
16
+ "hidden_size": 32,
17
+ "initializer_range": 0.02,
18
+ "interleave_moe_layer_step": 2,
19
+ "intermediate_size": 64,
20
+ "intermediate_size_mlp": 128,
21
+ "layer_types": [
22
+ "chunked_attention",
23
+ "chunked_attention",
24
+ "chunked_attention",
25
+ "full_attention"
26
+ ],
27
+ "max_position_embeddings": 1048576,
28
+ "model_type": "llama4_text",
29
+ "moe_layers": [
30
+ 1,
31
+ 3
32
+ ],
33
+ "neuron": {
34
+ "_serialized_key": "NxDNeuronConfig",
35
+ "batch_size": 1,
36
+ "capacity_factor": null,
37
+ "checkpoint_id": "tiny-random/llama-4",
38
+ "checkpoint_revision": "9e716f5d4d1ffe0a44a15f46f4a12b840439aba4",
39
+ "continuous_batching": false,
40
+ "ep_degree": 1,
41
+ "fused_qkv": false,
42
+ "glu_mlp": true,
43
+ "local_ranks_size": 2,
44
+ "max_batch_size": 1,
45
+ "max_context_length": 1024,
46
+ "max_topk": 256,
47
+ "n_active_tokens": 1024,
48
+ "neuronxcc_version": "2.21.33363.0+82129205",
49
+ "on_device_sampling": true,
50
+ "optimum_neuron_version": "0.4.3",
51
+ "output_logits": false,
52
+ "pp_degree": 1,
53
+ "sequence_length": 1024,
54
+ "speculation_length": 0,
55
+ "start_rank_id": 0,
56
+ "target": "trn1",
57
+ "torch_dtype": "bfloat16",
58
+ "tp_degree": 2
59
+ },
60
+ "no_rope_layers": [
61
+ 1,
62
+ 1,
63
+ 1,
64
+ 0
65
+ ],
66
+ "num_attention_heads": 1,
67
+ "num_experts_per_tok": 1,
68
+ "num_hidden_layers": 4,
69
+ "num_key_value_heads": 1,
70
+ "num_local_experts": 8,
71
+ "output_router_logits": false,
72
+ "rms_norm_eps": 1e-05,
73
+ "rope_scaling": null,
74
+ "rope_theta": 500000.0,
75
+ "router_aux_loss_coef": 0.001,
76
+ "router_jitter_noise": 0.0,
77
+ "tie_word_embeddings": true,
78
+ "use_cache": true,
79
+ "use_qk_norm": true,
80
+ "vocab_size": 202048
81
+ }
neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.4.dev0/llama/meta-llama/Llama-3.2-1B-Instruct/534b7169afd0669cb851.json ADDED
@@ -0,0 +1,62 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_entry_class": "SingleModelCacheEntry",
3
+ "_model_id": "meta-llama/Llama-3.2-1B-Instruct",
4
+ "_task": "text-generation",
5
+ "architectures": [
6
+ "LlamaForCausalLM"
7
+ ],
8
+ "attention_bias": false,
9
+ "attention_dropout": 0.0,
10
+ "dtype": "bfloat16",
11
+ "head_dim": 64,
12
+ "hidden_act": "silu",
13
+ "hidden_size": 2048,
14
+ "initializer_range": 0.02,
15
+ "intermediate_size": 8192,
16
+ "max_position_embeddings": 131072,
17
+ "mlp_bias": false,
18
+ "model_type": "llama",
19
+ "neuron": {
20
+ "_serialized_key": "NxDNeuronConfig",
21
+ "batch_size": 4,
22
+ "capacity_factor": null,
23
+ "checkpoint_id": "meta-llama/Llama-3.2-1B-Instruct",
24
+ "checkpoint_revision": "9213176726f574b556790deb65791e0c5aa438b6",
25
+ "continuous_batching": true,
26
+ "ep_degree": 1,
27
+ "fused_qkv": true,
28
+ "glu_mlp": true,
29
+ "local_ranks_size": 1,
30
+ "max_batch_size": 4,
31
+ "max_context_length": 4096,
32
+ "max_topk": 256,
33
+ "n_active_tokens": 4096,
34
+ "neuronxcc_version": "2.21.33363.0+82129205",
35
+ "on_device_sampling": true,
36
+ "optimum_neuron_version": "0.4.4.dev0",
37
+ "output_logits": false,
38
+ "pp_degree": 1,
39
+ "sequence_length": 4096,
40
+ "speculation_length": 0,
41
+ "start_rank_id": 0,
42
+ "target": "trn1",
43
+ "torch_dtype": "bfloat16",
44
+ "tp_degree": 1
45
+ },
46
+ "num_attention_heads": 32,
47
+ "num_hidden_layers": 16,
48
+ "num_key_value_heads": 8,
49
+ "pretraining_tp": 1,
50
+ "rms_norm_eps": 1e-05,
51
+ "rope_scaling": {
52
+ "factor": 32.0,
53
+ "high_freq_factor": 4.0,
54
+ "low_freq_factor": 1.0,
55
+ "original_max_position_embeddings": 8192,
56
+ "rope_type": "llama3"
57
+ },
58
+ "rope_theta": 500000.0,
59
+ "tie_word_embeddings": true,
60
+ "use_cache": true,
61
+ "vocab_size": 128256
62
+ }
neuronxcc-2.21.33363.0+82129205/MODULE_03def246761e956f7a81+a02c3a36/compile_flags.json ADDED
@@ -0,0 +1 @@
 
 
1
+ ["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"]
neuronxcc-2.21.33363.0+82129205/MODULE_03def246761e956f7a81+a02c3a36/model.done ADDED
File without changes
neuronxcc-2.21.33363.0+82129205/MODULE_03def246761e956f7a81+a02c3a36/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:67b0911c04d1a1f3cba5e5e77dcb1605b3a39eb823f45a2645cd969fc52f2a63
3
+ size 389975
neuronxcc-2.21.33363.0+82129205/MODULE_03def246761e956f7a81+a02c3a36/model.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f77cfb7776c65ad90fa220e5207223152f0e725bfc73a917149dddb5eec8b79e
3
+ size 5633024
neuronxcc-2.21.33363.0+82129205/MODULE_03def246761e956f7a81+a02c3a36/wrapped_neff.hlo ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6fa880602fb3a301629e465c6a877077f25928b70ca435815df251f07425bc01
3
+ size 5707929
neuronxcc-2.21.33363.0+82129205/MODULE_306829ff9e3811933fe7+a02c3a36/compile_flags.json ADDED
@@ -0,0 +1 @@
 
 
1
+ ["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"]
neuronxcc-2.21.33363.0+82129205/MODULE_306829ff9e3811933fe7+a02c3a36/model.done ADDED
File without changes
neuronxcc-2.21.33363.0+82129205/MODULE_306829ff9e3811933fe7+a02c3a36/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5d61ac2165fde7772e8d3035b0f89b50beec5e0d305548cbacc624eefa9452d3
3
+ size 82753
neuronxcc-2.21.33363.0+82129205/MODULE_306829ff9e3811933fe7+a02c3a36/model.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7e63b61edcd20b2b6c18802faa1c4c4067acb53a0f0603d4faabc7f2d7add610
3
+ size 277504
neuronxcc-2.21.33363.0+82129205/MODULE_306829ff9e3811933fe7+a02c3a36/wrapped_neff.hlo ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:59403d318f2bcb77b55553d070b94acabd3bbdbc52da0f20e804759a51cdd6a5
3
+ size 285854
neuronxcc-2.21.33363.0+82129205/MODULE_574e9a764503b48fbba9+24129607/compile_flags.json ADDED
@@ -0,0 +1 @@
 
 
1
+ ["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding/_tp0_bk0/log-neuron-cc.txt"]
neuronxcc-2.21.33363.0+82129205/MODULE_574e9a764503b48fbba9+24129607/model.done ADDED
File without changes
neuronxcc-2.21.33363.0+82129205/MODULE_574e9a764503b48fbba9+24129607/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3810428d8bc2193c766cd607d41079f3021e3860107b7580c4158183051b8100
3
+ size 1061093
neuronxcc-2.21.33363.0+82129205/MODULE_574e9a764503b48fbba9+24129607/model.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b581f570131f39602819f273cd00c47873372b06194dc7cb33c9c5dd15bb32fa
3
+ size 9473024
neuronxcc-2.21.33363.0+82129205/MODULE_5f6f4f62aba29e11d946+24129607/compile_flags.json ADDED
@@ -0,0 +1 @@
 
 
1
+ ["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding/_tp0_bk0/log-neuron-cc.txt"]
neuronxcc-2.21.33363.0+82129205/MODULE_5f6f4f62aba29e11d946+24129607/model.done ADDED
File without changes
neuronxcc-2.21.33363.0+82129205/MODULE_5f6f4f62aba29e11d946+24129607/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9ff29a9d610dd9881a52dec279a06be490a45580450ffe418a317e9eb5295330
3
+ size 694128
neuronxcc-2.21.33363.0+82129205/MODULE_5f6f4f62aba29e11d946+24129607/model.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9a5bf9bbaba0b0f3abcb6c9408d5be74ee9fddec0f3a1a933943271af767839d
3
+ size 625664
neuronxcc-2.21.33363.0+82129205/MODULE_8414d37eab328896acb7+a02c3a36/compile_flags.json ADDED
@@ -0,0 +1 @@
 
 
1
+ ["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"]
neuronxcc-2.21.33363.0+82129205/MODULE_8414d37eab328896acb7+a02c3a36/model.done ADDED
File without changes
neuronxcc-2.21.33363.0+82129205/MODULE_8414d37eab328896acb7+a02c3a36/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:828b718ac0d544f14a9a683c76b442c49520573027ba2e8347fdd5e79531704b
3
+ size 702870
neuronxcc-2.21.33363.0+82129205/MODULE_8414d37eab328896acb7+a02c3a36/model.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b73bb9f42bc0c9fc82cdd455b1df42a8d677843e6df2cdaa0156d783b7a884b4
3
+ size 3503104
neuronxcc-2.21.33363.0+82129205/MODULE_8414d37eab328896acb7+a02c3a36/wrapped_neff.hlo ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:027c95630275e4b5fedbcb1e196c594c6ee27e9450d57d8c29e3da0f97b4bbe2
3
+ size 3640300
neuronxcc-2.21.33363.0+82129205/MODULE_9d35248a93d4142a3cf1+24129607/compile_flags.json ADDED
@@ -0,0 +1 @@
 
 
1
+ ["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding/_tp0_bk0/log-neuron-cc.txt"]
neuronxcc-2.21.33363.0+82129205/MODULE_9d35248a93d4142a3cf1+24129607/model.done ADDED
File without changes
neuronxcc-2.21.33363.0+82129205/MODULE_9d35248a93d4142a3cf1+24129607/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1ff789deef8176afeab268439fb0770b9b965fd178c19b0aead0f8be9a02e0b6
3
+ size 739558
neuronxcc-2.21.33363.0+82129205/MODULE_9d35248a93d4142a3cf1+24129607/model.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f516045352a9ee7a801257fbcdc2acf8ec33bfc172b6bfd19e961216ee11254d
3
+ size 26133504
neuronxcc-2.21.33363.0+82129205/MODULE_9e174a0ad6384712cfa5+24129607/compile_flags.json ADDED
@@ -0,0 +1 @@
 
 
1
+ ["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding/_tp0_bk0/log-neuron-cc.txt"]
neuronxcc-2.21.33363.0+82129205/MODULE_9e174a0ad6384712cfa5+24129607/model.done ADDED
File without changes
neuronxcc-2.21.33363.0+82129205/MODULE_9e174a0ad6384712cfa5+24129607/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2091cd37242da699619a7ee893e9cd7c02bb92c4cd99e0ba1ffec00be7827fcb
3
+ size 83504
neuronxcc-2.21.33363.0+82129205/MODULE_9e174a0ad6384712cfa5+24129607/model.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f67671a80c4bec27cdd099109748d4d5d7ff35f171ba81528abe3c6eb5bdd473
3
+ size 328704
neuronxcc-2.21.33363.0+82129205/MODULE_a38bf2241a80d200aa33+a02c3a36/compile_flags.json ADDED
@@ -0,0 +1 @@
 
 
1
+ ["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"]
neuronxcc-2.21.33363.0+82129205/MODULE_a38bf2241a80d200aa33+a02c3a36/model.done ADDED
File without changes
neuronxcc-2.21.33363.0+82129205/MODULE_a38bf2241a80d200aa33+a02c3a36/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f25ade0a3f52e4ef283ba2768a1420e559bb8c5c6ab4b261c432d72a52fc9e6d
3
+ size 863510
neuronxcc-2.21.33363.0+82129205/MODULE_a38bf2241a80d200aa33+a02c3a36/model.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a54421adaac8624539899fec33dc8c608ae949455c3bd1a97d068c17abc28eaa
3
+ size 6769664
neuronxcc-2.21.33363.0+82129205/MODULE_a38bf2241a80d200aa33+a02c3a36/wrapped_neff.hlo ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a7a398b3a74d052420d442286f85440cb1c2491ded5182d08474c39b537c0ed3
3
+ size 6936331
neuronxcc-2.21.33363.0+82129205/MODULE_c0808787f3555a6627cc+24129607/compile_flags.json ADDED
@@ -0,0 +1 @@
 
 
1
+ ["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding/_tp0_bk0/log-neuron-cc.txt"]
neuronxcc-2.21.33363.0+82129205/MODULE_c0808787f3555a6627cc+24129607/model.done ADDED
File without changes
neuronxcc-2.21.33363.0+82129205/MODULE_c0808787f3555a6627cc+24129607/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dd0ca28f6aa86847fba45aec92c730116dca2fd2549b970fd744ceafbe276fd5
3
+ size 865460
neuronxcc-2.21.33363.0+82129205/MODULE_c0808787f3555a6627cc+24129607/model.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fee68fdda56ade80ef20eead9552203f09b3c7b075091ffe419527eda0b756d4
3
+ size 36148224
neuronxcc-2.21.33363.0+82129205/MODULE_c2b3afa51c57d431a332+a02c3a36/compile_flags.json ADDED
@@ -0,0 +1 @@
 
 
1
+ ["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"]
neuronxcc-2.21.33363.0+82129205/MODULE_c2b3afa51c57d431a332+a02c3a36/model.done ADDED
File without changes
neuronxcc-2.21.33363.0+82129205/MODULE_c2b3afa51c57d431a332+a02c3a36/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2c2920e5fde77a80d2d66c9ba5addf46e53d032f533c7097cba34e31243f84ed
3
+ size 588406
neuronxcc-2.21.33363.0+82129205/MODULE_c2b3afa51c57d431a332+a02c3a36/model.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c8017f2ca25aa30c01e839314f958eedb8512833a8e66bfd9d075b9943b0980c
3
+ size 1926144
neuronxcc-2.21.33363.0+82129205/MODULE_c2b3afa51c57d431a332+a02c3a36/wrapped_neff.hlo ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be407fd3aecea94529ce6cc1917f9b19dd88a49aa9a67cd85524e1b93a5b54cd
3
+ size 2082478
neuronxcc-2.21.33363.0+82129205/MODULE_cedace9d3d693aab8d35+a02c3a36/compile_flags.json ADDED
@@ -0,0 +1 @@
 
 
1
+ ["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"]