dacorvo HF Staff committed on
Commit
181e57b
·
verified ·
1 Parent(s): f8ca4c8

Synchronizing local compiler cache.

Browse files
Files changed (48) hide show
  1. .gitattributes +14 -0
  2. neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.4.dev2/llama/meta-llama/Llama-3.1-8B-Instruct/88837b9b04ca62ade2e5.json +62 -0
  3. neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.4.dev2/llama/meta-llama/Llama-3.2-1B-Instruct/184d3988bab3b0aea22a.json +62 -0
  4. neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.4.dev2/llama/meta-llama/Llama-3.2-1B-Instruct/1aff29ca40a5d84dc158.json +63 -0
  5. neuronxcc-2.21.33363.0+82129205/MODULE_0c0c570336081d2ddd3c+24129607/compile_flags.json +1 -0
  6. neuronxcc-2.21.33363.0+82129205/MODULE_0c0c570336081d2ddd3c+24129607/model.done +0 -0
  7. neuronxcc-2.21.33363.0+82129205/MODULE_0c0c570336081d2ddd3c+24129607/model.hlo_module.pb +3 -0
  8. neuronxcc-2.21.33363.0+82129205/MODULE_0c0c570336081d2ddd3c+24129607/model.neff +3 -0
  9. neuronxcc-2.21.33363.0+82129205/MODULE_1ac352f09de58a202958+24129607/compile_flags.json +1 -0
  10. neuronxcc-2.21.33363.0+82129205/MODULE_1ac352f09de58a202958+24129607/model.done +0 -0
  11. neuronxcc-2.21.33363.0+82129205/MODULE_1ac352f09de58a202958+24129607/model.hlo_module.pb +3 -0
  12. neuronxcc-2.21.33363.0+82129205/MODULE_1ac352f09de58a202958+24129607/model.neff +3 -0
  13. neuronxcc-2.21.33363.0+82129205/MODULE_3127262d3bc119879dfa+24129607/compile_flags.json +1 -0
  14. neuronxcc-2.21.33363.0+82129205/MODULE_3127262d3bc119879dfa+24129607/model.done +0 -0
  15. neuronxcc-2.21.33363.0+82129205/MODULE_3127262d3bc119879dfa+24129607/model.hlo_module.pb +3 -0
  16. neuronxcc-2.21.33363.0+82129205/MODULE_3127262d3bc119879dfa+24129607/model.neff +3 -0
  17. neuronxcc-2.21.33363.0+82129205/MODULE_85454497bce26576d95d+a02c3a36/compile_flags.json +1 -0
  18. neuronxcc-2.21.33363.0+82129205/MODULE_85454497bce26576d95d+a02c3a36/model.done +0 -0
  19. neuronxcc-2.21.33363.0+82129205/MODULE_85454497bce26576d95d+a02c3a36/model.hlo_module.pb +3 -0
  20. neuronxcc-2.21.33363.0+82129205/MODULE_85454497bce26576d95d+a02c3a36/model.neff +3 -0
  21. neuronxcc-2.21.33363.0+82129205/MODULE_85454497bce26576d95d+a02c3a36/wrapped_neff.hlo +3 -0
  22. neuronxcc-2.21.33363.0+82129205/MODULE_9088cab965c880f237a4+a02c3a36/compile_flags.json +1 -0
  23. neuronxcc-2.21.33363.0+82129205/MODULE_9088cab965c880f237a4+a02c3a36/model.done +0 -0
  24. neuronxcc-2.21.33363.0+82129205/MODULE_9088cab965c880f237a4+a02c3a36/model.hlo_module.pb +3 -0
  25. neuronxcc-2.21.33363.0+82129205/MODULE_9088cab965c880f237a4+a02c3a36/model.neff +3 -0
  26. neuronxcc-2.21.33363.0+82129205/MODULE_9088cab965c880f237a4+a02c3a36/wrapped_neff.hlo +3 -0
  27. neuronxcc-2.21.33363.0+82129205/MODULE_a7db8b94be5fa8c63086+24129607/compile_flags.json +1 -0
  28. neuronxcc-2.21.33363.0+82129205/MODULE_a7db8b94be5fa8c63086+24129607/model.done +0 -0
  29. neuronxcc-2.21.33363.0+82129205/MODULE_a7db8b94be5fa8c63086+24129607/model.hlo_module.pb +3 -0
  30. neuronxcc-2.21.33363.0+82129205/MODULE_a7db8b94be5fa8c63086+24129607/model.neff +3 -0
  31. neuronxcc-2.21.33363.0+82129205/MODULE_cafaaccbcb3304f08d70+24129607/compile_flags.json +1 -0
  32. neuronxcc-2.21.33363.0+82129205/MODULE_cafaaccbcb3304f08d70+24129607/model.done +0 -0
  33. neuronxcc-2.21.33363.0+82129205/MODULE_cafaaccbcb3304f08d70+24129607/model.hlo_module.pb +3 -0
  34. neuronxcc-2.21.33363.0+82129205/MODULE_cafaaccbcb3304f08d70+24129607/model.neff +3 -0
  35. neuronxcc-2.21.33363.0+82129205/MODULE_da1fe9f94d1912f89f98+24129607/compile_flags.json +1 -0
  36. neuronxcc-2.21.33363.0+82129205/MODULE_da1fe9f94d1912f89f98+24129607/model.done +0 -0
  37. neuronxcc-2.21.33363.0+82129205/MODULE_da1fe9f94d1912f89f98+24129607/model.hlo_module.pb +3 -0
  38. neuronxcc-2.21.33363.0+82129205/MODULE_da1fe9f94d1912f89f98+24129607/model.neff +3 -0
  39. neuronxcc-2.21.33363.0+82129205/MODULE_e423e95ee77bbcfd6982+a02c3a36/compile_flags.json +1 -0
  40. neuronxcc-2.21.33363.0+82129205/MODULE_e423e95ee77bbcfd6982+a02c3a36/model.done +0 -0
  41. neuronxcc-2.21.33363.0+82129205/MODULE_e423e95ee77bbcfd6982+a02c3a36/model.hlo_module.pb +3 -0
  42. neuronxcc-2.21.33363.0+82129205/MODULE_e423e95ee77bbcfd6982+a02c3a36/model.neff +3 -0
  43. neuronxcc-2.21.33363.0+82129205/MODULE_e423e95ee77bbcfd6982+a02c3a36/wrapped_neff.hlo +3 -0
  44. neuronxcc-2.21.33363.0+82129205/MODULE_fa675f3a434a3d346112+a02c3a36/compile_flags.json +1 -0
  45. neuronxcc-2.21.33363.0+82129205/MODULE_fa675f3a434a3d346112+a02c3a36/model.done +0 -0
  46. neuronxcc-2.21.33363.0+82129205/MODULE_fa675f3a434a3d346112+a02c3a36/model.hlo_module.pb +3 -0
  47. neuronxcc-2.21.33363.0+82129205/MODULE_fa675f3a434a3d346112+a02c3a36/model.neff +3 -0
  48. neuronxcc-2.21.33363.0+82129205/MODULE_fa675f3a434a3d346112+a02c3a36/wrapped_neff.hlo +3 -0
.gitattributes CHANGED
@@ -15158,3 +15158,17 @@ neuronxcc-2.21.33363.0+82129205/MODULE_a22c65ba0c6c7a55032b+692b3dff/model.neff
15158
  neuronxcc-2.21.33363.0+82129205/MODULE_a22c65ba0c6c7a55032b+692b3dff/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text
15159
  neuronxcc-2.21.33363.0+82129205/MODULE_dac939ac0fb756b0c5a0+8669224f/model.neff filter=lfs diff=lfs merge=lfs -text
15160
  neuronxcc-2.21.33363.0+82129205/MODULE_dac939ac0fb756b0c5a0+8669224f/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
15158
  neuronxcc-2.21.33363.0+82129205/MODULE_a22c65ba0c6c7a55032b+692b3dff/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text
15159
  neuronxcc-2.21.33363.0+82129205/MODULE_dac939ac0fb756b0c5a0+8669224f/model.neff filter=lfs diff=lfs merge=lfs -text
15160
  neuronxcc-2.21.33363.0+82129205/MODULE_dac939ac0fb756b0c5a0+8669224f/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text
15161
+ neuronxcc-2.21.33363.0+82129205/MODULE_0c0c570336081d2ddd3c+24129607/model.neff filter=lfs diff=lfs merge=lfs -text
15162
+ neuronxcc-2.21.33363.0+82129205/MODULE_1ac352f09de58a202958+24129607/model.neff filter=lfs diff=lfs merge=lfs -text
15163
+ neuronxcc-2.21.33363.0+82129205/MODULE_3127262d3bc119879dfa+24129607/model.neff filter=lfs diff=lfs merge=lfs -text
15164
+ neuronxcc-2.21.33363.0+82129205/MODULE_85454497bce26576d95d+a02c3a36/model.neff filter=lfs diff=lfs merge=lfs -text
15165
+ neuronxcc-2.21.33363.0+82129205/MODULE_85454497bce26576d95d+a02c3a36/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text
15166
+ neuronxcc-2.21.33363.0+82129205/MODULE_9088cab965c880f237a4+a02c3a36/model.neff filter=lfs diff=lfs merge=lfs -text
15167
+ neuronxcc-2.21.33363.0+82129205/MODULE_9088cab965c880f237a4+a02c3a36/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text
15168
+ neuronxcc-2.21.33363.0+82129205/MODULE_a7db8b94be5fa8c63086+24129607/model.neff filter=lfs diff=lfs merge=lfs -text
15169
+ neuronxcc-2.21.33363.0+82129205/MODULE_cafaaccbcb3304f08d70+24129607/model.neff filter=lfs diff=lfs merge=lfs -text
15170
+ neuronxcc-2.21.33363.0+82129205/MODULE_da1fe9f94d1912f89f98+24129607/model.neff filter=lfs diff=lfs merge=lfs -text
15171
+ neuronxcc-2.21.33363.0+82129205/MODULE_e423e95ee77bbcfd6982+a02c3a36/model.neff filter=lfs diff=lfs merge=lfs -text
15172
+ neuronxcc-2.21.33363.0+82129205/MODULE_e423e95ee77bbcfd6982+a02c3a36/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text
15173
+ neuronxcc-2.21.33363.0+82129205/MODULE_fa675f3a434a3d346112+a02c3a36/model.neff filter=lfs diff=lfs merge=lfs -text
15174
+ neuronxcc-2.21.33363.0+82129205/MODULE_fa675f3a434a3d346112+a02c3a36/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text
neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.4.dev2/llama/meta-llama/Llama-3.1-8B-Instruct/88837b9b04ca62ade2e5.json ADDED
@@ -0,0 +1,62 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_entry_class": "SingleModelCacheEntry",
3
+ "_model_id": "meta-llama/Llama-3.1-8B-Instruct",
4
+ "_task": "text-generation",
5
+ "architectures": [
6
+ "LlamaForCausalLM"
7
+ ],
8
+ "attention_bias": false,
9
+ "attention_dropout": 0.0,
10
+ "dtype": "bfloat16",
11
+ "head_dim": 128,
12
+ "hidden_act": "silu",
13
+ "hidden_size": 4096,
14
+ "initializer_range": 0.02,
15
+ "intermediate_size": 14336,
16
+ "max_position_embeddings": 131072,
17
+ "mlp_bias": false,
18
+ "model_type": "llama",
19
+ "neuron": {
20
+ "_serialized_key": "NxDNeuronConfig",
21
+ "batch_size": 1,
22
+ "capacity_factor": null,
23
+ "checkpoint_id": "meta-llama/Llama-3.1-8B-Instruct",
24
+ "checkpoint_revision": "0e9e39f249a16976918f6564b8830bc894c89659",
25
+ "continuous_batching": false,
26
+ "ep_degree": 1,
27
+ "fused_qkv": true,
28
+ "glu_mlp": true,
29
+ "local_ranks_size": 2,
30
+ "max_batch_size": 1,
31
+ "max_context_length": 4096,
32
+ "max_topk": 256,
33
+ "n_active_tokens": 4096,
34
+ "neuronxcc_version": "2.21.33363.0+82129205",
35
+ "on_device_sampling": false,
36
+ "optimum_neuron_version": "0.4.4.dev2",
37
+ "output_logits": false,
38
+ "pp_degree": 1,
39
+ "sequence_length": 4096,
40
+ "speculation_length": 0,
41
+ "start_rank_id": 0,
42
+ "target": "trn1",
43
+ "torch_dtype": "bfloat16",
44
+ "tp_degree": 2
45
+ },
46
+ "num_attention_heads": 32,
47
+ "num_hidden_layers": 32,
48
+ "num_key_value_heads": 8,
49
+ "pretraining_tp": 1,
50
+ "rms_norm_eps": 1e-05,
51
+ "rope_scaling": {
52
+ "factor": 8.0,
53
+ "high_freq_factor": 4.0,
54
+ "low_freq_factor": 1.0,
55
+ "original_max_position_embeddings": 8192,
56
+ "rope_type": "llama3"
57
+ },
58
+ "rope_theta": 500000.0,
59
+ "tie_word_embeddings": false,
60
+ "use_cache": true,
61
+ "vocab_size": 128256
62
+ }
neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.4.dev2/llama/meta-llama/Llama-3.2-1B-Instruct/184d3988bab3b0aea22a.json ADDED
@@ -0,0 +1,62 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_entry_class": "SingleModelCacheEntry",
3
+ "_model_id": "meta-llama/Llama-3.2-1B-Instruct",
4
+ "_task": "text-generation",
5
+ "architectures": [
6
+ "LlamaForCausalLM"
7
+ ],
8
+ "attention_bias": false,
9
+ "attention_dropout": 0.0,
10
+ "dtype": "bfloat16",
11
+ "head_dim": 64,
12
+ "hidden_act": "silu",
13
+ "hidden_size": 2048,
14
+ "initializer_range": 0.02,
15
+ "intermediate_size": 8192,
16
+ "max_position_embeddings": 131072,
17
+ "mlp_bias": false,
18
+ "model_type": "llama",
19
+ "neuron": {
20
+ "_serialized_key": "NxDNeuronConfig",
21
+ "batch_size": 1,
22
+ "capacity_factor": null,
23
+ "checkpoint_id": "meta-llama/Llama-3.2-1B-Instruct",
24
+ "checkpoint_revision": "9213176726f574b556790deb65791e0c5aa438b6",
25
+ "continuous_batching": false,
26
+ "ep_degree": 1,
27
+ "fused_qkv": true,
28
+ "glu_mlp": true,
29
+ "local_ranks_size": 2,
30
+ "max_batch_size": 1,
31
+ "max_context_length": 8192,
32
+ "max_topk": 256,
33
+ "n_active_tokens": 8192,
34
+ "neuronxcc_version": "2.21.33363.0+82129205",
35
+ "on_device_sampling": false,
36
+ "optimum_neuron_version": "0.4.4.dev2",
37
+ "output_logits": false,
38
+ "pp_degree": 1,
39
+ "sequence_length": 8192,
40
+ "speculation_length": 0,
41
+ "start_rank_id": 0,
42
+ "target": "trn1",
43
+ "torch_dtype": "bfloat16",
44
+ "tp_degree": 2
45
+ },
46
+ "num_attention_heads": 32,
47
+ "num_hidden_layers": 16,
48
+ "num_key_value_heads": 8,
49
+ "pretraining_tp": 1,
50
+ "rms_norm_eps": 1e-05,
51
+ "rope_scaling": {
52
+ "factor": 32.0,
53
+ "high_freq_factor": 4.0,
54
+ "low_freq_factor": 1.0,
55
+ "original_max_position_embeddings": 8192,
56
+ "rope_type": "llama3"
57
+ },
58
+ "rope_theta": 500000.0,
59
+ "tie_word_embeddings": true,
60
+ "use_cache": true,
61
+ "vocab_size": 128256
62
+ }
neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.4.dev2/llama/meta-llama/Llama-3.2-1B-Instruct/1aff29ca40a5d84dc158.json ADDED
@@ -0,0 +1,63 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_entry_class": "SingleModelCacheEntry",
3
+ "_model_id": "meta-llama/Llama-3.2-1B-Instruct",
4
+ "_task": "text-generation",
5
+ "architectures": [
6
+ "LlamaForCausalLM"
7
+ ],
8
+ "attention_bias": false,
9
+ "attention_dropout": 0.0,
10
+ "dtype": "bfloat16",
11
+ "head_dim": 64,
12
+ "hidden_act": "silu",
13
+ "hidden_size": 2048,
14
+ "initializer_range": 0.02,
15
+ "intermediate_size": 8192,
16
+ "max_position_embeddings": 131072,
17
+ "mlp_bias": false,
18
+ "model_type": "llama",
19
+ "neuron": {
20
+ "_serialized_key": "NxDNeuronConfig",
21
+ "batch_size": 1,
22
+ "capacity_factor": null,
23
+ "checkpoint_id": "meta-llama/Llama-3.2-1B-Instruct",
24
+ "checkpoint_revision": "9213176726f574b556790deb65791e0c5aa438b6",
25
+ "continuous_batching": false,
26
+ "ep_degree": 1,
27
+ "fused_qkv": true,
28
+ "glu_mlp": true,
29
+ "local_ranks_size": 2,
30
+ "max_batch_size": 1,
31
+ "max_context_length": 8192,
32
+ "max_topk": 256,
33
+ "n_active_tokens": 8192,
34
+ "neuronxcc_version": "2.21.33363.0+82129205",
35
+ "on_device_sampling": false,
36
+ "optimum_neuron_version": "0.4.4.dev2",
37
+ "output_logits": false,
38
+ "pp_degree": 1,
39
+ "sequence_length": 8192,
40
+ "sequence_parallel_enabled": true,
41
+ "speculation_length": 0,
42
+ "start_rank_id": 0,
43
+ "target": "trn1",
44
+ "torch_dtype": "bfloat16",
45
+ "tp_degree": 2
46
+ },
47
+ "num_attention_heads": 32,
48
+ "num_hidden_layers": 16,
49
+ "num_key_value_heads": 8,
50
+ "pretraining_tp": 1,
51
+ "rms_norm_eps": 1e-05,
52
+ "rope_scaling": {
53
+ "factor": 32.0,
54
+ "high_freq_factor": 4.0,
55
+ "low_freq_factor": 1.0,
56
+ "original_max_position_embeddings": 8192,
57
+ "rope_type": "llama3"
58
+ },
59
+ "rope_theta": 500000.0,
60
+ "tie_word_embeddings": true,
61
+ "use_cache": true,
62
+ "vocab_size": 128256
63
+ }
neuronxcc-2.21.33363.0+82129205/MODULE_0c0c570336081d2ddd3c+24129607/compile_flags.json ADDED
@@ -0,0 +1 @@
 
 
1
+ ["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding/_tp0_bk0/log-neuron-cc.txt"]
neuronxcc-2.21.33363.0+82129205/MODULE_0c0c570336081d2ddd3c+24129607/model.done ADDED
File without changes
neuronxcc-2.21.33363.0+82129205/MODULE_0c0c570336081d2ddd3c+24129607/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:19f928de65496854001ada7e5e53a70b74032c92d33e8c48710fb591fb579ccc
3
+ size 434848
neuronxcc-2.21.33363.0+82129205/MODULE_0c0c570336081d2ddd3c+24129607/model.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3d8c21ed45fb889dd1b85413d67e9ff34d25354073330931cc7bceb2f401e862
3
+ size 114985984
neuronxcc-2.21.33363.0+82129205/MODULE_1ac352f09de58a202958+24129607/compile_flags.json ADDED
@@ -0,0 +1 @@
 
 
1
+ ["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding/_tp0_bk0/log-neuron-cc.txt"]
neuronxcc-2.21.33363.0+82129205/MODULE_1ac352f09de58a202958+24129607/model.done ADDED
File without changes
neuronxcc-2.21.33363.0+82129205/MODULE_1ac352f09de58a202958+24129607/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8f0a59f05f75f44d4f152165dd1498bbacd1bb716a5038c4edefa78073442b0c
3
+ size 928451
neuronxcc-2.21.33363.0+82129205/MODULE_1ac352f09de58a202958+24129607/model.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:576906166482527d7ac353da0534e8fe32fa597ef3ab1f5c105a0538e3da863a
3
+ size 41851904
neuronxcc-2.21.33363.0+82129205/MODULE_3127262d3bc119879dfa+24129607/compile_flags.json ADDED
@@ -0,0 +1 @@
 
 
1
+ ["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding/_tp0_bk0/log-neuron-cc.txt"]
neuronxcc-2.21.33363.0+82129205/MODULE_3127262d3bc119879dfa+24129607/model.done ADDED
File without changes
neuronxcc-2.21.33363.0+82129205/MODULE_3127262d3bc119879dfa+24129607/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9e2d78445e08d3210569f8562c247dacd71c96303252860c4275cd1aa5223c24
3
+ size 465940
neuronxcc-2.21.33363.0+82129205/MODULE_3127262d3bc119879dfa+24129607/model.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bf958b8008d117987b44745851fca69111ec2ac1ab25578a16fed03f2580b530
3
+ size 114279424
neuronxcc-2.21.33363.0+82129205/MODULE_85454497bce26576d95d+a02c3a36/compile_flags.json ADDED
@@ -0,0 +1 @@
 
 
1
+ ["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"]
neuronxcc-2.21.33363.0+82129205/MODULE_85454497bce26576d95d+a02c3a36/model.done ADDED
File without changes
neuronxcc-2.21.33363.0+82129205/MODULE_85454497bce26576d95d+a02c3a36/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c2941ff5bfa2ac33683363d48b44dd5eb9a7930bd31fdea40bf832b3cadc2e25
3
+ size 769257
neuronxcc-2.21.33363.0+82129205/MODULE_85454497bce26576d95d+a02c3a36/model.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1b7f6ea5e68057a9d5ad76e682963091a6503e49155f4c601cbd9c31a835d58c
3
+ size 8899584
neuronxcc-2.21.33363.0+82129205/MODULE_85454497bce26576d95d+a02c3a36/wrapped_neff.hlo ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3692add274fc47e40761a3044d5e14815585874653cfb04fcb9a420478d78c18
3
+ size 9047399
neuronxcc-2.21.33363.0+82129205/MODULE_9088cab965c880f237a4+a02c3a36/compile_flags.json ADDED
@@ -0,0 +1 @@
 
 
1
+ ["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"]
neuronxcc-2.21.33363.0+82129205/MODULE_9088cab965c880f237a4+a02c3a36/model.done ADDED
File without changes
neuronxcc-2.21.33363.0+82129205/MODULE_9088cab965c880f237a4+a02c3a36/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3f3742f0d123d956d174e40c072a858a13a03ef258da8f2056da95bbed4653ab
3
+ size 756502
neuronxcc-2.21.33363.0+82129205/MODULE_9088cab965c880f237a4+a02c3a36/model.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:95a2b18be62bf42c74fa32c3167d04500cd5dcf04213099083be59e17ef89ee8
3
+ size 6902784
neuronxcc-2.21.33363.0+82129205/MODULE_9088cab965c880f237a4+a02c3a36/wrapped_neff.hlo ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3fa0f993403352abd4aad1c6397c69b3cb2599e47624d4b32fa8fa0c3e2f4560
3
+ size 7050133
neuronxcc-2.21.33363.0+82129205/MODULE_a7db8b94be5fa8c63086+24129607/compile_flags.json ADDED
@@ -0,0 +1 @@
 
 
1
+ ["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding/_tp0_bk0/log-neuron-cc.txt"]
neuronxcc-2.21.33363.0+82129205/MODULE_a7db8b94be5fa8c63086+24129607/model.done ADDED
File without changes
neuronxcc-2.21.33363.0+82129205/MODULE_a7db8b94be5fa8c63086+24129607/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aff7812e7179908192c31870402bb39536413f49103f4d67f6d7f204f3e5185f
3
+ size 972333
neuronxcc-2.21.33363.0+82129205/MODULE_a7db8b94be5fa8c63086+24129607/model.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f0c7cfabffc71aff561f9f1a1a4f12dbbe2c485599f7f1c0c901469bef84860d
3
+ size 41892864
neuronxcc-2.21.33363.0+82129205/MODULE_cafaaccbcb3304f08d70+24129607/compile_flags.json ADDED
@@ -0,0 +1 @@
 
 
1
+ ["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding/_tp0_bk0/log-neuron-cc.txt"]
neuronxcc-2.21.33363.0+82129205/MODULE_cafaaccbcb3304f08d70+24129607/model.done ADDED
File without changes
neuronxcc-2.21.33363.0+82129205/MODULE_cafaaccbcb3304f08d70+24129607/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f9a75d6679d5de1f5062dfddb72d5621e645bc2830fdb1b70c65529e581d9cd0
3
+ size 505502
neuronxcc-2.21.33363.0+82129205/MODULE_cafaaccbcb3304f08d70+24129607/model.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:549f16d4c19caabedc4e743121854d85ce13e58b9deed7463efd5706da06c9e7
3
+ size 114074624
neuronxcc-2.21.33363.0+82129205/MODULE_da1fe9f94d1912f89f98+24129607/compile_flags.json ADDED
@@ -0,0 +1 @@
 
 
1
+ ["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding/_tp0_bk0/log-neuron-cc.txt"]
neuronxcc-2.21.33363.0+82129205/MODULE_da1fe9f94d1912f89f98+24129607/model.done ADDED
File without changes
neuronxcc-2.21.33363.0+82129205/MODULE_da1fe9f94d1912f89f98+24129607/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1239ef1590682b574cd985d60ca0602fb970b86e4a717dc3a70cb4afaaabb860
3
+ size 869444
neuronxcc-2.21.33363.0+82129205/MODULE_da1fe9f94d1912f89f98+24129607/model.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1872dff540e41af1855780dc910589f7bfcdf22983d14413e19ffcc5ca6e963f
3
+ size 6616064
neuronxcc-2.21.33363.0+82129205/MODULE_e423e95ee77bbcfd6982+a02c3a36/compile_flags.json ADDED
@@ -0,0 +1 @@
 
 
1
+ ["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"]
neuronxcc-2.21.33363.0+82129205/MODULE_e423e95ee77bbcfd6982+a02c3a36/model.done ADDED
File without changes
neuronxcc-2.21.33363.0+82129205/MODULE_e423e95ee77bbcfd6982+a02c3a36/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7d3e756d8fcdf483ac9d147d0dd0a09ec65b64b3e8fd6380879fb2315321d65d
3
+ size 395607
neuronxcc-2.21.33363.0+82129205/MODULE_e423e95ee77bbcfd6982+a02c3a36/model.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:62664749edfececd6069d80c0fdb784d83afb1bb3838d22a7a6a7a429144b4db
3
+ size 2171904
neuronxcc-2.21.33363.0+82129205/MODULE_e423e95ee77bbcfd6982+a02c3a36/wrapped_neff.hlo ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:63cf62f2c48a4f9cde1e8da4213d91c7a2fe5f7debbf1d62ee79f1ebc70a3c66
3
+ size 2245876
neuronxcc-2.21.33363.0+82129205/MODULE_fa675f3a434a3d346112+a02c3a36/compile_flags.json ADDED
@@ -0,0 +1 @@
 
 
1
+ ["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"]
neuronxcc-2.21.33363.0+82129205/MODULE_fa675f3a434a3d346112+a02c3a36/model.done ADDED
File without changes
neuronxcc-2.21.33363.0+82129205/MODULE_fa675f3a434a3d346112+a02c3a36/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e56bcad5523a0e96e80ff0aad4077fb4427df4e57058d493e20a6511c91c9449
3
+ size 799960
neuronxcc-2.21.33363.0+82129205/MODULE_fa675f3a434a3d346112+a02c3a36/model.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b566d1ca9bbe809614e9c072e9e909f8c8ceb89ff61085c391bce4f157564943
3
+ size 6872064
neuronxcc-2.21.33363.0+82129205/MODULE_fa675f3a434a3d346112+a02c3a36/wrapped_neff.hlo ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7bf109196d8338da1e36f5ecd489bc4f0483167a41755481ae26722ae50d6a46
3
+ size 7019528