tengomucho HF Staff commited on
Commit
df9915c
·
verified ·
1 Parent(s): 5154500

Synchronizing local compiler cache.

Browse files
Files changed (35) hide show
  1. .gitattributes +1 -0
  2. neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.6.dev3/441269935591cad8d370e512c0b93cdd2fce6247c40e5a4866d872ee5338b0de/51c77185b9832eaebdfc.json +81 -0
  3. neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.6.dev3/gemma3_text/unsloth/gemma-3-270m-it/51c77185b9832eaebdfc.json +81 -0
  4. neuronxcc-2.21.33363.0+82129205/MODULE_17476209562158013765+e30acd3a/model.neff +0 -0
  5. neuronxcc-2.21.33363.0+82129205/MODULE_1980033719e8e5ff938d+9462c5c2/compile_flags.json +1 -0
  6. neuronxcc-2.21.33363.0+82129205/MODULE_1980033719e8e5ff938d+9462c5c2/model.done +0 -0
  7. neuronxcc-2.21.33363.0+82129205/MODULE_1980033719e8e5ff938d+9462c5c2/model.hlo_module.pb +3 -0
  8. neuronxcc-2.21.33363.0+82129205/MODULE_1980033719e8e5ff938d+9462c5c2/model.neff +0 -0
  9. neuronxcc-2.21.33363.0+82129205/MODULE_3ae38b2f10558b767b68+45415967/compile_flags.json +1 -0
  10. neuronxcc-2.21.33363.0+82129205/MODULE_3ae38b2f10558b767b68+45415967/model.done +0 -0
  11. neuronxcc-2.21.33363.0+82129205/MODULE_3ae38b2f10558b767b68+45415967/model.hlo_module.pb +3 -0
  12. neuronxcc-2.21.33363.0+82129205/MODULE_3ae38b2f10558b767b68+45415967/model.neff +0 -0
  13. neuronxcc-2.21.33363.0+82129205/MODULE_4e68975fa752b951c6f0+c4c89da0/compile_flags.json +1 -0
  14. neuronxcc-2.21.33363.0+82129205/MODULE_4e68975fa752b951c6f0+c4c89da0/model.done +0 -0
  15. neuronxcc-2.21.33363.0+82129205/MODULE_4e68975fa752b951c6f0+c4c89da0/model.hlo_module.pb +3 -0
  16. neuronxcc-2.21.33363.0+82129205/MODULE_4e68975fa752b951c6f0+c4c89da0/model.neff +0 -0
  17. neuronxcc-2.21.33363.0+82129205/MODULE_526995fbc83a4a64429c+5a3ee265/compile_flags.json +1 -0
  18. neuronxcc-2.21.33363.0+82129205/MODULE_526995fbc83a4a64429c+5a3ee265/model.done +0 -0
  19. neuronxcc-2.21.33363.0+82129205/MODULE_526995fbc83a4a64429c+5a3ee265/model.hlo_module.pb +3 -0
  20. neuronxcc-2.21.33363.0+82129205/MODULE_526995fbc83a4a64429c+5a3ee265/model.neff +0 -0
  21. neuronxcc-2.21.33363.0+82129205/MODULE_8b48097eaa2ae85e1c16+48fd059c/compile_flags.json +1 -0
  22. neuronxcc-2.21.33363.0+82129205/MODULE_8b48097eaa2ae85e1c16+48fd059c/model.done +0 -0
  23. neuronxcc-2.21.33363.0+82129205/MODULE_8b48097eaa2ae85e1c16+48fd059c/model.hlo_module.pb +3 -0
  24. neuronxcc-2.21.33363.0+82129205/MODULE_8b48097eaa2ae85e1c16+48fd059c/model.neff +0 -0
  25. neuronxcc-2.21.33363.0+82129205/MODULE_952fafb4c315904dcb0e+f2c40fef/compile_flags.json +1 -0
  26. neuronxcc-2.21.33363.0+82129205/MODULE_952fafb4c315904dcb0e+f2c40fef/model.done +0 -0
  27. neuronxcc-2.21.33363.0+82129205/MODULE_952fafb4c315904dcb0e+f2c40fef/model.hlo_module.pb +3 -0
  28. neuronxcc-2.21.33363.0+82129205/MODULE_952fafb4c315904dcb0e+f2c40fef/model.neff +3 -0
  29. neuronxcc-2.21.33363.0+82129205/MODULE_c5bb11161997e6aa48a1+a02c3a36/model.hlo_module.pb +1 -1
  30. neuronxcc-2.21.33363.0+82129205/MODULE_c5bb11161997e6aa48a1+a02c3a36/model.neff +1 -1
  31. neuronxcc-2.21.33363.0+82129205/MODULE_c5bb11161997e6aa48a1+a02c3a36/wrapped_neff.hlo +1 -1
  32. neuronxcc-2.21.33363.0+82129205/MODULE_d617d5a80725dd447538+37d32d7c/compile_flags.json +1 -0
  33. neuronxcc-2.21.33363.0+82129205/MODULE_d617d5a80725dd447538+37d32d7c/model.done +0 -0
  34. neuronxcc-2.21.33363.0+82129205/MODULE_d617d5a80725dd447538+37d32d7c/model.hlo_module.pb +3 -0
  35. neuronxcc-2.21.33363.0+82129205/MODULE_d617d5a80725dd447538+37d32d7c/model.neff +0 -0
.gitattributes CHANGED
@@ -7026,3 +7026,4 @@ neuronxcc-2.21.33363.0+82129205/MODULE_cf5d937b64d087a8e0ee+a02c3a36/model.neff
7026
  neuronxcc-2.21.33363.0+82129205/MODULE_cf5d937b64d087a8e0ee+a02c3a36/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text
7027
  neuronxcc-2.21.33363.0+82129205/MODULE_fe6b8b40a8e1d622e71e+a02c3a36/model.neff filter=lfs diff=lfs merge=lfs -text
7028
  neuronxcc-2.21.33363.0+82129205/MODULE_fe6b8b40a8e1d622e71e+a02c3a36/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text
 
 
7026
  neuronxcc-2.21.33363.0+82129205/MODULE_cf5d937b64d087a8e0ee+a02c3a36/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text
7027
  neuronxcc-2.21.33363.0+82129205/MODULE_fe6b8b40a8e1d622e71e+a02c3a36/model.neff filter=lfs diff=lfs merge=lfs -text
7028
  neuronxcc-2.21.33363.0+82129205/MODULE_fe6b8b40a8e1d622e71e+a02c3a36/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text
7029
+ neuronxcc-2.21.33363.0+82129205/MODULE_952fafb4c315904dcb0e+f2c40fef/model.neff filter=lfs diff=lfs merge=lfs -text
neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.6.dev3/441269935591cad8d370e512c0b93cdd2fce6247c40e5a4866d872ee5338b0de/51c77185b9832eaebdfc.json ADDED
@@ -0,0 +1,81 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_entry_class": "SingleModelCacheEntry",
3
+ "_model_id": "unsloth/gemma-3-270m-it",
4
+ "_sliding_window_pattern": 6,
5
+ "_task": "text-generation",
6
+ "architectures": [
7
+ "Gemma3ForCausalLM"
8
+ ],
9
+ "attention_bias": false,
10
+ "attention_dropout": 0.0,
11
+ "attn_logit_softcapping": null,
12
+ "dtype": "bfloat16",
13
+ "final_logit_softcapping": null,
14
+ "head_dim": 256,
15
+ "hidden_activation": "gelu_pytorch_tanh",
16
+ "hidden_size": 640,
17
+ "initializer_range": 0.02,
18
+ "intermediate_size": 2048,
19
+ "layer_types": [
20
+ "sliding_attention",
21
+ "sliding_attention",
22
+ "sliding_attention",
23
+ "sliding_attention",
24
+ "sliding_attention",
25
+ "full_attention",
26
+ "sliding_attention",
27
+ "sliding_attention",
28
+ "sliding_attention",
29
+ "sliding_attention",
30
+ "sliding_attention",
31
+ "full_attention",
32
+ "sliding_attention",
33
+ "sliding_attention",
34
+ "sliding_attention",
35
+ "sliding_attention",
36
+ "sliding_attention",
37
+ "full_attention"
38
+ ],
39
+ "max_position_embeddings": 32768,
40
+ "model_type": "gemma3_text",
41
+ "neuron": {
42
+ "_serialized_key": "NxDNeuronConfig",
43
+ "batch_size": 1,
44
+ "capacity_factor": null,
45
+ "checkpoint_id": "unsloth/gemma-3-270m-it",
46
+ "checkpoint_revision": "23cf460f6bb16954176b3ddcc8d4f250501458a9",
47
+ "continuous_batching": false,
48
+ "ep_degree": 1,
49
+ "fused_qkv": true,
50
+ "glu_mlp": true,
51
+ "local_ranks_size": 2,
52
+ "max_batch_size": 1,
53
+ "max_context_length": 8192,
54
+ "max_topk": 256,
55
+ "n_active_tokens": 8192,
56
+ "neuronxcc_version": "2.21.33363.0+82129205",
57
+ "on_device_sampling": true,
58
+ "optimum_neuron_version": "0.4.6.dev3",
59
+ "output_logits": false,
60
+ "pp_degree": 1,
61
+ "sequence_length": 8192,
62
+ "speculation_length": 0,
63
+ "start_rank_id": 0,
64
+ "target": "trn1",
65
+ "torch_dtype": "bfloat16",
66
+ "tp_degree": 2
67
+ },
68
+ "num_attention_heads": 4,
69
+ "num_hidden_layers": 18,
70
+ "num_key_value_heads": 1,
71
+ "query_pre_attn_scalar": 256,
72
+ "rms_norm_eps": 1e-06,
73
+ "rope_local_base_freq": 10000.0,
74
+ "rope_scaling": null,
75
+ "rope_theta": 1000000.0,
76
+ "sliding_window": 512,
77
+ "unsloth_fixed": true,
78
+ "use_bidirectional_attention": false,
79
+ "use_cache": true,
80
+ "vocab_size": 262144
81
+ }
neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.6.dev3/gemma3_text/unsloth/gemma-3-270m-it/51c77185b9832eaebdfc.json ADDED
@@ -0,0 +1,81 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_entry_class": "SingleModelCacheEntry",
3
+ "_model_id": "unsloth/gemma-3-270m-it",
4
+ "_sliding_window_pattern": 6,
5
+ "_task": "text-generation",
6
+ "architectures": [
7
+ "Gemma3ForCausalLM"
8
+ ],
9
+ "attention_bias": false,
10
+ "attention_dropout": 0.0,
11
+ "attn_logit_softcapping": null,
12
+ "dtype": "bfloat16",
13
+ "final_logit_softcapping": null,
14
+ "head_dim": 256,
15
+ "hidden_activation": "gelu_pytorch_tanh",
16
+ "hidden_size": 640,
17
+ "initializer_range": 0.02,
18
+ "intermediate_size": 2048,
19
+ "layer_types": [
20
+ "sliding_attention",
21
+ "sliding_attention",
22
+ "sliding_attention",
23
+ "sliding_attention",
24
+ "sliding_attention",
25
+ "full_attention",
26
+ "sliding_attention",
27
+ "sliding_attention",
28
+ "sliding_attention",
29
+ "sliding_attention",
30
+ "sliding_attention",
31
+ "full_attention",
32
+ "sliding_attention",
33
+ "sliding_attention",
34
+ "sliding_attention",
35
+ "sliding_attention",
36
+ "sliding_attention",
37
+ "full_attention"
38
+ ],
39
+ "max_position_embeddings": 32768,
40
+ "model_type": "gemma3_text",
41
+ "neuron": {
42
+ "_serialized_key": "NxDNeuronConfig",
43
+ "batch_size": 1,
44
+ "capacity_factor": null,
45
+ "checkpoint_id": "unsloth/gemma-3-270m-it",
46
+ "checkpoint_revision": "23cf460f6bb16954176b3ddcc8d4f250501458a9",
47
+ "continuous_batching": false,
48
+ "ep_degree": 1,
49
+ "fused_qkv": true,
50
+ "glu_mlp": true,
51
+ "local_ranks_size": 2,
52
+ "max_batch_size": 1,
53
+ "max_context_length": 8192,
54
+ "max_topk": 256,
55
+ "n_active_tokens": 8192,
56
+ "neuronxcc_version": "2.21.33363.0+82129205",
57
+ "on_device_sampling": true,
58
+ "optimum_neuron_version": "0.4.6.dev3",
59
+ "output_logits": false,
60
+ "pp_degree": 1,
61
+ "sequence_length": 8192,
62
+ "speculation_length": 0,
63
+ "start_rank_id": 0,
64
+ "target": "trn1",
65
+ "torch_dtype": "bfloat16",
66
+ "tp_degree": 2
67
+ },
68
+ "num_attention_heads": 4,
69
+ "num_hidden_layers": 18,
70
+ "num_key_value_heads": 1,
71
+ "query_pre_attn_scalar": 256,
72
+ "rms_norm_eps": 1e-06,
73
+ "rope_local_base_freq": 10000.0,
74
+ "rope_scaling": null,
75
+ "rope_theta": 1000000.0,
76
+ "sliding_window": 512,
77
+ "unsloth_fixed": true,
78
+ "use_bidirectional_attention": false,
79
+ "use_cache": true,
80
+ "vocab_size": 262144
81
+ }
neuronxcc-2.21.33363.0+82129205/MODULE_17476209562158013765+e30acd3a/model.neff CHANGED
Binary files a/neuronxcc-2.21.33363.0+82129205/MODULE_17476209562158013765+e30acd3a/model.neff and b/neuronxcc-2.21.33363.0+82129205/MODULE_17476209562158013765+e30acd3a/model.neff differ
 
neuronxcc-2.21.33363.0+82129205/MODULE_1980033719e8e5ff938d+9462c5c2/compile_flags.json ADDED
@@ -0,0 +1 @@
 
 
1
+ ["--target=trn1", "--enable-saturate-infinity", "--auto-cast=none", "--model-type=transformer", "-O1", "--logfile=/tmp/nxdi_test_ae3de8dc-521b-489e-b0f7-8de4a42742e5/compiler_workdir/NewAttentionBlock/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"]
neuronxcc-2.21.33363.0+82129205/MODULE_1980033719e8e5ff938d+9462c5c2/model.done ADDED
File without changes
neuronxcc-2.21.33363.0+82129205/MODULE_1980033719e8e5ff938d+9462c5c2/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f409d8cc6bc5037c585be1e7ac4f332ca2d5938432853ee512e99ced1ae7345f
3
+ size 8611
neuronxcc-2.21.33363.0+82129205/MODULE_1980033719e8e5ff938d+9462c5c2/model.neff ADDED
Binary file (82.9 kB). View file
 
neuronxcc-2.21.33363.0+82129205/MODULE_3ae38b2f10558b767b68+45415967/compile_flags.json ADDED
@@ -0,0 +1 @@
 
 
1
+ ["--target=trn1", "--enable-saturate-infinity", "--auto-cast=none", "--model-type=transformer", "-O1", "--logfile=/tmp/nxdi_test_55003c3e-af6c-4439-9d6e-9c570991aeb3/compiler_workdir/OldSoftmaxModule/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"]
neuronxcc-2.21.33363.0+82129205/MODULE_3ae38b2f10558b767b68+45415967/model.done ADDED
File without changes
neuronxcc-2.21.33363.0+82129205/MODULE_3ae38b2f10558b767b68+45415967/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5114d4a4b6883064dcb776ed5bd26ee295ba206bf9cfbe32191a6df351c35e1e
3
+ size 4581
neuronxcc-2.21.33363.0+82129205/MODULE_3ae38b2f10558b767b68+45415967/model.neff ADDED
Binary file (42 kB). View file
 
neuronxcc-2.21.33363.0+82129205/MODULE_4e68975fa752b951c6f0+c4c89da0/compile_flags.json ADDED
@@ -0,0 +1 @@
 
 
1
+ ["--target=trn1", "--enable-saturate-infinity", "--auto-cast=none", "--model-type=transformer", "-O1", "--logfile=/tmp/nxdi_test_6cad8bdf-58af-41ad-8549-f9f413408e7f/compiler_workdir/NewSoftmaxModule/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"]
neuronxcc-2.21.33363.0+82129205/MODULE_4e68975fa752b951c6f0+c4c89da0/model.done ADDED
File without changes
neuronxcc-2.21.33363.0+82129205/MODULE_4e68975fa752b951c6f0+c4c89da0/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:db2e93fef39637b2e7d1ceb514fa3024d9836275bca2d538f49802342c231f0e
3
+ size 5471
neuronxcc-2.21.33363.0+82129205/MODULE_4e68975fa752b951c6f0+c4c89da0/model.neff ADDED
Binary file (42 kB). View file
 
neuronxcc-2.21.33363.0+82129205/MODULE_526995fbc83a4a64429c+5a3ee265/compile_flags.json ADDED
@@ -0,0 +1 @@
 
 
1
+ ["--target=trn1", "--enable-saturate-infinity", "--auto-cast=none", "--model-type=transformer", "-O1", "--logfile=/tmp/nxdi_test_fb164dc3-f066-411a-a8fd-746da0c9bf29/compiler_workdir/OldAttentionBlock/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"]
neuronxcc-2.21.33363.0+82129205/MODULE_526995fbc83a4a64429c+5a3ee265/model.done ADDED
File without changes
neuronxcc-2.21.33363.0+82129205/MODULE_526995fbc83a4a64429c+5a3ee265/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5257f6d788833b506fbb149a4f7b96779ca2ed998a12765781b35e1b7f4ec017
3
+ size 7691
neuronxcc-2.21.33363.0+82129205/MODULE_526995fbc83a4a64429c+5a3ee265/model.neff ADDED
Binary file (72.7 kB). View file
 
neuronxcc-2.21.33363.0+82129205/MODULE_8b48097eaa2ae85e1c16+48fd059c/compile_flags.json ADDED
@@ -0,0 +1 @@
 
 
1
+ ["--target=trn1", "--enable-saturate-infinity", "--auto-cast=none", "--model-type=transformer", "-O1", "--logfile=/tmp/nxdi_test_b8301d09-8942-4560-aa05-f878496ccc01/compiler_workdir/NewAttentionBlock/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"]
neuronxcc-2.21.33363.0+82129205/MODULE_8b48097eaa2ae85e1c16+48fd059c/model.done ADDED
File without changes
neuronxcc-2.21.33363.0+82129205/MODULE_8b48097eaa2ae85e1c16+48fd059c/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f409d8cc6bc5037c585be1e7ac4f332ca2d5938432853ee512e99ced1ae7345f
3
+ size 8611
neuronxcc-2.21.33363.0+82129205/MODULE_8b48097eaa2ae85e1c16+48fd059c/model.neff ADDED
Binary file (82.9 kB). View file
 
neuronxcc-2.21.33363.0+82129205/MODULE_952fafb4c315904dcb0e+f2c40fef/compile_flags.json ADDED
@@ -0,0 +1 @@
 
 
1
+ ["--target=trn1", "--enable-saturate-infinity", "--auto-cast=none", "--model-type=transformer", "-O1", "--logfile=/tmp/nxdi_test_a8de0c8f-5baf-485b-afeb-d86316569c80/compiler_workdir/ScaledQKComparisonModule/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"]
neuronxcc-2.21.33363.0+82129205/MODULE_952fafb4c315904dcb0e+f2c40fef/model.done ADDED
File without changes
neuronxcc-2.21.33363.0+82129205/MODULE_952fafb4c315904dcb0e+f2c40fef/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:138b427bf7769ac62d72b0c008b58065b93c16f2f09976be109e29ef90de7854
3
+ size 4940
neuronxcc-2.21.33363.0+82129205/MODULE_952fafb4c315904dcb0e+f2c40fef/model.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:318f983d6956631fa0b8d49cd12366f749070eebd7e9a7b6d7be6545b7ff5997
3
+ size 390144
neuronxcc-2.21.33363.0+82129205/MODULE_c5bb11161997e6aa48a1+a02c3a36/model.hlo_module.pb CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e95f5492fef1d5ad43e4a1b4416793874f6d0ba40e0ab4a77108d39e8741dc78
3
  size 586366
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:906e54fd0845481cd8e557aa253fbb18b9f71a3032ab259e9212591290afcf44
3
  size 586366
neuronxcc-2.21.33363.0+82129205/MODULE_c5bb11161997e6aa48a1+a02c3a36/model.neff CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7b0aef01c52aa301d7843faf5544f0da2c3828857f90a7691fa20e746a2a98d2
3
  size 1680384
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6110180fe3ea8a5b7f48097e5e386a55599b94768fd6d3c7c14f710dfd78f858
3
  size 1680384
neuronxcc-2.21.33363.0+82129205/MODULE_c5bb11161997e6aa48a1+a02c3a36/wrapped_neff.hlo CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c33fe492e2baf3fabbcde4493553c1ca310fb599ea5b1446592241352c9055ce
3
  size 1802773
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9e4dd3dc7a69530934ceeb5d9aa72380371611786ac96c9f55a167e7ded19372
3
  size 1802773
neuronxcc-2.21.33363.0+82129205/MODULE_d617d5a80725dd447538+37d32d7c/compile_flags.json ADDED
@@ -0,0 +1 @@
 
 
1
+ ["--target=trn1", "--enable-saturate-infinity", "--auto-cast=none", "--model-type=transformer", "-O1", "--logfile=/tmp/nxdi_test_5cb94fcd-6a90-4e47-9256-fb0d0362f564/compiler_workdir/OldAttentionBlock/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"]
neuronxcc-2.21.33363.0+82129205/MODULE_d617d5a80725dd447538+37d32d7c/model.done ADDED
File without changes
neuronxcc-2.21.33363.0+82129205/MODULE_d617d5a80725dd447538+37d32d7c/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5257f6d788833b506fbb149a4f7b96779ca2ed998a12765781b35e1b7f4ec017
3
+ size 7691
neuronxcc-2.21.33363.0+82129205/MODULE_d617d5a80725dd447538+37d32d7c/model.neff ADDED
Binary file (72.7 kB). View file