Synchronizing local compiler cache.
Browse files- .gitattributes +14 -0
- neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.4.dev2/llama/meta-llama/Llama-3.1-8B-Instruct/88837b9b04ca62ade2e5.json +62 -0
- neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.4.dev2/llama/meta-llama/Llama-3.2-1B-Instruct/184d3988bab3b0aea22a.json +62 -0
- neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.4.dev2/llama/meta-llama/Llama-3.2-1B-Instruct/1aff29ca40a5d84dc158.json +63 -0
- neuronxcc-2.21.33363.0+82129205/MODULE_0c0c570336081d2ddd3c+24129607/compile_flags.json +1 -0
- neuronxcc-2.21.33363.0+82129205/MODULE_0c0c570336081d2ddd3c+24129607/model.done +0 -0
- neuronxcc-2.21.33363.0+82129205/MODULE_0c0c570336081d2ddd3c+24129607/model.hlo_module.pb +3 -0
- neuronxcc-2.21.33363.0+82129205/MODULE_0c0c570336081d2ddd3c+24129607/model.neff +3 -0
- neuronxcc-2.21.33363.0+82129205/MODULE_1ac352f09de58a202958+24129607/compile_flags.json +1 -0
- neuronxcc-2.21.33363.0+82129205/MODULE_1ac352f09de58a202958+24129607/model.done +0 -0
- neuronxcc-2.21.33363.0+82129205/MODULE_1ac352f09de58a202958+24129607/model.hlo_module.pb +3 -0
- neuronxcc-2.21.33363.0+82129205/MODULE_1ac352f09de58a202958+24129607/model.neff +3 -0
- neuronxcc-2.21.33363.0+82129205/MODULE_3127262d3bc119879dfa+24129607/compile_flags.json +1 -0
- neuronxcc-2.21.33363.0+82129205/MODULE_3127262d3bc119879dfa+24129607/model.done +0 -0
- neuronxcc-2.21.33363.0+82129205/MODULE_3127262d3bc119879dfa+24129607/model.hlo_module.pb +3 -0
- neuronxcc-2.21.33363.0+82129205/MODULE_3127262d3bc119879dfa+24129607/model.neff +3 -0
- neuronxcc-2.21.33363.0+82129205/MODULE_85454497bce26576d95d+a02c3a36/compile_flags.json +1 -0
- neuronxcc-2.21.33363.0+82129205/MODULE_85454497bce26576d95d+a02c3a36/model.done +0 -0
- neuronxcc-2.21.33363.0+82129205/MODULE_85454497bce26576d95d+a02c3a36/model.hlo_module.pb +3 -0
- neuronxcc-2.21.33363.0+82129205/MODULE_85454497bce26576d95d+a02c3a36/model.neff +3 -0
- neuronxcc-2.21.33363.0+82129205/MODULE_85454497bce26576d95d+a02c3a36/wrapped_neff.hlo +3 -0
- neuronxcc-2.21.33363.0+82129205/MODULE_9088cab965c880f237a4+a02c3a36/compile_flags.json +1 -0
- neuronxcc-2.21.33363.0+82129205/MODULE_9088cab965c880f237a4+a02c3a36/model.done +0 -0
- neuronxcc-2.21.33363.0+82129205/MODULE_9088cab965c880f237a4+a02c3a36/model.hlo_module.pb +3 -0
- neuronxcc-2.21.33363.0+82129205/MODULE_9088cab965c880f237a4+a02c3a36/model.neff +3 -0
- neuronxcc-2.21.33363.0+82129205/MODULE_9088cab965c880f237a4+a02c3a36/wrapped_neff.hlo +3 -0
- neuronxcc-2.21.33363.0+82129205/MODULE_a7db8b94be5fa8c63086+24129607/compile_flags.json +1 -0
- neuronxcc-2.21.33363.0+82129205/MODULE_a7db8b94be5fa8c63086+24129607/model.done +0 -0
- neuronxcc-2.21.33363.0+82129205/MODULE_a7db8b94be5fa8c63086+24129607/model.hlo_module.pb +3 -0
- neuronxcc-2.21.33363.0+82129205/MODULE_a7db8b94be5fa8c63086+24129607/model.neff +3 -0
- neuronxcc-2.21.33363.0+82129205/MODULE_cafaaccbcb3304f08d70+24129607/compile_flags.json +1 -0
- neuronxcc-2.21.33363.0+82129205/MODULE_cafaaccbcb3304f08d70+24129607/model.done +0 -0
- neuronxcc-2.21.33363.0+82129205/MODULE_cafaaccbcb3304f08d70+24129607/model.hlo_module.pb +3 -0
- neuronxcc-2.21.33363.0+82129205/MODULE_cafaaccbcb3304f08d70+24129607/model.neff +3 -0
- neuronxcc-2.21.33363.0+82129205/MODULE_da1fe9f94d1912f89f98+24129607/compile_flags.json +1 -0
- neuronxcc-2.21.33363.0+82129205/MODULE_da1fe9f94d1912f89f98+24129607/model.done +0 -0
- neuronxcc-2.21.33363.0+82129205/MODULE_da1fe9f94d1912f89f98+24129607/model.hlo_module.pb +3 -0
- neuronxcc-2.21.33363.0+82129205/MODULE_da1fe9f94d1912f89f98+24129607/model.neff +3 -0
- neuronxcc-2.21.33363.0+82129205/MODULE_e423e95ee77bbcfd6982+a02c3a36/compile_flags.json +1 -0
- neuronxcc-2.21.33363.0+82129205/MODULE_e423e95ee77bbcfd6982+a02c3a36/model.done +0 -0
- neuronxcc-2.21.33363.0+82129205/MODULE_e423e95ee77bbcfd6982+a02c3a36/model.hlo_module.pb +3 -0
- neuronxcc-2.21.33363.0+82129205/MODULE_e423e95ee77bbcfd6982+a02c3a36/model.neff +3 -0
- neuronxcc-2.21.33363.0+82129205/MODULE_e423e95ee77bbcfd6982+a02c3a36/wrapped_neff.hlo +3 -0
- neuronxcc-2.21.33363.0+82129205/MODULE_fa675f3a434a3d346112+a02c3a36/compile_flags.json +1 -0
- neuronxcc-2.21.33363.0+82129205/MODULE_fa675f3a434a3d346112+a02c3a36/model.done +0 -0
- neuronxcc-2.21.33363.0+82129205/MODULE_fa675f3a434a3d346112+a02c3a36/model.hlo_module.pb +3 -0
- neuronxcc-2.21.33363.0+82129205/MODULE_fa675f3a434a3d346112+a02c3a36/model.neff +3 -0
- neuronxcc-2.21.33363.0+82129205/MODULE_fa675f3a434a3d346112+a02c3a36/wrapped_neff.hlo +3 -0
.gitattributes
CHANGED
|
@@ -15158,3 +15158,17 @@ neuronxcc-2.21.33363.0+82129205/MODULE_a22c65ba0c6c7a55032b+692b3dff/model.neff
|
|
| 15158 |
neuronxcc-2.21.33363.0+82129205/MODULE_a22c65ba0c6c7a55032b+692b3dff/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text
|
| 15159 |
neuronxcc-2.21.33363.0+82129205/MODULE_dac939ac0fb756b0c5a0+8669224f/model.neff filter=lfs diff=lfs merge=lfs -text
|
| 15160 |
neuronxcc-2.21.33363.0+82129205/MODULE_dac939ac0fb756b0c5a0+8669224f/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 15158 |
neuronxcc-2.21.33363.0+82129205/MODULE_a22c65ba0c6c7a55032b+692b3dff/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text
|
| 15159 |
neuronxcc-2.21.33363.0+82129205/MODULE_dac939ac0fb756b0c5a0+8669224f/model.neff filter=lfs diff=lfs merge=lfs -text
|
| 15160 |
neuronxcc-2.21.33363.0+82129205/MODULE_dac939ac0fb756b0c5a0+8669224f/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text
|
| 15161 |
+
neuronxcc-2.21.33363.0+82129205/MODULE_0c0c570336081d2ddd3c+24129607/model.neff filter=lfs diff=lfs merge=lfs -text
|
| 15162 |
+
neuronxcc-2.21.33363.0+82129205/MODULE_1ac352f09de58a202958+24129607/model.neff filter=lfs diff=lfs merge=lfs -text
|
| 15163 |
+
neuronxcc-2.21.33363.0+82129205/MODULE_3127262d3bc119879dfa+24129607/model.neff filter=lfs diff=lfs merge=lfs -text
|
| 15164 |
+
neuronxcc-2.21.33363.0+82129205/MODULE_85454497bce26576d95d+a02c3a36/model.neff filter=lfs diff=lfs merge=lfs -text
|
| 15165 |
+
neuronxcc-2.21.33363.0+82129205/MODULE_85454497bce26576d95d+a02c3a36/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text
|
| 15166 |
+
neuronxcc-2.21.33363.0+82129205/MODULE_9088cab965c880f237a4+a02c3a36/model.neff filter=lfs diff=lfs merge=lfs -text
|
| 15167 |
+
neuronxcc-2.21.33363.0+82129205/MODULE_9088cab965c880f237a4+a02c3a36/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text
|
| 15168 |
+
neuronxcc-2.21.33363.0+82129205/MODULE_a7db8b94be5fa8c63086+24129607/model.neff filter=lfs diff=lfs merge=lfs -text
|
| 15169 |
+
neuronxcc-2.21.33363.0+82129205/MODULE_cafaaccbcb3304f08d70+24129607/model.neff filter=lfs diff=lfs merge=lfs -text
|
| 15170 |
+
neuronxcc-2.21.33363.0+82129205/MODULE_da1fe9f94d1912f89f98+24129607/model.neff filter=lfs diff=lfs merge=lfs -text
|
| 15171 |
+
neuronxcc-2.21.33363.0+82129205/MODULE_e423e95ee77bbcfd6982+a02c3a36/model.neff filter=lfs diff=lfs merge=lfs -text
|
| 15172 |
+
neuronxcc-2.21.33363.0+82129205/MODULE_e423e95ee77bbcfd6982+a02c3a36/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text
|
| 15173 |
+
neuronxcc-2.21.33363.0+82129205/MODULE_fa675f3a434a3d346112+a02c3a36/model.neff filter=lfs diff=lfs merge=lfs -text
|
| 15174 |
+
neuronxcc-2.21.33363.0+82129205/MODULE_fa675f3a434a3d346112+a02c3a36/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text
|
neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.4.dev2/llama/meta-llama/Llama-3.1-8B-Instruct/88837b9b04ca62ade2e5.json
ADDED
|
@@ -0,0 +1,62 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_entry_class": "SingleModelCacheEntry",
|
| 3 |
+
"_model_id": "meta-llama/Llama-3.1-8B-Instruct",
|
| 4 |
+
"_task": "text-generation",
|
| 5 |
+
"architectures": [
|
| 6 |
+
"LlamaForCausalLM"
|
| 7 |
+
],
|
| 8 |
+
"attention_bias": false,
|
| 9 |
+
"attention_dropout": 0.0,
|
| 10 |
+
"dtype": "bfloat16",
|
| 11 |
+
"head_dim": 128,
|
| 12 |
+
"hidden_act": "silu",
|
| 13 |
+
"hidden_size": 4096,
|
| 14 |
+
"initializer_range": 0.02,
|
| 15 |
+
"intermediate_size": 14336,
|
| 16 |
+
"max_position_embeddings": 131072,
|
| 17 |
+
"mlp_bias": false,
|
| 18 |
+
"model_type": "llama",
|
| 19 |
+
"neuron": {
|
| 20 |
+
"_serialized_key": "NxDNeuronConfig",
|
| 21 |
+
"batch_size": 1,
|
| 22 |
+
"capacity_factor": null,
|
| 23 |
+
"checkpoint_id": "meta-llama/Llama-3.1-8B-Instruct",
|
| 24 |
+
"checkpoint_revision": "0e9e39f249a16976918f6564b8830bc894c89659",
|
| 25 |
+
"continuous_batching": false,
|
| 26 |
+
"ep_degree": 1,
|
| 27 |
+
"fused_qkv": true,
|
| 28 |
+
"glu_mlp": true,
|
| 29 |
+
"local_ranks_size": 2,
|
| 30 |
+
"max_batch_size": 1,
|
| 31 |
+
"max_context_length": 4096,
|
| 32 |
+
"max_topk": 256,
|
| 33 |
+
"n_active_tokens": 4096,
|
| 34 |
+
"neuronxcc_version": "2.21.33363.0+82129205",
|
| 35 |
+
"on_device_sampling": false,
|
| 36 |
+
"optimum_neuron_version": "0.4.4.dev2",
|
| 37 |
+
"output_logits": false,
|
| 38 |
+
"pp_degree": 1,
|
| 39 |
+
"sequence_length": 4096,
|
| 40 |
+
"speculation_length": 0,
|
| 41 |
+
"start_rank_id": 0,
|
| 42 |
+
"target": "trn1",
|
| 43 |
+
"torch_dtype": "bfloat16",
|
| 44 |
+
"tp_degree": 2
|
| 45 |
+
},
|
| 46 |
+
"num_attention_heads": 32,
|
| 47 |
+
"num_hidden_layers": 32,
|
| 48 |
+
"num_key_value_heads": 8,
|
| 49 |
+
"pretraining_tp": 1,
|
| 50 |
+
"rms_norm_eps": 1e-05,
|
| 51 |
+
"rope_scaling": {
|
| 52 |
+
"factor": 8.0,
|
| 53 |
+
"high_freq_factor": 4.0,
|
| 54 |
+
"low_freq_factor": 1.0,
|
| 55 |
+
"original_max_position_embeddings": 8192,
|
| 56 |
+
"rope_type": "llama3"
|
| 57 |
+
},
|
| 58 |
+
"rope_theta": 500000.0,
|
| 59 |
+
"tie_word_embeddings": false,
|
| 60 |
+
"use_cache": true,
|
| 61 |
+
"vocab_size": 128256
|
| 62 |
+
}
|
neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.4.dev2/llama/meta-llama/Llama-3.2-1B-Instruct/184d3988bab3b0aea22a.json
ADDED
|
@@ -0,0 +1,62 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_entry_class": "SingleModelCacheEntry",
|
| 3 |
+
"_model_id": "meta-llama/Llama-3.2-1B-Instruct",
|
| 4 |
+
"_task": "text-generation",
|
| 5 |
+
"architectures": [
|
| 6 |
+
"LlamaForCausalLM"
|
| 7 |
+
],
|
| 8 |
+
"attention_bias": false,
|
| 9 |
+
"attention_dropout": 0.0,
|
| 10 |
+
"dtype": "bfloat16",
|
| 11 |
+
"head_dim": 64,
|
| 12 |
+
"hidden_act": "silu",
|
| 13 |
+
"hidden_size": 2048,
|
| 14 |
+
"initializer_range": 0.02,
|
| 15 |
+
"intermediate_size": 8192,
|
| 16 |
+
"max_position_embeddings": 131072,
|
| 17 |
+
"mlp_bias": false,
|
| 18 |
+
"model_type": "llama",
|
| 19 |
+
"neuron": {
|
| 20 |
+
"_serialized_key": "NxDNeuronConfig",
|
| 21 |
+
"batch_size": 1,
|
| 22 |
+
"capacity_factor": null,
|
| 23 |
+
"checkpoint_id": "meta-llama/Llama-3.2-1B-Instruct",
|
| 24 |
+
"checkpoint_revision": "9213176726f574b556790deb65791e0c5aa438b6",
|
| 25 |
+
"continuous_batching": false,
|
| 26 |
+
"ep_degree": 1,
|
| 27 |
+
"fused_qkv": true,
|
| 28 |
+
"glu_mlp": true,
|
| 29 |
+
"local_ranks_size": 2,
|
| 30 |
+
"max_batch_size": 1,
|
| 31 |
+
"max_context_length": 8192,
|
| 32 |
+
"max_topk": 256,
|
| 33 |
+
"n_active_tokens": 8192,
|
| 34 |
+
"neuronxcc_version": "2.21.33363.0+82129205",
|
| 35 |
+
"on_device_sampling": false,
|
| 36 |
+
"optimum_neuron_version": "0.4.4.dev2",
|
| 37 |
+
"output_logits": false,
|
| 38 |
+
"pp_degree": 1,
|
| 39 |
+
"sequence_length": 8192,
|
| 40 |
+
"speculation_length": 0,
|
| 41 |
+
"start_rank_id": 0,
|
| 42 |
+
"target": "trn1",
|
| 43 |
+
"torch_dtype": "bfloat16",
|
| 44 |
+
"tp_degree": 2
|
| 45 |
+
},
|
| 46 |
+
"num_attention_heads": 32,
|
| 47 |
+
"num_hidden_layers": 16,
|
| 48 |
+
"num_key_value_heads": 8,
|
| 49 |
+
"pretraining_tp": 1,
|
| 50 |
+
"rms_norm_eps": 1e-05,
|
| 51 |
+
"rope_scaling": {
|
| 52 |
+
"factor": 32.0,
|
| 53 |
+
"high_freq_factor": 4.0,
|
| 54 |
+
"low_freq_factor": 1.0,
|
| 55 |
+
"original_max_position_embeddings": 8192,
|
| 56 |
+
"rope_type": "llama3"
|
| 57 |
+
},
|
| 58 |
+
"rope_theta": 500000.0,
|
| 59 |
+
"tie_word_embeddings": true,
|
| 60 |
+
"use_cache": true,
|
| 61 |
+
"vocab_size": 128256
|
| 62 |
+
}
|
neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.4.dev2/llama/meta-llama/Llama-3.2-1B-Instruct/1aff29ca40a5d84dc158.json
ADDED
|
@@ -0,0 +1,63 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_entry_class": "SingleModelCacheEntry",
|
| 3 |
+
"_model_id": "meta-llama/Llama-3.2-1B-Instruct",
|
| 4 |
+
"_task": "text-generation",
|
| 5 |
+
"architectures": [
|
| 6 |
+
"LlamaForCausalLM"
|
| 7 |
+
],
|
| 8 |
+
"attention_bias": false,
|
| 9 |
+
"attention_dropout": 0.0,
|
| 10 |
+
"dtype": "bfloat16",
|
| 11 |
+
"head_dim": 64,
|
| 12 |
+
"hidden_act": "silu",
|
| 13 |
+
"hidden_size": 2048,
|
| 14 |
+
"initializer_range": 0.02,
|
| 15 |
+
"intermediate_size": 8192,
|
| 16 |
+
"max_position_embeddings": 131072,
|
| 17 |
+
"mlp_bias": false,
|
| 18 |
+
"model_type": "llama",
|
| 19 |
+
"neuron": {
|
| 20 |
+
"_serialized_key": "NxDNeuronConfig",
|
| 21 |
+
"batch_size": 1,
|
| 22 |
+
"capacity_factor": null,
|
| 23 |
+
"checkpoint_id": "meta-llama/Llama-3.2-1B-Instruct",
|
| 24 |
+
"checkpoint_revision": "9213176726f574b556790deb65791e0c5aa438b6",
|
| 25 |
+
"continuous_batching": false,
|
| 26 |
+
"ep_degree": 1,
|
| 27 |
+
"fused_qkv": true,
|
| 28 |
+
"glu_mlp": true,
|
| 29 |
+
"local_ranks_size": 2,
|
| 30 |
+
"max_batch_size": 1,
|
| 31 |
+
"max_context_length": 8192,
|
| 32 |
+
"max_topk": 256,
|
| 33 |
+
"n_active_tokens": 8192,
|
| 34 |
+
"neuronxcc_version": "2.21.33363.0+82129205",
|
| 35 |
+
"on_device_sampling": false,
|
| 36 |
+
"optimum_neuron_version": "0.4.4.dev2",
|
| 37 |
+
"output_logits": false,
|
| 38 |
+
"pp_degree": 1,
|
| 39 |
+
"sequence_length": 8192,
|
| 40 |
+
"sequence_parallel_enabled": true,
|
| 41 |
+
"speculation_length": 0,
|
| 42 |
+
"start_rank_id": 0,
|
| 43 |
+
"target": "trn1",
|
| 44 |
+
"torch_dtype": "bfloat16",
|
| 45 |
+
"tp_degree": 2
|
| 46 |
+
},
|
| 47 |
+
"num_attention_heads": 32,
|
| 48 |
+
"num_hidden_layers": 16,
|
| 49 |
+
"num_key_value_heads": 8,
|
| 50 |
+
"pretraining_tp": 1,
|
| 51 |
+
"rms_norm_eps": 1e-05,
|
| 52 |
+
"rope_scaling": {
|
| 53 |
+
"factor": 32.0,
|
| 54 |
+
"high_freq_factor": 4.0,
|
| 55 |
+
"low_freq_factor": 1.0,
|
| 56 |
+
"original_max_position_embeddings": 8192,
|
| 57 |
+
"rope_type": "llama3"
|
| 58 |
+
},
|
| 59 |
+
"rope_theta": 500000.0,
|
| 60 |
+
"tie_word_embeddings": true,
|
| 61 |
+
"use_cache": true,
|
| 62 |
+
"vocab_size": 128256
|
| 63 |
+
}
|
neuronxcc-2.21.33363.0+82129205/MODULE_0c0c570336081d2ddd3c+24129607/compile_flags.json
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding/_tp0_bk0/log-neuron-cc.txt"]
|
neuronxcc-2.21.33363.0+82129205/MODULE_0c0c570336081d2ddd3c+24129607/model.done
ADDED
|
File without changes
|
neuronxcc-2.21.33363.0+82129205/MODULE_0c0c570336081d2ddd3c+24129607/model.hlo_module.pb
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:19f928de65496854001ada7e5e53a70b74032c92d33e8c48710fb591fb579ccc
|
| 3 |
+
size 434848
|
neuronxcc-2.21.33363.0+82129205/MODULE_0c0c570336081d2ddd3c+24129607/model.neff
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3d8c21ed45fb889dd1b85413d67e9ff34d25354073330931cc7bceb2f401e862
|
| 3 |
+
size 114985984
|
neuronxcc-2.21.33363.0+82129205/MODULE_1ac352f09de58a202958+24129607/compile_flags.json
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding/_tp0_bk0/log-neuron-cc.txt"]
|
neuronxcc-2.21.33363.0+82129205/MODULE_1ac352f09de58a202958+24129607/model.done
ADDED
|
File without changes
|
neuronxcc-2.21.33363.0+82129205/MODULE_1ac352f09de58a202958+24129607/model.hlo_module.pb
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8f0a59f05f75f44d4f152165dd1498bbacd1bb716a5038c4edefa78073442b0c
|
| 3 |
+
size 928451
|
neuronxcc-2.21.33363.0+82129205/MODULE_1ac352f09de58a202958+24129607/model.neff
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:576906166482527d7ac353da0534e8fe32fa597ef3ab1f5c105a0538e3da863a
|
| 3 |
+
size 41851904
|
neuronxcc-2.21.33363.0+82129205/MODULE_3127262d3bc119879dfa+24129607/compile_flags.json
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding/_tp0_bk0/log-neuron-cc.txt"]
|
neuronxcc-2.21.33363.0+82129205/MODULE_3127262d3bc119879dfa+24129607/model.done
ADDED
|
File without changes
|
neuronxcc-2.21.33363.0+82129205/MODULE_3127262d3bc119879dfa+24129607/model.hlo_module.pb
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9e2d78445e08d3210569f8562c247dacd71c96303252860c4275cd1aa5223c24
|
| 3 |
+
size 465940
|
neuronxcc-2.21.33363.0+82129205/MODULE_3127262d3bc119879dfa+24129607/model.neff
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bf958b8008d117987b44745851fca69111ec2ac1ab25578a16fed03f2580b530
|
| 3 |
+
size 114279424
|
neuronxcc-2.21.33363.0+82129205/MODULE_85454497bce26576d95d+a02c3a36/compile_flags.json
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"]
|
neuronxcc-2.21.33363.0+82129205/MODULE_85454497bce26576d95d+a02c3a36/model.done
ADDED
|
File without changes
|
neuronxcc-2.21.33363.0+82129205/MODULE_85454497bce26576d95d+a02c3a36/model.hlo_module.pb
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c2941ff5bfa2ac33683363d48b44dd5eb9a7930bd31fdea40bf832b3cadc2e25
|
| 3 |
+
size 769257
|
neuronxcc-2.21.33363.0+82129205/MODULE_85454497bce26576d95d+a02c3a36/model.neff
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1b7f6ea5e68057a9d5ad76e682963091a6503e49155f4c601cbd9c31a835d58c
|
| 3 |
+
size 8899584
|
neuronxcc-2.21.33363.0+82129205/MODULE_85454497bce26576d95d+a02c3a36/wrapped_neff.hlo
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3692add274fc47e40761a3044d5e14815585874653cfb04fcb9a420478d78c18
|
| 3 |
+
size 9047399
|
neuronxcc-2.21.33363.0+82129205/MODULE_9088cab965c880f237a4+a02c3a36/compile_flags.json
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"]
|
neuronxcc-2.21.33363.0+82129205/MODULE_9088cab965c880f237a4+a02c3a36/model.done
ADDED
|
File without changes
|
neuronxcc-2.21.33363.0+82129205/MODULE_9088cab965c880f237a4+a02c3a36/model.hlo_module.pb
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3f3742f0d123d956d174e40c072a858a13a03ef258da8f2056da95bbed4653ab
|
| 3 |
+
size 756502
|
neuronxcc-2.21.33363.0+82129205/MODULE_9088cab965c880f237a4+a02c3a36/model.neff
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:95a2b18be62bf42c74fa32c3167d04500cd5dcf04213099083be59e17ef89ee8
|
| 3 |
+
size 6902784
|
neuronxcc-2.21.33363.0+82129205/MODULE_9088cab965c880f237a4+a02c3a36/wrapped_neff.hlo
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3fa0f993403352abd4aad1c6397c69b3cb2599e47624d4b32fa8fa0c3e2f4560
|
| 3 |
+
size 7050133
|
neuronxcc-2.21.33363.0+82129205/MODULE_a7db8b94be5fa8c63086+24129607/compile_flags.json
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding/_tp0_bk0/log-neuron-cc.txt"]
|
neuronxcc-2.21.33363.0+82129205/MODULE_a7db8b94be5fa8c63086+24129607/model.done
ADDED
|
File without changes
|
neuronxcc-2.21.33363.0+82129205/MODULE_a7db8b94be5fa8c63086+24129607/model.hlo_module.pb
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:aff7812e7179908192c31870402bb39536413f49103f4d67f6d7f204f3e5185f
|
| 3 |
+
size 972333
|
neuronxcc-2.21.33363.0+82129205/MODULE_a7db8b94be5fa8c63086+24129607/model.neff
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f0c7cfabffc71aff561f9f1a1a4f12dbbe2c485599f7f1c0c901469bef84860d
|
| 3 |
+
size 41892864
|
neuronxcc-2.21.33363.0+82129205/MODULE_cafaaccbcb3304f08d70+24129607/compile_flags.json
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding/_tp0_bk0/log-neuron-cc.txt"]
|
neuronxcc-2.21.33363.0+82129205/MODULE_cafaaccbcb3304f08d70+24129607/model.done
ADDED
|
File without changes
|
neuronxcc-2.21.33363.0+82129205/MODULE_cafaaccbcb3304f08d70+24129607/model.hlo_module.pb
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f9a75d6679d5de1f5062dfddb72d5621e645bc2830fdb1b70c65529e581d9cd0
|
| 3 |
+
size 505502
|
neuronxcc-2.21.33363.0+82129205/MODULE_cafaaccbcb3304f08d70+24129607/model.neff
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:549f16d4c19caabedc4e743121854d85ce13e58b9deed7463efd5706da06c9e7
|
| 3 |
+
size 114074624
|
neuronxcc-2.21.33363.0+82129205/MODULE_da1fe9f94d1912f89f98+24129607/compile_flags.json
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding/_tp0_bk0/log-neuron-cc.txt"]
|
neuronxcc-2.21.33363.0+82129205/MODULE_da1fe9f94d1912f89f98+24129607/model.done
ADDED
|
File without changes
|
neuronxcc-2.21.33363.0+82129205/MODULE_da1fe9f94d1912f89f98+24129607/model.hlo_module.pb
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1239ef1590682b574cd985d60ca0602fb970b86e4a717dc3a70cb4afaaabb860
|
| 3 |
+
size 869444
|
neuronxcc-2.21.33363.0+82129205/MODULE_da1fe9f94d1912f89f98+24129607/model.neff
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1872dff540e41af1855780dc910589f7bfcdf22983d14413e19ffcc5ca6e963f
|
| 3 |
+
size 6616064
|
neuronxcc-2.21.33363.0+82129205/MODULE_e423e95ee77bbcfd6982+a02c3a36/compile_flags.json
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"]
|
neuronxcc-2.21.33363.0+82129205/MODULE_e423e95ee77bbcfd6982+a02c3a36/model.done
ADDED
|
File without changes
|
neuronxcc-2.21.33363.0+82129205/MODULE_e423e95ee77bbcfd6982+a02c3a36/model.hlo_module.pb
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7d3e756d8fcdf483ac9d147d0dd0a09ec65b64b3e8fd6380879fb2315321d65d
|
| 3 |
+
size 395607
|
neuronxcc-2.21.33363.0+82129205/MODULE_e423e95ee77bbcfd6982+a02c3a36/model.neff
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:62664749edfececd6069d80c0fdb784d83afb1bb3838d22a7a6a7a429144b4db
|
| 3 |
+
size 2171904
|
neuronxcc-2.21.33363.0+82129205/MODULE_e423e95ee77bbcfd6982+a02c3a36/wrapped_neff.hlo
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:63cf62f2c48a4f9cde1e8da4213d91c7a2fe5f7debbf1d62ee79f1ebc70a3c66
|
| 3 |
+
size 2245876
|
neuronxcc-2.21.33363.0+82129205/MODULE_fa675f3a434a3d346112+a02c3a36/compile_flags.json
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"]
|
neuronxcc-2.21.33363.0+82129205/MODULE_fa675f3a434a3d346112+a02c3a36/model.done
ADDED
|
File without changes
|
neuronxcc-2.21.33363.0+82129205/MODULE_fa675f3a434a3d346112+a02c3a36/model.hlo_module.pb
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e56bcad5523a0e96e80ff0aad4077fb4427df4e57058d493e20a6511c91c9449
|
| 3 |
+
size 799960
|
neuronxcc-2.21.33363.0+82129205/MODULE_fa675f3a434a3d346112+a02c3a36/model.neff
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b566d1ca9bbe809614e9c072e9e909f8c8ceb89ff61085c391bce4f157564943
|
| 3 |
+
size 6872064
|
neuronxcc-2.21.33363.0+82129205/MODULE_fa675f3a434a3d346112+a02c3a36/wrapped_neff.hlo
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7bf109196d8338da1e36f5ecd489bc4f0483167a41755481ae26722ae50d6a46
|
| 3 |
+
size 7019528
|