diff --git a/.gitattributes b/.gitattributes index ed253ba40fe7ae48a21600006f716f18c66dc729..7627a4e1ab52235ef973f09f2a4771b0d9293155 100644 --- a/.gitattributes +++ b/.gitattributes @@ -7141,3 +7141,24 @@ neuronxcc-2.21.33363.0+82129205/MODULE_50933980a498d1588ed1+a02c3a36/wrapped_nef neuronxcc-2.21.33363.0+82129205/MODULE_120ca30bc72b9b137b57+6170d8e1/model.neff filter=lfs diff=lfs merge=lfs -text neuronxcc-2.21.33363.0+82129205/MODULE_68b1b688bc907867445e+a02c3a36/model.neff filter=lfs diff=lfs merge=lfs -text neuronxcc-2.21.33363.0+82129205/MODULE_68b1b688bc907867445e+a02c3a36/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_0007bf645cd8f44068db+a02c3a36/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_0007bf645cd8f44068db+a02c3a36/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_404621bbb97f199be5e0+f077467b/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_404621bbb97f199be5e0+f077467b/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_8025f9b606fa6335fe08+a32116a7/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_a25a39b4c41e8b2cde6e+6170d8e1/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_a8db5771dcb730ef5627+3794e5d6/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_a8db5771dcb730ef5627+3794e5d6/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_a91a06f2317ad34aad7f+ac10809c/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_a91a06f2317ad34aad7f+ac10809c/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_bfde8ebf354636b209da+24129607/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_c30315f06032f1c043d1+30e2d3d0/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_c30315f06032f1c043d1+30e2d3d0/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_df184b2f6028b6fccfdc+db16d357/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_df184b2f6028b6fccfdc+db16d357/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_e737e0fdb56bf5bd26fc+a02c3a36/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_e737e0fdb56bf5bd26fc+a02c3a36/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_ef4584e237468f2869e3+dd1b78ca/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_ef4584e237468f2869e3+dd1b78ca/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_fb23d3cbf7cf9571e3f2+0338459e/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_fb23d3cbf7cf9571e3f2+0338459e/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text diff --git a/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.6.dev3/2da7a00f0478d50ae1e7f75f085c5b2773b5f355f427c61cf34cb6febd629d96/6b7aebc14c435ae3db63.json b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.6.dev3/2da7a00f0478d50ae1e7f75f085c5b2773b5f355f427c61cf34cb6febd629d96/6b7aebc14c435ae3db63.json new file mode 100644 index 0000000000000000000000000000000000000000..18b3dd814a9962d736002ffa618954a880743a90 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.6.dev3/2da7a00f0478d50ae1e7f75f085c5b2773b5f355f427c61cf34cb6febd629d96/6b7aebc14c435ae3db63.json @@ -0,0 +1,60 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "yujiepan/phi-4-tiny-random", + "_task": "text-generation", + "architectures": [ + "Phi3ForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "auto_map": {}, + "dtype": "bfloat16", + "embd_pdrop": 0.0, + "hidden_act": "silu", + "hidden_size": 16, + "initializer_range": 0.02, + "intermediate_size": 32, + "max_position_embeddings": 16384, + "model_type": "phi3", + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "batch_size": 1, + "capacity_factor": null, + "checkpoint_id": "yujiepan/phi-4-tiny-random", + "checkpoint_revision": "18a9a1168dc97ac6d128f811925670c275610f5a", + "continuous_batching": false, + "ep_degree": 1, + "fused_qkv": true, + "glu_mlp": true, + "local_ranks_size": 2, + "max_batch_size": 1, + "max_context_length": 1024, + "max_topk": 256, + "n_active_tokens": 1024, + "neuronxcc_version": "2.21.33363.0+82129205", + "on_device_sampling": true, + "optimum_neuron_version": "0.4.6.dev3", + "output_logits": false, + "pp_degree": 1, + "prefill_chunk_size": 0, + "sequence_length": 1024, + "speculation_length": 0, + "start_rank_id": 0, + "target": "trn1", + "torch_dtype": "bfloat16", + "tp_degree": 2 + }, + "num_attention_heads": 2, + "num_hidden_layers": 2, + "num_key_value_heads": 1, + "original_max_position_embeddings": 16384, + "partial_rotary_factor": 1.0, + "resid_pdrop": 0.0, + "rms_norm_eps": 1e-05, + "rope_scaling": null, + "rope_theta": 250000, + "sliding_window": null, + "tie_word_embeddings": false, + "use_cache": true, + "vocab_size": 100352 +} \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.6.dev3/441269935591cad8d370e512c0b93cdd2fce6247c40e5a4866d872ee5338b0de/e912866445bcdd7bd532.json b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.6.dev3/441269935591cad8d370e512c0b93cdd2fce6247c40e5a4866d872ee5338b0de/e912866445bcdd7bd532.json new file mode 100644 index 0000000000000000000000000000000000000000..03661a7fc14cabd01210526826a45c47c1b0c931 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.6.dev3/441269935591cad8d370e512c0b93cdd2fce6247c40e5a4866d872ee5338b0de/e912866445bcdd7bd532.json @@ -0,0 +1,82 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "unsloth/gemma-3-270m-it", + "_sliding_window_pattern": 6, + "_task": "text-generation", + "architectures": [ + "Gemma3ForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "attn_logit_softcapping": null, + "dtype": "bfloat16", + "final_logit_softcapping": null, + "head_dim": 256, + "hidden_activation": "gelu_pytorch_tanh", + "hidden_size": 640, + "initializer_range": 0.02, + "intermediate_size": 2048, + "layer_types": [ + "sliding_attention", + "sliding_attention", + "sliding_attention", + "sliding_attention", + "sliding_attention", + "full_attention", + "sliding_attention", + "sliding_attention", + "sliding_attention", + "sliding_attention", + "sliding_attention", + "full_attention", + "sliding_attention", + "sliding_attention", + "sliding_attention", + "sliding_attention", + "sliding_attention", + "full_attention" + ], + "max_position_embeddings": 32768, + "model_type": "gemma3_text", + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "batch_size": 1, + "capacity_factor": null, + "checkpoint_id": "unsloth/gemma-3-270m-it", + "checkpoint_revision": "23cf460f6bb16954176b3ddcc8d4f250501458a9", + "continuous_batching": false, + "ep_degree": 1, + "fused_qkv": true, + "glu_mlp": true, + "local_ranks_size": 2, + "max_batch_size": 1, + "max_context_length": 1024, + "max_topk": 256, + "n_active_tokens": 1024, + "neuronxcc_version": "2.21.33363.0+82129205", + "on_device_sampling": true, + "optimum_neuron_version": "0.4.6.dev3", + "output_logits": false, + "pp_degree": 1, + "prefill_chunk_size": 0, + "sequence_length": 1024, + "speculation_length": 0, + "start_rank_id": 0, + "target": "trn1", + "torch_dtype": "bfloat16", + "tp_degree": 2 + }, + "num_attention_heads": 4, + "num_hidden_layers": 18, + "num_key_value_heads": 1, + "query_pre_attn_scalar": 256, + "rms_norm_eps": 1e-06, + "rope_local_base_freq": 10000.0, + "rope_scaling": null, + "rope_theta": 1000000.0, + "sliding_window": 512, + "unsloth_fixed": true, + "use_bidirectional_attention": false, + "use_cache": true, + "vocab_size": 262144 +} \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.6.dev3/4ab8140bc7eb4a553d95855c5c2be2cf8c0fbab21b823d76183b6f51e98b6fc5/1171cdc1e0668ecced1b.json b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.6.dev3/4ab8140bc7eb4a553d95855c5c2be2cf8c0fbab21b823d76183b6f51e98b6fc5/1171cdc1e0668ecced1b.json new file mode 100644 index 0000000000000000000000000000000000000000..83a4adbcfbfb3249b20ca9428c1d2b331cde40ac --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.6.dev3/4ab8140bc7eb4a553d95855c5c2be2cf8c0fbab21b823d76183b6f51e98b6fc5/1171cdc1e0668ecced1b.json @@ -0,0 +1,59 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "dacorvo/Mixtral-tiny", + "_task": "text-generation", + "architectures": [ + "MixtralForCausalLM" + ], + "attention_dropout": 0.0, + "dtype": "float16", + "head_dim": 32, + "hidden_act": "silu", + "hidden_size": 1024, + "initializer_range": 0.02, + "intermediate_size": 3584, + "max_position_embeddings": 1024, + "model_type": "mixtral", + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "batch_size": 1, + "capacity_factor": null, + "checkpoint_id": "dacorvo/Mixtral-tiny", + "checkpoint_revision": "c557ba205ddff6ea911f4719e0d543d6c08356b6", + "continuous_batching": false, + "ep_degree": 1, + "fused_qkv": false, + "glu_mlp": true, + "local_ranks_size": 2, + "max_batch_size": 1, + "max_context_length": 1024, + "max_topk": 256, + "n_active_tokens": 1024, + "neuronxcc_version": "2.21.33363.0+82129205", + "on_device_sampling": false, + "optimum_neuron_version": "0.4.6.dev3", + "output_logits": false, + "pp_degree": 1, + "prefill_chunk_size": 0, + "sequence_length": 1024, + "speculation_length": 0, + "start_rank_id": 0, + "target": "trn1", + "torch_dtype": "float16", + "tp_degree": 2 + }, + "num_attention_heads": 32, + "num_experts_per_tok": 2, + "num_hidden_layers": 2, + "num_key_value_heads": 8, + "num_local_experts": 8, + "output_router_logits": false, + "rms_norm_eps": 1e-05, + "rope_theta": 10000.0, + "router_aux_loss_coef": 0.001, + "router_jitter_noise": 0.0, + "sliding_window": 4096, + "tie_word_embeddings": false, + "use_cache": true, + "vocab_size": 32000 +} \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.6.dev3/6454afdf3e9d66c7226c13a575b718845c25e53b0699600ba2bb4f883e9d841b/4b6c7416e39455d1ad2e.json b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.6.dev3/6454afdf3e9d66c7226c13a575b718845c25e53b0699600ba2bb4f883e9d841b/4b6c7416e39455d1ad2e.json new file mode 100644 index 0000000000000000000000000000000000000000..edf2e32a3ffa22640ab356b9183dd230e3eae002 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.6.dev3/6454afdf3e9d66c7226c13a575b718845c25e53b0699600ba2bb4f883e9d841b/4b6c7416e39455d1ad2e.json @@ -0,0 +1,63 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "llamafactory/tiny-random-Llama-3", + "_task": "text-generation", + "architectures": [ + "LlamaForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "dtype": "float16", + "head_dim": 4, + "hidden_act": "silu", + "hidden_size": 16, + "initializer_range": 0.02, + "intermediate_size": 64, + "max_position_embeddings": 131072, + "mlp_bias": false, + "model_type": "llama", + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "batch_size": 1, + "capacity_factor": null, + "checkpoint_id": "llamafactory/tiny-random-Llama-3", + "checkpoint_revision": "bf2a2e3bf199ad2ee96f02a3c00246c608db22a8", + "continuous_batching": false, + "ep_degree": 1, + "fused_qkv": true, + "glu_mlp": true, + "local_ranks_size": 2, + "max_batch_size": 1, + "max_context_length": 512, + "max_topk": 256, + "n_active_tokens": 512, + "neuronxcc_version": "2.21.33363.0+82129205", + "on_device_sampling": true, + "optimum_neuron_version": "0.4.6.dev3", + "output_logits": false, + "pp_degree": 1, + "prefill_chunk_size": 0, + "sequence_length": 512, + "speculation_length": 0, + "start_rank_id": 0, + "target": "trn1", + "torch_dtype": "float16", + "tp_degree": 2 + }, + "num_attention_heads": 4, + "num_hidden_layers": 2, + "num_key_value_heads": 4, + "pretraining_tp": 1, + "rms_norm_eps": 1e-05, + "rope_scaling": { + "factor": 8.0, + "high_freq_factor": 4.0, + "low_freq_factor": 1.0, + "original_max_position_embeddings": 8192, + "rope_type": "llama3" + }, + "rope_theta": 500000.0, + "tie_word_embeddings": false, + "use_cache": true, + "vocab_size": 128256 +} \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.6.dev3/6454afdf3e9d66c7226c13a575b718845c25e53b0699600ba2bb4f883e9d841b/5d5179e2ac0b724548b0.json b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.6.dev3/6454afdf3e9d66c7226c13a575b718845c25e53b0699600ba2bb4f883e9d841b/5d5179e2ac0b724548b0.json new file mode 100644 index 0000000000000000000000000000000000000000..d58e4598a93c1e6ceea114a81e737328e822c003 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.6.dev3/6454afdf3e9d66c7226c13a575b718845c25e53b0699600ba2bb4f883e9d841b/5d5179e2ac0b724548b0.json @@ -0,0 +1,63 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "llamafactory/tiny-random-Llama-3", + "_task": "text-generation", + "architectures": [ + "LlamaForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "dtype": "float16", + "head_dim": 4, + "hidden_act": "silu", + "hidden_size": 16, + "initializer_range": 0.02, + "intermediate_size": 64, + "max_position_embeddings": 131072, + "mlp_bias": false, + "model_type": "llama", + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "batch_size": 1, + "capacity_factor": null, + "checkpoint_id": "llamafactory/tiny-random-Llama-3", + "checkpoint_revision": "bf2a2e3bf199ad2ee96f02a3c00246c608db22a8", + "continuous_batching": false, + "ep_degree": 1, + "fused_qkv": true, + "glu_mlp": true, + "local_ranks_size": 2, + "max_batch_size": 1, + "max_context_length": 1024, + "max_topk": 256, + "n_active_tokens": 1024, + "neuronxcc_version": "2.21.33363.0+82129205", + "on_device_sampling": true, + "optimum_neuron_version": "0.4.6.dev3", + "output_logits": false, + "pp_degree": 1, + "prefill_chunk_size": 0, + "sequence_length": 1024, + "speculation_length": 0, + "start_rank_id": 0, + "target": "trn1", + "torch_dtype": "float16", + "tp_degree": 2 + }, + "num_attention_heads": 4, + "num_hidden_layers": 2, + "num_key_value_heads": 4, + "pretraining_tp": 1, + "rms_norm_eps": 1e-05, + "rope_scaling": { + "factor": 8.0, + "high_freq_factor": 4.0, + "low_freq_factor": 1.0, + "original_max_position_embeddings": 8192, + "rope_type": "llama3" + }, + "rope_theta": 500000.0, + "tie_word_embeddings": false, + "use_cache": true, + "vocab_size": 128256 +} \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.6.dev3/6454afdf3e9d66c7226c13a575b718845c25e53b0699600ba2bb4f883e9d841b/8f8e8c8f417393bfd04a.json b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.6.dev3/6454afdf3e9d66c7226c13a575b718845c25e53b0699600ba2bb4f883e9d841b/8f8e8c8f417393bfd04a.json new file mode 100644 index 0000000000000000000000000000000000000000..5b973fa16a70a24bf31d9634f4f43bb7fc66b3c3 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.6.dev3/6454afdf3e9d66c7226c13a575b718845c25e53b0699600ba2bb4f883e9d841b/8f8e8c8f417393bfd04a.json @@ -0,0 +1,63 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "llamafactory/tiny-random-Llama-3", + "_task": "text-generation", + "architectures": [ + "LlamaForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "dtype": "float16", + "head_dim": 4, + "hidden_act": "silu", + "hidden_size": 16, + "initializer_range": 0.02, + "intermediate_size": 64, + "max_position_embeddings": 131072, + "mlp_bias": false, + "model_type": "llama", + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "batch_size": 2, + "capacity_factor": null, + "checkpoint_id": "llamafactory/tiny-random-Llama-3", + "checkpoint_revision": "bf2a2e3bf199ad2ee96f02a3c00246c608db22a8", + "continuous_batching": true, + "ep_degree": 1, + "fused_qkv": true, + "glu_mlp": true, + "local_ranks_size": 2, + "max_batch_size": 2, + "max_context_length": 128, + "max_topk": 256, + "n_active_tokens": 128, + "neuronxcc_version": "2.21.33363.0+82129205", + "on_device_sampling": true, + "optimum_neuron_version": "0.4.6.dev3", + "output_logits": false, + "pp_degree": 1, + "prefill_chunk_size": 0, + "sequence_length": 128, + "speculation_length": 0, + "start_rank_id": 0, + "target": "trn2", + "torch_dtype": "float16", + "tp_degree": 2 + }, + "num_attention_heads": 4, + "num_hidden_layers": 2, + "num_key_value_heads": 4, + "pretraining_tp": 1, + "rms_norm_eps": 1e-05, + "rope_scaling": { + "factor": 8.0, + "high_freq_factor": 4.0, + "low_freq_factor": 1.0, + "original_max_position_embeddings": 8192, + "rope_type": "llama3" + }, + "rope_theta": 500000.0, + "tie_word_embeddings": false, + "use_cache": true, + "vocab_size": 128256 +} \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.6.dev3/73707b485eab9008c7aba7f5dad0ce2384ac685318d5f888c12fa0d81ed90b19/87f1aaa5ae1a31bb7adc.json b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.6.dev3/73707b485eab9008c7aba7f5dad0ce2384ac685318d5f888c12fa0d81ed90b19/87f1aaa5ae1a31bb7adc.json new file mode 100644 index 0000000000000000000000000000000000000000..5ebd30127d8aef646a275d1ef9f190184088dc00 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.6.dev3/73707b485eab9008c7aba7f5dad0ce2384ac685318d5f888c12fa0d81ed90b19/87f1aaa5ae1a31bb7adc.json @@ -0,0 +1,135 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "HuggingFaceTB/SmolLM3-3B", + "_task": "text-generation", + "architectures": [ + "SmolLM3ForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "dtype": "bfloat16", + "hidden_act": "silu", + "hidden_size": 2048, + "initializer_range": 0.02, + "intermediate_size": 11008, + "layer_types": [ + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention" + ], + "max_position_embeddings": 65536, + "max_window_layers": 28, + "mlp_bias": false, + "model_type": "smollm3", + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "batch_size": 1, + "capacity_factor": null, + "checkpoint_id": "HuggingFaceTB/SmolLM3-3B", + "checkpoint_revision": "a07cc9a04f16550a088caea529712d1d335b0ac1", + "continuous_batching": false, + "ep_degree": 1, + "fused_qkv": true, + "glu_mlp": true, + "local_ranks_size": 2, + "max_batch_size": 1, + "max_context_length": 1024, + "max_topk": 256, + "n_active_tokens": 1024, + "neuronxcc_version": "2.21.33363.0+82129205", + "on_device_sampling": true, + "optimum_neuron_version": "0.4.6.dev3", + "output_logits": false, + "pp_degree": 1, + "prefill_chunk_size": 0, + "sequence_length": 1024, + "speculation_length": 0, + "start_rank_id": 0, + "target": "trn1", + "torch_dtype": "bfloat16", + "tp_degree": 2 + }, + "no_rope_layer_interval": 4, + "no_rope_layers": [ + 1, + 1, + 1, + 0, + 1, + 1, + 1, + 0, + 1, + 1, + 1, + 0, + 1, + 1, + 1, + 0, + 1, + 1, + 1, + 0, + 1, + 1, + 1, + 0, + 1, + 1, + 1, + 0, + 1, + 1, + 1, + 0, + 1, + 1, + 1, + 0 + ], + "num_attention_heads": 16, + "num_hidden_layers": 36, + "num_key_value_heads": 4, + "pretraining_tp": 2, + "rms_norm_eps": 1e-06, + "rope_scaling": null, + "rope_theta": 5000000.0, + "sliding_window": null, + "use_cache": false, + "use_sliding_window": false, + "vocab_size": 128256 +} \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.6.dev3/7518518c7e077820070186deda960d8cc49db068cdf0ac70664098fa2b6b698c/7e378b918d8aa52c31f9.json b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.6.dev3/7518518c7e077820070186deda960d8cc49db068cdf0ac70664098fa2b6b698c/7e378b918d8aa52c31f9.json new file mode 100644 index 0000000000000000000000000000000000000000..eb9f1d0cfe4660390dbc84c7aa8524434aa1fb55 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.6.dev3/7518518c7e077820070186deda960d8cc49db068cdf0ac70664098fa2b6b698c/7e378b918d8aa52c31f9.json @@ -0,0 +1,65 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "yujiepan/qwen2.5-128k-tiny-random", + "_task": "text-generation", + "architectures": [ + "Qwen2ForCausalLM" + ], + "attention_dropout": 0.0, + "dtype": "bfloat16", + "hidden_act": "silu", + "hidden_size": 8, + "initializer_range": 0.02, + "intermediate_size": 16, + "layer_types": [ + "full_attention", + "full_attention" + ], + "max_position_embeddings": 32768, + "max_window_layers": 1, + "model_type": "qwen2", + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "batch_size": 1, + "capacity_factor": null, + "checkpoint_id": "yujiepan/qwen2.5-128k-tiny-random", + "checkpoint_revision": "c8296d4ca3f87782876d2382fbb6481d1beb8ef0", + "continuous_batching": false, + "ep_degree": 1, + "fused_qkv": false, + "glu_mlp": true, + "local_ranks_size": 2, + "max_batch_size": 1, + "max_context_length": 1024, + "max_topk": 256, + "n_active_tokens": 1024, + "neuronxcc_version": "2.21.33363.0+82129205", + "on_device_sampling": true, + "optimum_neuron_version": "0.4.6.dev3", + "output_logits": false, + "pp_degree": 1, + "prefill_chunk_size": 0, + "sequence_length": 1024, + "speculation_length": 0, + "start_rank_id": 0, + "target": "trn1", + "torch_dtype": "bfloat16", + "tp_degree": 2 + }, + "num_attention_heads": 4, + "num_hidden_layers": 2, + "num_key_value_heads": 2, + "rms_norm_eps": 1e-06, + "rope_scaling": { + "factor": 4.0, + "original_max_position_embeddings": 32768, + "rope_type": "yarn", + "type": "yarn" + }, + "rope_theta": 1000000.0, + "sliding_window": null, + "tie_word_embeddings": false, + "use_cache": true, + "use_sliding_window": false, + "vocab_size": 152064 +} \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.6.dev3/920f44ce6d3e004d1ce547ae06644f7be262180644b04573153aa15d98742edc/ad0f2997db25e16e085b.json b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.6.dev3/920f44ce6d3e004d1ce547ae06644f7be262180644b04573153aa15d98742edc/ad0f2997db25e16e085b.json new file mode 100644 index 0000000000000000000000000000000000000000..52d5acc13998240384df38ecf2eff69f3ef4d042 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.6.dev3/920f44ce6d3e004d1ce547ae06644f7be262180644b04573153aa15d98742edc/ad0f2997db25e16e085b.json @@ -0,0 +1,66 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "optimum-internal-testing/tiny-random-qwen3_moe", + "_task": "text-generation", + "architectures": [ + "Qwen3MoeForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "decoder_sparse_step": 2, + "dtype": "float32", + "head_dim": 32, + "hidden_act": "silu", + "hidden_size": 64, + "initializer_range": 0.02, + "intermediate_size": 128, + "max_position_embeddings": 40960, + "max_window_layers": 1, + "mlp_only_layers": [], + "model_type": "qwen3_moe", + "moe_intermediate_size": 128, + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "batch_size": 1, + "capacity_factor": null, + "checkpoint_id": "optimum-internal-testing/tiny-random-qwen3_moe", + "checkpoint_revision": "e0230be2839556b44b7400a233c73c74b4abb7af", + "continuous_batching": false, + "ep_degree": 1, + "fused_qkv": false, + "glu_mlp": true, + "local_ranks_size": 2, + "max_batch_size": 1, + "max_context_length": 1024, + "max_topk": 256, + "n_active_tokens": 1024, + "neuronxcc_version": "2.21.33363.0+82129205", + "on_device_sampling": true, + "optimum_neuron_version": "0.4.6.dev3", + "output_logits": false, + "pp_degree": 1, + "prefill_chunk_size": 0, + "sequence_length": 1024, + "speculation_length": 0, + "start_rank_id": 0, + "target": "trn1", + "torch_dtype": "float32", + "tp_degree": 2 + }, + "norm_topk_prob": true, + "num_attention_heads": 2, + "num_experts": 8, + "num_experts_per_tok": 2, + "num_hidden_layers": 2, + "num_key_value_heads": 1, + "output_router_logits": false, + "rms_norm_eps": 1e-06, + "rope_scaling": null, + "rope_theta": 1000000.0, + "router_aux_loss_coef": 0.001, + "sliding_window": null, + "tie_word_embeddings": true, + "use_cache": true, + "use_sliding_window": false, + "vocab_size": 151936 +} \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.6.dev3/9c24a2080ec26e9c74d5bd90866f74131aa4d5c975415b96f5e6600f081d5647/d244406bccd80288e991.json b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.6.dev3/9c24a2080ec26e9c74d5bd90866f74131aa4d5c975415b96f5e6600f081d5647/d244406bccd80288e991.json new file mode 100644 index 0000000000000000000000000000000000000000..a55b49da2a9045011fb3650a640da380dec561cb --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.6.dev3/9c24a2080ec26e9c74d5bd90866f74131aa4d5c975415b96f5e6600f081d5647/d244406bccd80288e991.json @@ -0,0 +1,82 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "tiny-random/llama-4", + "_task": "text-generation", + "attention_bias": false, + "attention_chunk_size": 128, + "attention_dropout": 0.0, + "attn_scale": 0.1, + "attn_temperature_tuning": 4, + "cache_implementation": "hybrid", + "dtype": "bfloat16", + "floor_scale": 8192, + "for_llm_compressor": false, + "head_dim": 32, + "hidden_act": "silu", + "hidden_size": 32, + "initializer_range": 0.02, + "interleave_moe_layer_step": 2, + "intermediate_size": 64, + "intermediate_size_mlp": 128, + "layer_types": [ + "chunked_attention", + "chunked_attention", + "chunked_attention", + "full_attention" + ], + "max_position_embeddings": 1048576, + "model_type": "llama4_text", + "moe_layers": [ + 1, + 3 + ], + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "batch_size": 1, + "capacity_factor": null, + "checkpoint_id": "tiny-random/llama-4", + "checkpoint_revision": "9e716f5d4d1ffe0a44a15f46f4a12b840439aba4", + "continuous_batching": false, + "ep_degree": 1, + "fused_qkv": false, + "glu_mlp": true, + "local_ranks_size": 2, + "max_batch_size": 1, + "max_context_length": 1024, + "max_topk": 256, + "n_active_tokens": 1024, + "neuronxcc_version": "2.21.33363.0+82129205", + "on_device_sampling": true, + "optimum_neuron_version": "0.4.6.dev3", + "output_logits": false, + "pp_degree": 1, + "prefill_chunk_size": 0, + "sequence_length": 1024, + "speculation_length": 0, + "start_rank_id": 0, + "target": "trn1", + "torch_dtype": "bfloat16", + "tp_degree": 2 + }, + "no_rope_layers": [ + 1, + 1, + 1, + 0 + ], + "num_attention_heads": 1, + "num_experts_per_tok": 1, + "num_hidden_layers": 4, + "num_key_value_heads": 1, + "num_local_experts": 8, + "output_router_logits": false, + "rms_norm_eps": 1e-05, + "rope_scaling": null, + "rope_theta": 500000.0, + "router_aux_loss_coef": 0.001, + "router_jitter_noise": 0.0, + "tie_word_embeddings": true, + "use_cache": true, + "use_qk_norm": true, + "vocab_size": 202048 +} \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.6.dev3/cf6b9a360dcf294104671106bae2adbd9fd291823bb60a351883163684073231/124119d9f41b205009a0.json b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.6.dev3/cf6b9a360dcf294104671106bae2adbd9fd291823bb60a351883163684073231/124119d9f41b205009a0.json new file mode 100644 index 0000000000000000000000000000000000000000..f418d2a06be93d78bc0cd40102f5d69a20a44ddb --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.6.dev3/cf6b9a360dcf294104671106bae2adbd9fd291823bb60a351883163684073231/124119d9f41b205009a0.json @@ -0,0 +1,64 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "unsloth/Llama-3.2-1B-Instruct", + "_task": "text-generation", + "architectures": [ + "LlamaForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "dtype": "bfloat16", + "head_dim": 64, + "hidden_act": "silu", + "hidden_size": 2048, + "initializer_range": 0.02, + "intermediate_size": 8192, + "max_position_embeddings": 131072, + "mlp_bias": false, + "model_type": "llama", + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "batch_size": 1, + "capacity_factor": null, + "checkpoint_id": "unsloth/Llama-3.2-1B-Instruct", + "checkpoint_revision": "5a8abab4a5d6f164389b1079fb721cfab8d7126c", + "continuous_batching": false, + "ep_degree": 1, + "fused_qkv": true, + "glu_mlp": true, + "local_ranks_size": 2, + "max_batch_size": 1, + "max_context_length": 4096, + "max_topk": 256, + "n_active_tokens": 4096, + "neuronxcc_version": "2.21.33363.0+82129205", + "on_device_sampling": true, + "optimum_neuron_version": "0.4.6.dev3", + "output_logits": false, + "pp_degree": 1, + "prefill_chunk_size": 1024, + "sequence_length": 4096, + "speculation_length": 0, + "start_rank_id": 0, + "target": "trn1", + "torch_dtype": "bfloat16", + "tp_degree": 2 + }, + "num_attention_heads": 32, + "num_hidden_layers": 16, + "num_key_value_heads": 8, + "pretraining_tp": 1, + "rms_norm_eps": 1e-05, + "rope_scaling": { + "factor": 32.0, + "high_freq_factor": 4.0, + "low_freq_factor": 1.0, + "original_max_position_embeddings": 8192, + "rope_type": "llama3" + }, + "rope_theta": 500000.0, + "tie_word_embeddings": true, + "unsloth_fixed": true, + "use_cache": true, + "vocab_size": 128256 +} \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.6.dev3/cf6b9a360dcf294104671106bae2adbd9fd291823bb60a351883163684073231/80f4956a4a5775280772.json b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.6.dev3/cf6b9a360dcf294104671106bae2adbd9fd291823bb60a351883163684073231/80f4956a4a5775280772.json new file mode 100644 index 0000000000000000000000000000000000000000..fd48c09ea37cb8cb7c9d71611d18c5b711e244c6 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.6.dev3/cf6b9a360dcf294104671106bae2adbd9fd291823bb60a351883163684073231/80f4956a4a5775280772.json @@ -0,0 +1,64 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "unsloth/Llama-3.2-1B-Instruct", + "_task": "text-generation", + "architectures": [ + "LlamaForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "dtype": "bfloat16", + "head_dim": 64, + "hidden_act": "silu", + "hidden_size": 2048, + "initializer_range": 0.02, + "intermediate_size": 8192, + "max_position_embeddings": 131072, + "mlp_bias": false, + "model_type": "llama", + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "batch_size": 1, + "capacity_factor": null, + "checkpoint_id": "unsloth/Llama-3.2-1B-Instruct", + "checkpoint_revision": null, + "continuous_batching": false, + "ep_degree": 1, + "fused_qkv": false, + "glu_mlp": true, + "local_ranks_size": 2, + "max_batch_size": 1, + "max_context_length": 4096, + "max_topk": 256, + "n_active_tokens": 4096, + "neuronxcc_version": "2.21.33363.0+82129205", + "on_device_sampling": false, + "optimum_neuron_version": "0.4.6.dev3", + "output_logits": false, + "pp_degree": 1, + "prefill_chunk_size": 0, + "sequence_length": 4096, + "speculation_length": 5, + "start_rank_id": 0, + "target": "trn1", + "torch_dtype": "bfloat16", + "tp_degree": 2 + }, + "num_attention_heads": 32, + "num_hidden_layers": 16, + "num_key_value_heads": 8, + "pretraining_tp": 1, + "rms_norm_eps": 1e-05, + "rope_scaling": { + "factor": 32.0, + "high_freq_factor": 4.0, + "low_freq_factor": 1.0, + "original_max_position_embeddings": 8192, + "rope_type": "llama3" + }, + "rope_theta": 500000.0, + "tie_word_embeddings": true, + "unsloth_fixed": true, + "use_cache": true, + "vocab_size": 128256 +} \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.6.dev3/d139acf64685f15794bb983ff6eb881bdd31304bae88b0ce1ed20a54c21f2265/4aab0cb19b60948b084e.json b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.6.dev3/d139acf64685f15794bb983ff6eb881bdd31304bae88b0ce1ed20a54c21f2265/4aab0cb19b60948b084e.json new file mode 100644 index 0000000000000000000000000000000000000000..202130a0db2dc520a85aead12163a8475ecb8c0a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.6.dev3/d139acf64685f15794bb983ff6eb881bdd31304bae88b0ce1ed20a54c21f2265/4aab0cb19b60948b084e.json @@ -0,0 +1,59 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "hf-internal-testing/tiny-random-GraniteForCausalLM", + "_task": "text-generation", + "architectures": [ + "GraniteForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "attention_multiplier": 1.0, + "dtype": "float32", + "embedding_multiplier": 1.0, + "hidden_act": "silu", + "hidden_size": 32, + "initializer_range": 0.02, + "intermediate_size": 64, + "logits_scaling": 1.0, + "max_position_embeddings": 2048, + "mlp_bias": false, + "model_type": "granite", + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "batch_size": 1, + "capacity_factor": null, + "checkpoint_id": "hf-internal-testing/tiny-random-GraniteForCausalLM", + "checkpoint_revision": "c3074ebc0ac2fe545305f5e5f6cce2cc9b2aa0c5", + "continuous_batching": false, + "ep_degree": 1, + "fused_qkv": true, + "glu_mlp": true, + "local_ranks_size": 2, + "max_batch_size": 1, + "max_context_length": 1024, + "max_topk": 256, + "n_active_tokens": 1024, + "neuronxcc_version": "2.21.33363.0+82129205", + "on_device_sampling": true, + "optimum_neuron_version": "0.4.6.dev3", + "output_logits": false, + "pp_degree": 1, + "prefill_chunk_size": 0, + "sequence_length": 1024, + "speculation_length": 0, + "start_rank_id": 0, + "target": "trn1", + "torch_dtype": "float32", + "tp_degree": 2 + }, + "num_attention_heads": 4, + "num_hidden_layers": 2, + "num_key_value_heads": 4, + "residual_multiplier": 1.0, + "rms_norm_eps": 1e-06, + "rope_scaling": null, + "rope_theta": 10000.0, + "tie_word_embeddings": false, + "use_cache": true, + "vocab_size": 49152 +} \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.6.dev3/granite/hf-internal-testing/tiny-random-GraniteForCausalLM/4aab0cb19b60948b084e.json b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.6.dev3/granite/hf-internal-testing/tiny-random-GraniteForCausalLM/4aab0cb19b60948b084e.json new file mode 100644 index 0000000000000000000000000000000000000000..202130a0db2dc520a85aead12163a8475ecb8c0a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.6.dev3/granite/hf-internal-testing/tiny-random-GraniteForCausalLM/4aab0cb19b60948b084e.json @@ -0,0 +1,59 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "hf-internal-testing/tiny-random-GraniteForCausalLM", + "_task": "text-generation", + "architectures": [ + "GraniteForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "attention_multiplier": 1.0, + "dtype": "float32", + "embedding_multiplier": 1.0, + "hidden_act": "silu", + "hidden_size": 32, + "initializer_range": 0.02, + "intermediate_size": 64, + "logits_scaling": 1.0, + "max_position_embeddings": 2048, + "mlp_bias": false, + "model_type": "granite", + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "batch_size": 1, + "capacity_factor": null, + "checkpoint_id": "hf-internal-testing/tiny-random-GraniteForCausalLM", + "checkpoint_revision": "c3074ebc0ac2fe545305f5e5f6cce2cc9b2aa0c5", + "continuous_batching": false, + "ep_degree": 1, + "fused_qkv": true, + "glu_mlp": true, + "local_ranks_size": 2, + "max_batch_size": 1, + "max_context_length": 1024, + "max_topk": 256, + "n_active_tokens": 1024, + "neuronxcc_version": "2.21.33363.0+82129205", + "on_device_sampling": true, + "optimum_neuron_version": "0.4.6.dev3", + "output_logits": false, + "pp_degree": 1, + "prefill_chunk_size": 0, + "sequence_length": 1024, + "speculation_length": 0, + "start_rank_id": 0, + "target": "trn1", + "torch_dtype": "float32", + "tp_degree": 2 + }, + "num_attention_heads": 4, + "num_hidden_layers": 2, + "num_key_value_heads": 4, + "residual_multiplier": 1.0, + "rms_norm_eps": 1e-06, + "rope_scaling": null, + "rope_theta": 10000.0, + "tie_word_embeddings": false, + "use_cache": true, + "vocab_size": 49152 +} \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.6.dev3/llama/llamafactory/tiny-random-Llama-3/4b6c7416e39455d1ad2e.json b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.6.dev3/llama/llamafactory/tiny-random-Llama-3/4b6c7416e39455d1ad2e.json new file mode 100644 index 0000000000000000000000000000000000000000..edf2e32a3ffa22640ab356b9183dd230e3eae002 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.6.dev3/llama/llamafactory/tiny-random-Llama-3/4b6c7416e39455d1ad2e.json @@ -0,0 +1,63 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "llamafactory/tiny-random-Llama-3", + "_task": "text-generation", + "architectures": [ + "LlamaForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "dtype": "float16", + "head_dim": 4, + "hidden_act": "silu", + "hidden_size": 16, + "initializer_range": 0.02, + "intermediate_size": 64, + "max_position_embeddings": 131072, + "mlp_bias": false, + "model_type": "llama", + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "batch_size": 1, + "capacity_factor": null, + "checkpoint_id": "llamafactory/tiny-random-Llama-3", + "checkpoint_revision": "bf2a2e3bf199ad2ee96f02a3c00246c608db22a8", + "continuous_batching": false, + "ep_degree": 1, + "fused_qkv": true, + "glu_mlp": true, + "local_ranks_size": 2, + "max_batch_size": 1, + "max_context_length": 512, + "max_topk": 256, + "n_active_tokens": 512, + "neuronxcc_version": "2.21.33363.0+82129205", + "on_device_sampling": true, + "optimum_neuron_version": "0.4.6.dev3", + "output_logits": false, + "pp_degree": 1, + "prefill_chunk_size": 0, + "sequence_length": 512, + "speculation_length": 0, + "start_rank_id": 0, + "target": "trn1", + "torch_dtype": "float16", + "tp_degree": 2 + }, + "num_attention_heads": 4, + "num_hidden_layers": 2, + "num_key_value_heads": 4, + "pretraining_tp": 1, + "rms_norm_eps": 1e-05, + "rope_scaling": { + "factor": 8.0, + "high_freq_factor": 4.0, + "low_freq_factor": 1.0, + "original_max_position_embeddings": 8192, + "rope_type": "llama3" + }, + "rope_theta": 500000.0, + "tie_word_embeddings": false, + "use_cache": true, + "vocab_size": 128256 +} \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.6.dev3/llama4_text/tiny-random/llama-4/d244406bccd80288e991.json b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.6.dev3/llama4_text/tiny-random/llama-4/d244406bccd80288e991.json new file mode 100644 index 0000000000000000000000000000000000000000..a55b49da2a9045011fb3650a640da380dec561cb --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.6.dev3/llama4_text/tiny-random/llama-4/d244406bccd80288e991.json @@ -0,0 +1,82 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "tiny-random/llama-4", + "_task": "text-generation", + "attention_bias": false, + "attention_chunk_size": 128, + "attention_dropout": 0.0, + "attn_scale": 0.1, + "attn_temperature_tuning": 4, + "cache_implementation": "hybrid", + "dtype": "bfloat16", + "floor_scale": 8192, + "for_llm_compressor": false, + "head_dim": 32, + "hidden_act": "silu", + "hidden_size": 32, + "initializer_range": 0.02, + "interleave_moe_layer_step": 2, + "intermediate_size": 64, + "intermediate_size_mlp": 128, + "layer_types": [ + "chunked_attention", + "chunked_attention", + "chunked_attention", + "full_attention" + ], + "max_position_embeddings": 1048576, + "model_type": "llama4_text", + "moe_layers": [ + 1, + 3 + ], + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "batch_size": 1, + "capacity_factor": null, + "checkpoint_id": "tiny-random/llama-4", + "checkpoint_revision": "9e716f5d4d1ffe0a44a15f46f4a12b840439aba4", + "continuous_batching": false, + "ep_degree": 1, + "fused_qkv": false, + "glu_mlp": true, + "local_ranks_size": 2, + "max_batch_size": 1, + "max_context_length": 1024, + "max_topk": 256, + "n_active_tokens": 1024, + "neuronxcc_version": "2.21.33363.0+82129205", + "on_device_sampling": true, + "optimum_neuron_version": "0.4.6.dev3", + "output_logits": false, + "pp_degree": 1, + "prefill_chunk_size": 0, + "sequence_length": 1024, + "speculation_length": 0, + "start_rank_id": 0, + "target": "trn1", + "torch_dtype": "bfloat16", + "tp_degree": 2 + }, + "no_rope_layers": [ + 1, + 1, + 1, + 0 + ], + "num_attention_heads": 1, + "num_experts_per_tok": 1, + "num_hidden_layers": 4, + "num_key_value_heads": 1, + "num_local_experts": 8, + "output_router_logits": false, + "rms_norm_eps": 1e-05, + "rope_scaling": null, + "rope_theta": 500000.0, + "router_aux_loss_coef": 0.001, + "router_jitter_noise": 0.0, + "tie_word_embeddings": true, + "use_cache": true, + "use_qk_norm": true, + "vocab_size": 202048 +} \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.6.dev3/mixtral/dacorvo/Mixtral-tiny/1171cdc1e0668ecced1b.json b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.6.dev3/mixtral/dacorvo/Mixtral-tiny/1171cdc1e0668ecced1b.json new file mode 100644 index 0000000000000000000000000000000000000000..83a4adbcfbfb3249b20ca9428c1d2b331cde40ac --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.6.dev3/mixtral/dacorvo/Mixtral-tiny/1171cdc1e0668ecced1b.json @@ -0,0 +1,59 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "dacorvo/Mixtral-tiny", + "_task": "text-generation", + "architectures": [ + "MixtralForCausalLM" + ], + "attention_dropout": 0.0, + "dtype": "float16", + "head_dim": 32, + "hidden_act": "silu", + "hidden_size": 1024, + "initializer_range": 0.02, + "intermediate_size": 3584, + "max_position_embeddings": 1024, + "model_type": "mixtral", + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "batch_size": 1, + "capacity_factor": null, + "checkpoint_id": "dacorvo/Mixtral-tiny", + "checkpoint_revision": "c557ba205ddff6ea911f4719e0d543d6c08356b6", + "continuous_batching": false, + "ep_degree": 1, + "fused_qkv": false, + "glu_mlp": true, + "local_ranks_size": 2, + "max_batch_size": 1, + "max_context_length": 1024, + "max_topk": 256, + "n_active_tokens": 1024, + "neuronxcc_version": "2.21.33363.0+82129205", + "on_device_sampling": false, + "optimum_neuron_version": "0.4.6.dev3", + "output_logits": false, + "pp_degree": 1, + "prefill_chunk_size": 0, + "sequence_length": 1024, + "speculation_length": 0, + "start_rank_id": 0, + "target": "trn1", + "torch_dtype": "float16", + "tp_degree": 2 + }, + "num_attention_heads": 32, + "num_experts_per_tok": 2, + "num_hidden_layers": 2, + "num_key_value_heads": 8, + "num_local_experts": 8, + "output_router_logits": false, + "rms_norm_eps": 1e-05, + "rope_theta": 10000.0, + "router_aux_loss_coef": 0.001, + "router_jitter_noise": 0.0, + "sliding_window": 4096, + "tie_word_embeddings": false, + "use_cache": true, + "vocab_size": 32000 +} \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.6.dev3/phi3/yujiepan/phi-4-tiny-random/6b7aebc14c435ae3db63.json b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.6.dev3/phi3/yujiepan/phi-4-tiny-random/6b7aebc14c435ae3db63.json new file mode 100644 index 0000000000000000000000000000000000000000..18b3dd814a9962d736002ffa618954a880743a90 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.6.dev3/phi3/yujiepan/phi-4-tiny-random/6b7aebc14c435ae3db63.json @@ -0,0 +1,60 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "yujiepan/phi-4-tiny-random", + "_task": "text-generation", + "architectures": [ + "Phi3ForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "auto_map": {}, + "dtype": "bfloat16", + "embd_pdrop": 0.0, + "hidden_act": "silu", + "hidden_size": 16, + "initializer_range": 0.02, + "intermediate_size": 32, + "max_position_embeddings": 16384, + "model_type": "phi3", + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "batch_size": 1, + "capacity_factor": null, + "checkpoint_id": "yujiepan/phi-4-tiny-random", + "checkpoint_revision": "18a9a1168dc97ac6d128f811925670c275610f5a", + "continuous_batching": false, + "ep_degree": 1, + "fused_qkv": true, + "glu_mlp": true, + "local_ranks_size": 2, + "max_batch_size": 1, + "max_context_length": 1024, + "max_topk": 256, + "n_active_tokens": 1024, + "neuronxcc_version": "2.21.33363.0+82129205", + "on_device_sampling": true, + "optimum_neuron_version": "0.4.6.dev3", + "output_logits": false, + "pp_degree": 1, + "prefill_chunk_size": 0, + "sequence_length": 1024, + "speculation_length": 0, + "start_rank_id": 0, + "target": "trn1", + "torch_dtype": "bfloat16", + "tp_degree": 2 + }, + "num_attention_heads": 2, + "num_hidden_layers": 2, + "num_key_value_heads": 1, + "original_max_position_embeddings": 16384, + "partial_rotary_factor": 1.0, + "resid_pdrop": 0.0, + "rms_norm_eps": 1e-05, + "rope_scaling": null, + "rope_theta": 250000, + "sliding_window": null, + "tie_word_embeddings": false, + "use_cache": true, + "vocab_size": 100352 +} \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.6.dev3/qwen2/yujiepan/qwen2.5-128k-tiny-random/7e378b918d8aa52c31f9.json b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.6.dev3/qwen2/yujiepan/qwen2.5-128k-tiny-random/7e378b918d8aa52c31f9.json new file mode 100644 index 0000000000000000000000000000000000000000..eb9f1d0cfe4660390dbc84c7aa8524434aa1fb55 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.6.dev3/qwen2/yujiepan/qwen2.5-128k-tiny-random/7e378b918d8aa52c31f9.json @@ -0,0 +1,65 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "yujiepan/qwen2.5-128k-tiny-random", + "_task": "text-generation", + "architectures": [ + "Qwen2ForCausalLM" + ], + "attention_dropout": 0.0, + "dtype": "bfloat16", + "hidden_act": "silu", + "hidden_size": 8, + "initializer_range": 0.02, + "intermediate_size": 16, + "layer_types": [ + "full_attention", + "full_attention" + ], + "max_position_embeddings": 32768, + "max_window_layers": 1, + "model_type": "qwen2", + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "batch_size": 1, + "capacity_factor": null, + "checkpoint_id": "yujiepan/qwen2.5-128k-tiny-random", + "checkpoint_revision": "c8296d4ca3f87782876d2382fbb6481d1beb8ef0", + "continuous_batching": false, + "ep_degree": 1, + "fused_qkv": false, + "glu_mlp": true, + "local_ranks_size": 2, + "max_batch_size": 1, + "max_context_length": 1024, + "max_topk": 256, + "n_active_tokens": 1024, + "neuronxcc_version": "2.21.33363.0+82129205", + "on_device_sampling": true, + "optimum_neuron_version": "0.4.6.dev3", + "output_logits": false, + "pp_degree": 1, + "prefill_chunk_size": 0, + "sequence_length": 1024, + "speculation_length": 0, + "start_rank_id": 0, + "target": "trn1", + "torch_dtype": "bfloat16", + "tp_degree": 2 + }, + "num_attention_heads": 4, + "num_hidden_layers": 2, + "num_key_value_heads": 2, + "rms_norm_eps": 1e-06, + "rope_scaling": { + "factor": 4.0, + "original_max_position_embeddings": 32768, + "rope_type": "yarn", + "type": "yarn" + }, + "rope_theta": 1000000.0, + "sliding_window": null, + "tie_word_embeddings": false, + "use_cache": true, + "use_sliding_window": false, + "vocab_size": 152064 +} \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.6.dev3/qwen3_moe/optimum-internal-testing/tiny-random-qwen3_moe/ad0f2997db25e16e085b.json b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.6.dev3/qwen3_moe/optimum-internal-testing/tiny-random-qwen3_moe/ad0f2997db25e16e085b.json new file mode 100644 index 0000000000000000000000000000000000000000..52d5acc13998240384df38ecf2eff69f3ef4d042 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.6.dev3/qwen3_moe/optimum-internal-testing/tiny-random-qwen3_moe/ad0f2997db25e16e085b.json @@ -0,0 +1,66 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "optimum-internal-testing/tiny-random-qwen3_moe", + "_task": "text-generation", + "architectures": [ + "Qwen3MoeForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "decoder_sparse_step": 2, + "dtype": "float32", + "head_dim": 32, + "hidden_act": "silu", + "hidden_size": 64, + "initializer_range": 0.02, + "intermediate_size": 128, + "max_position_embeddings": 40960, + "max_window_layers": 1, + "mlp_only_layers": [], + "model_type": "qwen3_moe", + "moe_intermediate_size": 128, + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "batch_size": 1, + "capacity_factor": null, + "checkpoint_id": "optimum-internal-testing/tiny-random-qwen3_moe", + "checkpoint_revision": "e0230be2839556b44b7400a233c73c74b4abb7af", + "continuous_batching": false, + "ep_degree": 1, + "fused_qkv": false, + "glu_mlp": true, + "local_ranks_size": 2, + "max_batch_size": 1, + "max_context_length": 1024, + "max_topk": 256, + "n_active_tokens": 1024, + "neuronxcc_version": "2.21.33363.0+82129205", + "on_device_sampling": true, + "optimum_neuron_version": "0.4.6.dev3", + "output_logits": false, + "pp_degree": 1, + "prefill_chunk_size": 0, + "sequence_length": 1024, + "speculation_length": 0, + "start_rank_id": 0, + "target": "trn1", + "torch_dtype": "float32", + "tp_degree": 2 + }, + "norm_topk_prob": true, + "num_attention_heads": 2, + "num_experts": 8, + "num_experts_per_tok": 2, + "num_hidden_layers": 2, + "num_key_value_heads": 1, + "output_router_logits": false, + "rms_norm_eps": 1e-06, + "rope_scaling": null, + "rope_theta": 1000000.0, + "router_aux_loss_coef": 0.001, + "sliding_window": null, + "tie_word_embeddings": true, + "use_cache": true, + "use_sliding_window": false, + "vocab_size": 151936 +} \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_0007bf645cd8f44068db+a02c3a36/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_0007bf645cd8f44068db+a02c3a36/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..5726abc7d1d8c52fa95bc7919439a23a23fe3b9a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_0007bf645cd8f44068db+a02c3a36/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_0007bf645cd8f44068db+a02c3a36/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_0007bf645cd8f44068db+a02c3a36/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_0007bf645cd8f44068db+a02c3a36/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_0007bf645cd8f44068db+a02c3a36/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..e738d22a04cf8409ac46e869018434bfde1f43c0 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_0007bf645cd8f44068db+a02c3a36/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f605a954b114104fa81403712a2efbe24d99be08d5bcfe37bb5b9a565639ad02 +size 443127 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_0007bf645cd8f44068db+a02c3a36/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_0007bf645cd8f44068db+a02c3a36/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..53623517d8743de7bd020b4018a350cbd71a695a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_0007bf645cd8f44068db+a02c3a36/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9796c856854a7194fedb64467f5f4cb0417ffa579f0ca3ba9f25e913d05ab51 +size 2171904 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_0007bf645cd8f44068db+a02c3a36/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_0007bf645cd8f44068db+a02c3a36/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..1d54ee4ef0274cb84518c0356917d149daf7e460 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_0007bf645cd8f44068db+a02c3a36/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dae9a2f5e6a2b76e04ccfddc992e1734f33c68688803a5ed27cc18d116416845 +size 2245991 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_1023294089137432912+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_1023294089137432912+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_1023294089137432912+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_1023294089137432912+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_1023294089137432912+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_1023294089137432912+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_1023294089137432912+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..94a29962e1fbef2972379e89bec95b36ecbda193 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_1023294089137432912+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0dc8be214832248c940c41980c6f4dfeeea31616cbdd7b0f4d6e489f1ec8a9d4 +size 1291 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_1023294089137432912+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_1023294089137432912+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..b7243715e6e755b5f0f2d49d9d28b01fba2e83af Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_1023294089137432912+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_10907752543637211265+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_10907752543637211265+e30acd3a/model.hlo_module.pb index b90a86dc9847aa4694b1ae072a3a2d5a6c06a295..92b56ec303335fde579dd14fb10b570274bc9094 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_10907752543637211265+e30acd3a/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_10907752543637211265+e30acd3a/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b36a2c38093715f8f1064e95c504963c4eefb108483ea5177b7a9b67c594c14c +oid sha256:9f985fe889da2802e231c02dc1c5f5e23faf4aea6cc57a68f87a88e6f2645a8d size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_10907752543637211265+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_10907752543637211265+e30acd3a/model.neff index 05857a281a16252edfc671336951cf3143cea874..46da978640f2e25f9d8eb61977e83d998f5a8b1a 100644 Binary files a/neuronxcc-2.21.33363.0+82129205/MODULE_10907752543637211265+e30acd3a/model.neff and b/neuronxcc-2.21.33363.0+82129205/MODULE_10907752543637211265+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_10945286243277389437+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_10945286243277389437+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_10945286243277389437+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_10945286243277389437+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_10945286243277389437+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_10945286243277389437+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_10945286243277389437+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..f2305e54005bda7c9d37a6935bff9a3678a6be66 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_10945286243277389437+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:799325c3cbe603da3b514db932484827f0bb64399ab98e4ec6ed46dfa0c1df18 +size 1146 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_10945286243277389437+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_10945286243277389437+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..2d63dfcb5e058ccb2bceacb40e4708fa621f9b46 Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_10945286243277389437+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_11400907432531398953+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_11400907432531398953+e30acd3a/model.hlo_module.pb index ad2498cb3ccc8151ea047c432b2b66e2e625d32e..5977dbd7062bf1699868f357bff7362515162614 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_11400907432531398953+e30acd3a/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_11400907432531398953+e30acd3a/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:1dcdc83733e2a421bdc65e593bd84b693b25114c7d871cc5383cf3ac18dbfdfb +oid sha256:6dc0732a47ea824b3bc9edce98dc564d7e2239653e42b4ad73eba3f5c05a129c size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_11400907432531398953+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_11400907432531398953+e30acd3a/model.neff index 91d66f16cab01417f03cb68141cb534e3c471d76..00aafde68b6d8969778bdad9a45f249720f4a0b4 100644 Binary files a/neuronxcc-2.21.33363.0+82129205/MODULE_11400907432531398953+e30acd3a/model.neff and b/neuronxcc-2.21.33363.0+82129205/MODULE_11400907432531398953+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_12311847081050718470+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_12311847081050718470+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_12311847081050718470+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_12311847081050718470+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_12311847081050718470+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_12311847081050718470+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_12311847081050718470+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..331d55e9c5c5104d78fd6e580c611cf958f119e0 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_12311847081050718470+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:202c1be8364d18d338faf4c87953dc16fc7b3ac04a5fe3e5d171c6d3e0991470 +size 1291 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_12311847081050718470+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_12311847081050718470+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..7d356c192538dc165d55e9208900a375f9eadca4 Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_12311847081050718470+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_12324009378304635855+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_12324009378304635855+e30acd3a/model.hlo_module.pb index ef9826bc0f3be4cee030dba2d27589e70ab9646c..d243543b950cbfa468e0924e87cc34a989d313fa 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_12324009378304635855+e30acd3a/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_12324009378304635855+e30acd3a/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c03b599abe1f3c2c4641cf7e8ff997574d293007a2321ba5af97b65b188e6b99 +oid sha256:8d7ee9e65f3fb9be7829eb796985b1da258963af88be0f2def750ac7f1fbffab size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_12324009378304635855+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_12324009378304635855+e30acd3a/model.neff index d98c76d93a56a5e20c58fcd99590b22d18f47a81..cc90bc2fea21b17e52b5f5ab92507b8156af5589 100644 Binary files a/neuronxcc-2.21.33363.0+82129205/MODULE_12324009378304635855+e30acd3a/model.neff and b/neuronxcc-2.21.33363.0+82129205/MODULE_12324009378304635855+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_12509236927544110827+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_12509236927544110827+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_12509236927544110827+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_12509236927544110827+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_12509236927544110827+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_12509236927544110827+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_12509236927544110827+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..2ecfa2d03b9beddbb97cc31fc06ff97760801479 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_12509236927544110827+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d2773ca28ac2c99e85df7fa91ca65164a84f48c5a12fa511cfeee1f94de867a +size 1291 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_12509236927544110827+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_12509236927544110827+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..1d55c70d5070e9f70fdad94d0ea8e30429a75ab6 Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_12509236927544110827+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_12650363609878702055+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_12650363609878702055+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_12650363609878702055+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_12650363609878702055+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_12650363609878702055+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_12650363609878702055+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_12650363609878702055+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..017e5c60b3f9035eb03017e570e3b06da04b41a8 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_12650363609878702055+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:268d593d3c53a3542f1ecef5bd498c2c42738b8f824d32c5c28f98a7ec6773de +size 1146 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_12650363609878702055+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_12650363609878702055+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..2299f1eb1fcf0b3c8fcbd34354afe6f933bbcece Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_12650363609878702055+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_12666804432653521811+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_12666804432653521811+e30acd3a/model.hlo_module.pb index 600468f9199a6c583c50512a0beb464459827ee0..e5a5df3bea32a18a00adda35606de0beef6c3ff0 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_12666804432653521811+e30acd3a/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_12666804432653521811+e30acd3a/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b7aec6718d215967d85935fe984b05d9b16246efecfec2137a2e30759d81c555 +oid sha256:4baa97fba157edb4e63bab7a60ff02028ef5dabf4a8817ead4b2032415a36560 size 1585 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_12666804432653521811+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_12666804432653521811+e30acd3a/model.neff index 3d3cb71282f1878c8bc1cf58c47d706d8177b831..057a2858b352997b35572b313a9a348f05c3da61 100644 Binary files a/neuronxcc-2.21.33363.0+82129205/MODULE_12666804432653521811+e30acd3a/model.neff and b/neuronxcc-2.21.33363.0+82129205/MODULE_12666804432653521811+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_1277765475941548362+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_1277765475941548362+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_1277765475941548362+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_1277765475941548362+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_1277765475941548362+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_1277765475941548362+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_1277765475941548362+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..5bec3aebe844801dec14a79b282d9f92256c965d --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_1277765475941548362+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e72c75050e083b3b085559f8b553b17c8a5492353dfa46c3c6014dae303b321 +size 1146 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_1277765475941548362+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_1277765475941548362+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..9cb5d579afdd6f014e616e65a1d2aae641d3e9f5 Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_1277765475941548362+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_12795949123662846630+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_12795949123662846630+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_12795949123662846630+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_12795949123662846630+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_12795949123662846630+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_12795949123662846630+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_12795949123662846630+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..a9387d3e05624edcdbd8fe5eaab14d302f864e24 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_12795949123662846630+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:784423994cf036520e6a3f69b0d7909b90230aa24f2e5c6eba250db4b610f641 +size 1146 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_12795949123662846630+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_12795949123662846630+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..00c1e30635017175b00da277c80b095f154e0567 Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_12795949123662846630+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_13092192882592555392+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_13092192882592555392+e30acd3a/model.hlo_module.pb index f215ff53bd093fc485dd3a3e0493ecd1677d0e3d..897d7792cfdd4a685dc7f32c32a8f0bf383b52d0 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_13092192882592555392+e30acd3a/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_13092192882592555392+e30acd3a/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c7e5e8627e554f6106efe00a9e5443edd528624611d8c29ec34ebbb98fc7d8d2 +oid sha256:0ac3f4de6abf7374a1f0e079bf3c0583d397b183ac33463605e050031ddb5a35 size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_13092192882592555392+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_13092192882592555392+e30acd3a/model.neff index 9ffe14c8c9aa9e52320b13760eb1c3f438fd0cfc..4caa9cccc6d97a6f63744867a08236e29ab79d17 100644 Binary files a/neuronxcc-2.21.33363.0+82129205/MODULE_13092192882592555392+e30acd3a/model.neff and b/neuronxcc-2.21.33363.0+82129205/MODULE_13092192882592555392+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_13129006844218143067+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_13129006844218143067+e30acd3a/model.hlo_module.pb index 16a43cc54293e607a6255ad9da104a22d7521d04..077d73f32c1f3dc34e19b0bc2c8cced6e3b67400 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_13129006844218143067+e30acd3a/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_13129006844218143067+e30acd3a/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:5ac835add8ef9104a34341aa0f2a6c485e5ea7fb5e04bb187959e310c6ec0e14 -size 1584 +oid sha256:b553a4799b7b03c83f235a4fa45d249d466805aa0116b9ec39243b457e414676 +size 1585 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_13129006844218143067+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_13129006844218143067+e30acd3a/model.neff index 48284eb792c98aa67cbc26bd9644d5b75a0ee03f..4d0747eaeb837d8670cca816642714ff4e77fe0e 100644 Binary files a/neuronxcc-2.21.33363.0+82129205/MODULE_13129006844218143067+e30acd3a/model.neff and b/neuronxcc-2.21.33363.0+82129205/MODULE_13129006844218143067+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_13163168066471565112+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_13163168066471565112+e30acd3a/model.hlo_module.pb index 30a44c112a1e85be62e94865d7e39ea36faa66eb..162596d210ca077351817d8212b12f64c2807c6d 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_13163168066471565112+e30acd3a/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_13163168066471565112+e30acd3a/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:79ca38629b9bb8e54332a80e8e36748d843d502acfc7244cc95a320ec55b90c5 +oid sha256:1b3a1c703060f71c156de4a9049e6f0cdeaba34ba6073363f84bd9cdcbaa1e10 size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_13163168066471565112+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_13163168066471565112+e30acd3a/model.neff index fc101a0aaec86df6f780f6d7ea7ce0e226d9e526..51e1823e10eab168138f4ecd80a9ad4a78222784 100644 Binary files a/neuronxcc-2.21.33363.0+82129205/MODULE_13163168066471565112+e30acd3a/model.neff and b/neuronxcc-2.21.33363.0+82129205/MODULE_13163168066471565112+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_131f9eb6c76c8d161c00+33f7fefb/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_131f9eb6c76c8d161c00+33f7fefb/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..d5fa0b2c8aeb938a58f51f6a213e0f329bd53106 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_131f9eb6c76c8d161c00+33f7fefb/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--enable-saturate-infinity", "--auto-cast=none", "--model-type=transformer", "-O1", "--logfile=/tmp/nxdi_test_e681caef-8946-41b0-8cd9-38ac72cf4974/compiler_workdir/SoftmaxWithMask/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_131f9eb6c76c8d161c00+33f7fefb/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_131f9eb6c76c8d161c00+33f7fefb/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_131f9eb6c76c8d161c00+33f7fefb/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_131f9eb6c76c8d161c00+33f7fefb/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..1122d44653d734af6a44cd149690f70cdefd9b05 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_131f9eb6c76c8d161c00+33f7fefb/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9a258ce111db27dc5ba46ec4f9f6877c56b0777a5534c0eba14488ff9eaf298 +size 5596 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_131f9eb6c76c8d161c00+33f7fefb/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_131f9eb6c76c8d161c00+33f7fefb/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..8712f4f88dcd7bc0b5dcbc01f9b8d4c634f3d5fc Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_131f9eb6c76c8d161c00+33f7fefb/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_13385766575326555678+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_13385766575326555678+e30acd3a/model.hlo_module.pb index d5170eb98150404cddea97e8dc3b154e7948f12c..c3ebde5bbf5daedd5c2d076a4a2957875d6eabb7 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_13385766575326555678+e30acd3a/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_13385766575326555678+e30acd3a/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:175d7534042da2b21e67c22c6527992c0c5734601d3f8def1dccf42da367ec68 +oid sha256:1a9da9518b7ea1a102e5eaa7e2a5eaf36850216022160b9e197d7d39e8f31da2 size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_13385766575326555678+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_13385766575326555678+e30acd3a/model.neff index 70df91ddb00894d7386c28d0bea946e1edfcf4a6..f7023150ffea473d46e4133322396d00483ca08e 100644 Binary files a/neuronxcc-2.21.33363.0+82129205/MODULE_13385766575326555678+e30acd3a/model.neff and b/neuronxcc-2.21.33363.0+82129205/MODULE_13385766575326555678+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_13521002922414225272+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_13521002922414225272+e30acd3a/model.hlo_module.pb index 332a53812f106f5bdc39c5328bc3416d9da5009f..8b755ec6566a76846cf1f04ad02765fa144f93db 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_13521002922414225272+e30acd3a/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_13521002922414225272+e30acd3a/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:733d0fb0b8a00ad2f86ce0d3202e2731f51e7a752e198b9b302678f8317ea9c2 +oid sha256:7558ff395b222c4b53821dbdf3800f36d28f01a28581ed57aa4b073a46d66b7e size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_13521002922414225272+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_13521002922414225272+e30acd3a/model.neff index 08334f268e5efc243a714ea6ca9812d5c2a571b9..5970ed2c4c4076acfaaf7776a946e2b2c8175169 100644 Binary files a/neuronxcc-2.21.33363.0+82129205/MODULE_13521002922414225272+e30acd3a/model.neff and b/neuronxcc-2.21.33363.0+82129205/MODULE_13521002922414225272+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_13673338043232097095+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_13673338043232097095+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_13673338043232097095+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_13673338043232097095+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_13673338043232097095+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_13673338043232097095+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_13673338043232097095+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..c91a89a50a9cbe5b6061aeafdd7640914fa24a0c --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_13673338043232097095+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65965ab8a4bc189aa5c76dfa39cfda780bbcc486796e362b06801d85e9965d72 +size 1291 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_13673338043232097095+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_13673338043232097095+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..697d767abf70cabbca192242bde014f629b38af6 Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_13673338043232097095+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_14024125047097359821+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_14024125047097359821+e30acd3a/model.hlo_module.pb index 88d4c357148f8723e10ac1cf8dc5426b680eef5a..d0ff601450111689cda2523ec9ae9fe9120354f2 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_14024125047097359821+e30acd3a/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_14024125047097359821+e30acd3a/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:7730eb5b8602fc6d2d25c92d8624de4ee95d56509ce0c2d8adbf41a9d7b99ceb +oid sha256:3868ec66d2c26d04dfcd0ee2d4fce0b8d67d132c9188ad2ad0bc1ccd2263f852 size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_14024125047097359821+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_14024125047097359821+e30acd3a/model.neff index e42d054f5127fa958eccddff5ca10126152124c3..68ad99a8440682eabadba4cb9dddaccefac2fd94 100644 Binary files a/neuronxcc-2.21.33363.0+82129205/MODULE_14024125047097359821+e30acd3a/model.neff and b/neuronxcc-2.21.33363.0+82129205/MODULE_14024125047097359821+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_14488951057292576015+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_14488951057292576015+e30acd3a/model.hlo_module.pb index d532e468ecceba150088a81cf4b534f83127347d..33bfe813a30b073602b205d8cfeb9f528cb8fd47 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_14488951057292576015+e30acd3a/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_14488951057292576015+e30acd3a/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:f794d9b46f347a2c9779006b54197d244ac42cd282903d46a9ac1effbff35900 +oid sha256:d5fca8287c8f360cc2db68816b1c0c6e53b3fa2645c2292b458e68440bfa6c50 size 1585 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_14488951057292576015+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_14488951057292576015+e30acd3a/model.neff index 5436593e8c60ff93d9e29c9d733c009d19c2cd7d..ad5fdf74d8ba9c359eb4395b7b362fafd4b158ac 100644 Binary files a/neuronxcc-2.21.33363.0+82129205/MODULE_14488951057292576015+e30acd3a/model.neff and b/neuronxcc-2.21.33363.0+82129205/MODULE_14488951057292576015+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_14607415948795306857+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_14607415948795306857+e30acd3a/model.hlo_module.pb index a040628b2dd49b30b03c553a530c0e2c76d57bb3..5712d4fcff68f6a51fefa0f5b6126807976fbf33 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_14607415948795306857+e30acd3a/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_14607415948795306857+e30acd3a/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:96a2ca6d1c617f569228e4c09d146226ca8d607049cc5b813b8b9d0e42ebbe63 +oid sha256:fa209a761824ec9d108f7daed265afa9cd0efbc16932dab674967e6a7c7e8369 size 1585 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_14607415948795306857+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_14607415948795306857+e30acd3a/model.neff index 202c6b8521a788a3e20ee0e54c339aaa6dcf0ef6..8fb40cdf7854001396f9354289f1561cab9e1a59 100644 Binary files a/neuronxcc-2.21.33363.0+82129205/MODULE_14607415948795306857+e30acd3a/model.neff and b/neuronxcc-2.21.33363.0+82129205/MODULE_14607415948795306857+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_15195479995167874327+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_15195479995167874327+e30acd3a/model.hlo_module.pb index a57f719e018130b080aaa379975c88b7fb4bc4f2..2ba8ddb6a6c66b8b32ed7e44013c3837e1d0a35d 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_15195479995167874327+e30acd3a/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_15195479995167874327+e30acd3a/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:cac76d2035fb9d2728d0052857f47b57fdfac0d0fb43734a4806a5a5a4deaed5 +oid sha256:4a4ac9b0a8b2ce4471ef5b6f7f1efddd21946ec6b3423abee4412f97ec57d5a5 size 1582 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_15195479995167874327+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_15195479995167874327+e30acd3a/model.neff index eb727dbb5510b457d2390247c28550137146946f..0d97ebdea83a0c7843ae2fb65ac0e22b12dfa062 100644 Binary files a/neuronxcc-2.21.33363.0+82129205/MODULE_15195479995167874327+e30acd3a/model.neff and b/neuronxcc-2.21.33363.0+82129205/MODULE_15195479995167874327+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_15226158922329678840+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_15226158922329678840+e30acd3a/model.hlo_module.pb index 06263c496303dad9352931d0f93b594ba1e4b5e6..f0f1b06236b7314cb945f3874ccf72c3bdf10957 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_15226158922329678840+e30acd3a/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_15226158922329678840+e30acd3a/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:6da43c48a28ebcc7b93e066fd156567bdd942450f41f926a0294a6275097cfa1 +oid sha256:db51f0ec93a734eaa52287c97a0ba33c1a89b534a4c9d9d74ff982afde0b4f38 size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_15226158922329678840+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_15226158922329678840+e30acd3a/model.neff index 9ac254bb0a0cc701348fca4bd839ab597c6b2b7c..93e4b7bfc91ee8668946f6d542a10ce66f603b4e 100644 Binary files a/neuronxcc-2.21.33363.0+82129205/MODULE_15226158922329678840+e30acd3a/model.neff and b/neuronxcc-2.21.33363.0+82129205/MODULE_15226158922329678840+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_15549583432468528942+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_15549583432468528942+e30acd3a/model.hlo_module.pb index d604ba392cf0e35823e332233d7b81e4b72c37be..62ff22654ec4dc62d44eafbf09ac25fc35ed294f 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_15549583432468528942+e30acd3a/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_15549583432468528942+e30acd3a/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:bf03da6cc8efe76396a94a9ec2ab1e947e3aae3b2004650f06be02c1cb664237 +oid sha256:39b9add75c493f66e27b194511c292de8035765ba18b4d8a2b24df70fa192d2f size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_15549583432468528942+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_15549583432468528942+e30acd3a/model.neff index 6679d8da0f29a9f2fcfe7084549f4e8e1d6ef312..81d8d176914faa6599b4a0b83f96a1eac1dcf3b6 100644 Binary files a/neuronxcc-2.21.33363.0+82129205/MODULE_15549583432468528942+e30acd3a/model.neff and b/neuronxcc-2.21.33363.0+82129205/MODULE_15549583432468528942+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_15883166014121986340+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_15883166014121986340+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_15883166014121986340+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_15883166014121986340+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_15883166014121986340+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_15883166014121986340+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_15883166014121986340+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..9671afab08a0471f9f5a5813704ee44e5e83535c --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_15883166014121986340+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:751ad0d352e51628e69a4053e21da34fa6a3fe1505bd5aa83ec9125b195f7a7f +size 1146 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_15883166014121986340+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_15883166014121986340+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..ee967c8441ec6e0168cf22c85c24f989c943a169 Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_15883166014121986340+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_15974718484747567133+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_15974718484747567133+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_15974718484747567133+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_15974718484747567133+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_15974718484747567133+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_15974718484747567133+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_15974718484747567133+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..27f758616dec356edcb84f35123f1064c40b8599 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_15974718484747567133+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d1c22c14330d11384a0e107fd818c9fd613c57aeadbcf076ccac20973c3e4eb +size 1291 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_15974718484747567133+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_15974718484747567133+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..b85143180d66c457594b125b4c6a7be99c89d666 Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_15974718484747567133+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_16063773584643651549+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_16063773584643651549+e30acd3a/model.hlo_module.pb index 7fcef3c41c0d6edeb3832dd09ad315e34d1c3b05..29ebb18e871a0955609e3810c5661d2ef94f636e 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_16063773584643651549+e30acd3a/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_16063773584643651549+e30acd3a/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:3772c9b53cf2c833d0d1c07c90e6b645617324394ad76cd3936137a547c93adf +oid sha256:44dc0332f93f32c0338766e0766a66bef9979be73c78f1a56cc059b3e69a2c18 size 1144 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_16063773584643651549+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_16063773584643651549+e30acd3a/model.neff index c21c7d2e5f5c638059050ec12657584a9419c400..42c0ca9f0cf16a8e05962a5738b9ea89ada0f6a0 100644 Binary files a/neuronxcc-2.21.33363.0+82129205/MODULE_16063773584643651549+e30acd3a/model.neff and b/neuronxcc-2.21.33363.0+82129205/MODULE_16063773584643651549+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_16540141349946602462+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_16540141349946602462+e30acd3a/model.hlo_module.pb index c442d79bba92ba90bb790ec80c021d4af39c8a75..00ba1108f0d4daa2fc7841ea27a98a3b30b9b63e 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_16540141349946602462+e30acd3a/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_16540141349946602462+e30acd3a/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:2b8e1780595d270fdec28ffa5135fd9fc122d81455077a5333563bb01065f9eb +oid sha256:6e641a442ff6b13aab5d55f41b615160ec53ea1744f800537a9bc6b4ea5d2d91 size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_16540141349946602462+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_16540141349946602462+e30acd3a/model.neff index bff4e87e51aeab73ff3e42712722e9cc4eae3fe6..0dca92d713ba3831e68b75b6d3457c0953758854 100644 Binary files a/neuronxcc-2.21.33363.0+82129205/MODULE_16540141349946602462+e30acd3a/model.neff and b/neuronxcc-2.21.33363.0+82129205/MODULE_16540141349946602462+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_1659424179484095552+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_1659424179484095552+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_1659424179484095552+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_1659424179484095552+e30acd3a/model.hlo_module.pb index a7e25eeb37121b478d999b750fbcd88e0bf27d24..6f491a28cb8f0836885e137c85358c351e5fb414 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_1659424179484095552+e30acd3a/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_1659424179484095552+e30acd3a/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:394ead2842be9fad710a8dd2987593d6340a0f6bf739f2bb6bf829d1a65712b6 +oid sha256:1a0eb013b9039ac2e1141e03ab07c452575f5f8da1b4c76b11772a72a35308c0 size 1146 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_1659424179484095552+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_1659424179484095552+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..5be640dbc0a79f59ac3d2d5691d2a38dba11963a Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_1659424179484095552+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_17037369046574255528+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_17037369046574255528+e30acd3a/model.hlo_module.pb index ebfeed2f0336a7c1b2cc132d29e93f0f47e0271c..263760b26897da1e3f89e75da326020460afa50d 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_17037369046574255528+e30acd3a/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_17037369046574255528+e30acd3a/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ea6f95f6359e63ec8ab80994433ce28b0635e7041da26b6fcede717acc049264 +oid sha256:8a5f71e6a0795190aa972c48160b2bd3cc8cd9125f66e09f924b307a46646e34 size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_17037369046574255528+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_17037369046574255528+e30acd3a/model.neff index 658b5eac55a8a4c6bdab7cf22e4798dc7c570b56..b577d0fc59badd803edf87c26765c9e5db736d37 100644 Binary files a/neuronxcc-2.21.33363.0+82129205/MODULE_17037369046574255528+e30acd3a/model.neff and b/neuronxcc-2.21.33363.0+82129205/MODULE_17037369046574255528+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_17162153672426857671+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_17162153672426857671+e30acd3a/model.hlo_module.pb index ff8cfe6fb48f24862061ffd1e69bb93e259f494b..db6925dc5cf3a38cee2ea14c890a7f245cda9b27 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_17162153672426857671+e30acd3a/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_17162153672426857671+e30acd3a/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:a955ad497f25e8cfbd39bcb81ffd84a6762f8808cf9be1033d56672fdf6f8d9e +oid sha256:112b39a2281d37bb12a3d1f76dde6d1b15bf3ade7e146d2eb1f82679ae0b04d1 size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_17162153672426857671+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_17162153672426857671+e30acd3a/model.neff index b289d48571ec771e4bebf5f8dfdbcf5c7938af25..f9c45e57eeea0eed3205cb1b915ea1ccd3808448 100644 Binary files a/neuronxcc-2.21.33363.0+82129205/MODULE_17162153672426857671+e30acd3a/model.neff and b/neuronxcc-2.21.33363.0+82129205/MODULE_17162153672426857671+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_17184761711863280677+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_17184761711863280677+e30acd3a/model.hlo_module.pb index e8be5b68c75b45794bc5de7c2deca020c8a382cb..ffa69b6358c65f95c1866f4a55e68bc53c395dd2 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_17184761711863280677+e30acd3a/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_17184761711863280677+e30acd3a/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:f3a1cab3ecba7a6f07cc3ee1cd169a5cdacda09119c1f16840b98b4578735cc0 +oid sha256:d54f99a3641771607fe60a04580562b612f9cfcf58da242351adb5650cf86be6 size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_17184761711863280677+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_17184761711863280677+e30acd3a/model.neff index a4aca912d0f68cf75f5af021bbe2e0e6326c1cf5..019fb7baa0eb479bd4ad5aa4cb2b05dcdd9848b6 100644 Binary files a/neuronxcc-2.21.33363.0+82129205/MODULE_17184761711863280677+e30acd3a/model.neff and b/neuronxcc-2.21.33363.0+82129205/MODULE_17184761711863280677+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_17685401492131160329+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_17685401492131160329+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_17685401492131160329+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_17685401492131160329+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_17685401492131160329+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_17685401492131160329+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_17685401492131160329+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..eef51ae4b0f55ff7ca4784ee060dc802e160000b --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_17685401492131160329+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f3c9067722287a88d585e5a8ee2251cbe208242934268d9cd5304dc3c14dbe2 +size 1291 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_17685401492131160329+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_17685401492131160329+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..57d83894d08a02635bd6298ebe06a13e4b61c8cb Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_17685401492131160329+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_17713911408407405055+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_17713911408407405055+e30acd3a/model.hlo_module.pb index 1b9649878f68ec37ea7456352663f5ec0da487cd..5dbbf792dfbab20c2e61ea77f19167e661c2c336 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_17713911408407405055+e30acd3a/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_17713911408407405055+e30acd3a/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:35d56233ecce04fbfae7d9f14fe4701e9080011d5ce4b5654ed54e146a5131e7 +oid sha256:9480cbce6414aef1a35a59823e5ddcadbd9334cf968704f9fbe16adb3717e5f2 size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_17713911408407405055+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_17713911408407405055+e30acd3a/model.neff index 62c364c70b382ca4c02dc8d1a9c3c50ba2c04846..fa60b22d3e0ad87ee3aa5c32cb1f647b0b52b426 100644 Binary files a/neuronxcc-2.21.33363.0+82129205/MODULE_17713911408407405055+e30acd3a/model.neff and b/neuronxcc-2.21.33363.0+82129205/MODULE_17713911408407405055+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_1837940185986854500+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_1837940185986854500+e30acd3a/model.hlo_module.pb index c13b24be1b411fb95f11aca98e792ec3ea448a84..5480e53419eec50055abdb1f7b74d9734a32e76f 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_1837940185986854500+e30acd3a/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_1837940185986854500+e30acd3a/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:e73bcffc136d2dc217b7e571cf1e8f5fa55276d132fce5e1fa93e287f5af7f11 +oid sha256:babc447ed6537b79e5de649d022948bf3ead1d92151f52916009fdd8cfc9a70b size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_1837940185986854500+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_1837940185986854500+e30acd3a/model.neff index 9f7d2dfc38d640fef68e686f85554e160ea78c28..afc55c1971d067a58cc311e67d0e570e153312e8 100644 Binary files a/neuronxcc-2.21.33363.0+82129205/MODULE_1837940185986854500+e30acd3a/model.neff and b/neuronxcc-2.21.33363.0+82129205/MODULE_1837940185986854500+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_1870165519051566644+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_1870165519051566644+e30acd3a/model.hlo_module.pb index 64c363347089b8883c973378fd169156b3d5d37f..db6ec8ae45917c795527ab84940df70bdbc05481 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_1870165519051566644+e30acd3a/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_1870165519051566644+e30acd3a/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:27439c189bb0cd81fadd20b58b5906d3ba31eb47fb16e84c9c4884fd47c96c86 +oid sha256:b8babac8da693fc6965aa30698c4e38f9de4fca47cdf6527947e0aa3fed52381 size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_1870165519051566644+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_1870165519051566644+e30acd3a/model.neff index 0a59f8998776dad95a26ac1ef7078adbf6aae177..05352e78306cf3baf70817cca1aa9fbfe018157b 100644 Binary files a/neuronxcc-2.21.33363.0+82129205/MODULE_1870165519051566644+e30acd3a/model.neff and b/neuronxcc-2.21.33363.0+82129205/MODULE_1870165519051566644+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_2240472231266337587+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_2240472231266337587+e30acd3a/model.hlo_module.pb index 5d0db9e7ecf490acae5d2a08a556d5a3cc486071..0fdeb64d97f1f9f0cb634478862cce72df69402e 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_2240472231266337587+e30acd3a/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_2240472231266337587+e30acd3a/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:50c3e59a5961d2e35404f090b0648874d10a8a12721fc9dd980ac5820c26f740 +oid sha256:86df59bb18ce74997c0039db7c246146f685971b9e201cf78b75d2e13e90fc59 size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_2240472231266337587+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_2240472231266337587+e30acd3a/model.neff index a1c4aca4fd8e65bbb5442296997f14abb45d7c48..b28535733db8700fc8616c642711482a52ed7042 100644 Binary files a/neuronxcc-2.21.33363.0+82129205/MODULE_2240472231266337587+e30acd3a/model.neff and b/neuronxcc-2.21.33363.0+82129205/MODULE_2240472231266337587+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_2241641840113569106+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_2241641840113569106+e30acd3a/model.hlo_module.pb index cc1ce00e7cb09d68985412c4119709cc94b76c5d..e330ad40e6a1ca8480622f315057e7a3144046fd 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_2241641840113569106+e30acd3a/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_2241641840113569106+e30acd3a/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ccf86c59544ce69a4001c6270629b4619f4d42e402dedfa2d9963f7d82455d3e +oid sha256:f3fd5d3d3537914afbf25126d6a9fbf6201e8253671b1b0a06f7d4b163f804d6 size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_2241641840113569106+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_2241641840113569106+e30acd3a/model.neff index 644dc6570565f8dd403f0028480c4e668d09e347..e53f9cdcb75f1780ed863e11b7d1ac642590d49c 100644 Binary files a/neuronxcc-2.21.33363.0+82129205/MODULE_2241641840113569106+e30acd3a/model.neff and b/neuronxcc-2.21.33363.0+82129205/MODULE_2241641840113569106+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_2447413629898598397+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_2447413629898598397+e30acd3a/model.hlo_module.pb index d4ca017054b56947e59148088abb2ea6b4219f68..b6a2058d2f3e00fc230aadd524dfbdfc2382cc60 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_2447413629898598397+e30acd3a/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_2447413629898598397+e30acd3a/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:7ced77d6c5df1c8b63db687bdee8b798902c7c2c383f1d0ae937d1eb2857ae5f +oid sha256:f1910358302156bf24f8b3f454f40d94683a77fa5c96f15aebe10f2e36cd3f18 size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_2447413629898598397+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_2447413629898598397+e30acd3a/model.neff index 6fba7d7caae4ace9cce45e1d55e1196d62bac497..cbfdebf43904e36c539a7d60bfc8d2cd3ef88629 100644 Binary files a/neuronxcc-2.21.33363.0+82129205/MODULE_2447413629898598397+e30acd3a/model.neff and b/neuronxcc-2.21.33363.0+82129205/MODULE_2447413629898598397+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_2477619772153140591+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_2477619772153140591+e30acd3a/model.hlo_module.pb index 58b0ab2cf034398af2b01f8b3fa5220ae75a8817..bd25d3bd4519dfdf6857354ea3a28314daf9ebf0 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_2477619772153140591+e30acd3a/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_2477619772153140591+e30acd3a/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:912d560b87afecd94116a1c9905e4c2cc4d87bbbacef231ac77ccf50af3c6d57 +oid sha256:4fd456e855cdd48078aa665f2343a812cc96abc323ece2d4e795a22e6fb5de46 size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_2477619772153140591+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_2477619772153140591+e30acd3a/model.neff index 016089fa8b101d8d371a41d6e3e4fe91a489ddba..275a2f345d10342909156be71cd8dc74a0735dbe 100644 Binary files a/neuronxcc-2.21.33363.0+82129205/MODULE_2477619772153140591+e30acd3a/model.neff and b/neuronxcc-2.21.33363.0+82129205/MODULE_2477619772153140591+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_2840230091891637644+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_2840230091891637644+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_2840230091891637644+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_2840230091891637644+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_2840230091891637644+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_2840230091891637644+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_2840230091891637644+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..c4c87b055fc8db47ad27e1f0e3085518aacfde15 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_2840230091891637644+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44b8b95c72a386bb3e43d8c3215c0de9630ab93508791e31274f396d83ebf9f9 +size 1291 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_2840230091891637644+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_2840230091891637644+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..2818dccbcff7b38ba99dfae385830f8aef4dc98a Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_2840230091891637644+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_3006935121772265506+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_3006935121772265506+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_3006935121772265506+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_3006935121772265506+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_3006935121772265506+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_3006935121772265506+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_3006935121772265506+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..04065d3577d9a8bdf71269560c7954c13dad9807 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_3006935121772265506+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b06e0c0b373b6d1df920a87171209526cf1aebf54675cf2c9948f1c6debbe6fc +size 2861 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_3006935121772265506+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_3006935121772265506+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..d97f5cd40c4054b72d7f47d38ee2183abdec869d Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_3006935121772265506+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_31535d3f6678c545547b+0e774686/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_31535d3f6678c545547b+0e774686/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..1917dc36d0e27a328038a29b5c488797ca6bcfdf --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_31535d3f6678c545547b+0e774686/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--enable-saturate-infinity", "--auto-cast=none", "--model-type=transformer", "-O1", "--logfile=/tmp/nxdi_test_af4d6fed-a8ce-42f6-8c19-9cad62babd7a/compiler_workdir/SoftmaxWithMask/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_31535d3f6678c545547b+0e774686/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_31535d3f6678c545547b+0e774686/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_31535d3f6678c545547b+0e774686/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_31535d3f6678c545547b+0e774686/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..f2ee42eb9f1aa790cfddd8e066da7c8aeb1214d9 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_31535d3f6678c545547b+0e774686/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70f96487dad4bb02b98bf2c955fe59650a5fdbcf1d763fdf56ec412b62b5774c +size 5596 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_31535d3f6678c545547b+0e774686/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_31535d3f6678c545547b+0e774686/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..d1af70b38124b8e75e03127d48d226cf702940ae Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_31535d3f6678c545547b+0e774686/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_3742470769527135970+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_3742470769527135970+e30acd3a/model.hlo_module.pb index 0144f7524b44832ee3b9b97df32c513be07b762a..a527f195e71af84bf559f2c6297355cd91fe9f74 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_3742470769527135970+e30acd3a/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_3742470769527135970+e30acd3a/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d9f2d2d1e1238756da7acab6abca4cdd1f5ea3123f8be4870d733f60b2b16117 +oid sha256:b06d266597bfc4a71c823f51dd80846d148d49dcd9fda8d250c5db167e74ea66 size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_3742470769527135970+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_3742470769527135970+e30acd3a/model.neff index e39f6e7f619aaf57312dbbf04574033786189700..2d3a7dceda21cd029c8faf430c78a1466e9db8ef 100644 Binary files a/neuronxcc-2.21.33363.0+82129205/MODULE_3742470769527135970+e30acd3a/model.neff and b/neuronxcc-2.21.33363.0+82129205/MODULE_3742470769527135970+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_3802233204730345176+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_3802233204730345176+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_3802233204730345176+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_3802233204730345176+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_3802233204730345176+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_3802233204730345176+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_3802233204730345176+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..2c3ee7f331ebf0fc5ca09f98b78b79a1db6c2ff3 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_3802233204730345176+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45d47abf3c330635b4c78a0f2a55199867d8536e9e0ecce4b3e59f5da320219a +size 1146 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_3802233204730345176+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_3802233204730345176+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..6cfc92b02f7f77dcdf06cd7d2e4aed88e5c6fa70 Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_3802233204730345176+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_3918194918412354509+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_3918194918412354509+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_3918194918412354509+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_3918194918412354509+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_3918194918412354509+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_3918194918412354509+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_3918194918412354509+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..401a28fc743e817fbcf6690eb84dfffe494d415d --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_3918194918412354509+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eda452c1f2e955560ffd996e3edb2737428a433cd7233e337f8cc1db72a2a1ed +size 1146 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_3918194918412354509+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_3918194918412354509+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..17a42beba073b5e4b86c9b5989ea4a2307576634 Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_3918194918412354509+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_3e60b5a04d3967af005e+813e637b/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_3e60b5a04d3967af005e+813e637b/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..6ad21fa2f3c6e9dedf4b15e6dc09bb20e9f23c98 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_3e60b5a04d3967af005e+813e637b/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--enable-saturate-infinity", "--auto-cast=none", "--model-type=transformer", "-O1", "--logfile=/tmp/nxdi_test_c9de36f4-8076-4fd4-aeda-464c7b3dd45b/compiler_workdir/SoftmaxNoMask/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_3e60b5a04d3967af005e+813e637b/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_3e60b5a04d3967af005e+813e637b/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_3e60b5a04d3967af005e+813e637b/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_3e60b5a04d3967af005e+813e637b/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..36897c006be58fcc135059831fe41ce96ad676a1 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_3e60b5a04d3967af005e+813e637b/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e542c76cf27c3f807feac47dd3f58fd4c308e8d9e932f0732774bee19d640d8 +size 3881 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_3e60b5a04d3967af005e+813e637b/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_3e60b5a04d3967af005e+813e637b/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..4ba13944203e4fdffc1302ec2d5c6c2011efef3c Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_3e60b5a04d3967af005e+813e637b/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_404621bbb97f199be5e0+f077467b/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_404621bbb97f199be5e0+f077467b/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..9069ce2d641d7fadfef7a2e2873e501705eed300 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_404621bbb97f199be5e0+f077467b/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--enable-saturate-infinity", "--auto-cast=none", "--model-type=transformer", "-O1", "--logfile=/tmp/nxdi_test_d9b0159b-b633-49f5-b266-20dd4d853192/compiler_workdir/AttentionModelWrapper/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_404621bbb97f199be5e0+f077467b/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_404621bbb97f199be5e0+f077467b/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_404621bbb97f199be5e0+f077467b/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_404621bbb97f199be5e0+f077467b/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..89eb2339905a3e3d5d05af1d33aeb632bbb1436e --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_404621bbb97f199be5e0+f077467b/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14a5d6816ffd369be6c10cb45f27b95ad073d2be256d587642764fb87bce2d53 +size 8979 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_404621bbb97f199be5e0+f077467b/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_404621bbb97f199be5e0+f077467b/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..2a79062625612297add513265ac9fc9fdfc15a42 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_404621bbb97f199be5e0+f077467b/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:acb205bf62754cc797579daa6e1b2f6ceffbeefee347def969f6ed4fb28cf717 +size 246784 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_404621bbb97f199be5e0+f077467b/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_404621bbb97f199be5e0+f077467b/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..e176d07ff07b720767edd134f845255aff4542c1 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_404621bbb97f199be5e0+f077467b/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b81121540b12a049a8a8294615bbdc14be3410b16be8631f0cf251253045c34 +size 249608 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_4609340858424122400+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_4609340858424122400+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_4609340858424122400+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_4609340858424122400+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_4609340858424122400+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_4609340858424122400+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_4609340858424122400+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..4f00d1ee5a3d72ce0aa2e85b1a1462faa83391e6 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_4609340858424122400+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2fe81b6af6291d6553fb75265b08a1c1c3ed232e7dc9c209127565895a5c334a +size 1146 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_4609340858424122400+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_4609340858424122400+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..c91761bd393ce27c4f0b942713c0d66c04bdb9a4 Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_4609340858424122400+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_4692571821501481255+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_4692571821501481255+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_4692571821501481255+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_4692571821501481255+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_4692571821501481255+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_4692571821501481255+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_4692571821501481255+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..1ea91108b6fd8766b381071c23fb8613cd33fec8 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_4692571821501481255+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f102ed747978770493ce35a703b63b51368f818a5fd525765b97f841774e0c6f +size 1291 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_4692571821501481255+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_4692571821501481255+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..48e6448373aa3d24be02c2a7224b30c726f1e840 Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_4692571821501481255+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_4729947242617427400+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_4729947242617427400+e30acd3a/model.hlo_module.pb index ab5d2955c5aeb33c2b8423e7facddd2ddead1ea3..b34c142b597baea623a9f31df5bc00b1dbc05b8d 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_4729947242617427400+e30acd3a/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_4729947242617427400+e30acd3a/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:0dc16184a9197b242ab9bb070a2262cfc60a11b4b84c12d4ea59fad356f64771 +oid sha256:5ddd2b34a9153add60918b486cc982c36621219d75e68c4d4ffe7308aa34f0b1 size 1585 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_4729947242617427400+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_4729947242617427400+e30acd3a/model.neff index 8263ea8b3de78893adf983571add9f78cf4a97f4..0ee75195c229d877b8ec24b0f3a1da9f33180e5f 100644 Binary files a/neuronxcc-2.21.33363.0+82129205/MODULE_4729947242617427400+e30acd3a/model.neff and b/neuronxcc-2.21.33363.0+82129205/MODULE_4729947242617427400+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_4748150422668476963+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_4748150422668476963+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_4748150422668476963+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_4748150422668476963+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_4748150422668476963+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_4748150422668476963+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_4748150422668476963+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..4afd653aa72306252c0b83a036cc55756cf921c8 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_4748150422668476963+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb57090a07022ca0fe061700dbe98acf47b871dbedbcb190ffbaa9782eae39a4 +size 1146 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_4748150422668476963+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_4748150422668476963+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..a396aa212aa9a74e123ce8fb506e34776749b1c2 Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_4748150422668476963+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_4982309848892198153+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_4982309848892198153+e30acd3a/model.hlo_module.pb index 409dc6a76c47febfd2e6764450b15c032e0d0419..419968ded4f2dd0690620cf7b1ff0c95bcc10edb 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_4982309848892198153+e30acd3a/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_4982309848892198153+e30acd3a/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c0dcdccfc9cb1289cceea693cfb9f27f91556fcbe3060a7aeffcbef90ef8946d +oid sha256:ef983e0fbbc35dfee7e2b243b501d978fb75940f4bce747d55d3755a99794be9 size 1585 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_4982309848892198153+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_4982309848892198153+e30acd3a/model.neff index 7feeecde5013bd311d129e9b73e614feeacff2fd..6271fade7ccaf9b060bd2bd0153eea33b644dcb8 100644 Binary files a/neuronxcc-2.21.33363.0+82129205/MODULE_4982309848892198153+e30acd3a/model.neff and b/neuronxcc-2.21.33363.0+82129205/MODULE_4982309848892198153+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_5056926643664195969+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_5056926643664195969+e30acd3a/model.hlo_module.pb index 7da2d77d6f20dd2d43935bc46b7a42f00a1b53fd..403f66e7baa3f3b756ab751db521da376ca942e2 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_5056926643664195969+e30acd3a/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_5056926643664195969+e30acd3a/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:058681d48647e0c9b3dbe7688a61919a6582484d2f0b81ba3c0155e378d39840 +oid sha256:3dc8cf665df601199ae361822fc4f204b6fca26d47e2650a3445377fef620a7a size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_5056926643664195969+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_5056926643664195969+e30acd3a/model.neff index ad763435ca14fea6e494cc68dbcdab7383f59eea..4f7ae33c005e1891a126a864868cb2d320215e0b 100644 Binary files a/neuronxcc-2.21.33363.0+82129205/MODULE_5056926643664195969+e30acd3a/model.neff and b/neuronxcc-2.21.33363.0+82129205/MODULE_5056926643664195969+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_5060945789978167091+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_5060945789978167091+e30acd3a/model.hlo_module.pb index 9f7cfa734d8f530c72009eb32f5920d1b7011ac8..79aeaef2da595105480fe25b7c545d9748c7b2b3 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_5060945789978167091+e30acd3a/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_5060945789978167091+e30acd3a/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:f5cc8fae4180e9c37d3edf0a9c33cb9a77cc20d3a208ab308dd26971d505a3f2 +oid sha256:61ebecf5ddb703eee9f52d51e5dfafe50073fdf4ed9bbe9c38265fd5e4bf06bf size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_5060945789978167091+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_5060945789978167091+e30acd3a/model.neff index c3e1d9df7d56d2f2630b9356f00b7248d6ca82c1..c9d275fd35d71bef2bed264b765d02951770523b 100644 Binary files a/neuronxcc-2.21.33363.0+82129205/MODULE_5060945789978167091+e30acd3a/model.neff and b/neuronxcc-2.21.33363.0+82129205/MODULE_5060945789978167091+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_5068307057019708073+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_5068307057019708073+e30acd3a/model.hlo_module.pb index c134283ccd0f0cb78d3df709fd00745d387a3bf2..e29104dfed9a1b9ca18e1108596eba7d3bfcbb2f 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_5068307057019708073+e30acd3a/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_5068307057019708073+e30acd3a/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d1bfa4233bec9ae7d38413a0183ed12d18519fc8a52d4be29ae06d39da17d8cd +oid sha256:71df08c7be422361b6bec9e9eceebb610b6cdf191b0f6f50992dd307056f3367 size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_5068307057019708073+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_5068307057019708073+e30acd3a/model.neff index db6bb0a5b3d4fda083e6e3bd99c94af9c0781cd7..29ee0a2af8a427e1aece437803feb7c36f8be033 100644 Binary files a/neuronxcc-2.21.33363.0+82129205/MODULE_5068307057019708073+e30acd3a/model.neff and b/neuronxcc-2.21.33363.0+82129205/MODULE_5068307057019708073+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_5221425564004302780+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_5221425564004302780+e30acd3a/model.hlo_module.pb index 72df21a2578f24d625843a1a3247988a3fbd65c4..e054c1381e5f95975c5a00440fb7626d86b9b663 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_5221425564004302780+e30acd3a/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_5221425564004302780+e30acd3a/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:41482b2311979515b0aeef0f82fffdc167ce3ed1cf6a003693418491cdb469fc +oid sha256:d5cc9fea64ae141cf6cec52aa4e82b3b59a58c188adcd60a01dedab867912119 size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_5221425564004302780+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_5221425564004302780+e30acd3a/model.neff index 0c746225bc978d88dd2fc327c375cd121535189f..e60177a2c89fbb8a8d80d48ae82a34b0eab51972 100644 Binary files a/neuronxcc-2.21.33363.0+82129205/MODULE_5221425564004302780+e30acd3a/model.neff and b/neuronxcc-2.21.33363.0+82129205/MODULE_5221425564004302780+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_5301538834954885513+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_5301538834954885513+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_5301538834954885513+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_5301538834954885513+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_5301538834954885513+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_5301538834954885513+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_5301538834954885513+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..b807a87939f8a0dfd4d068906d12792789099977 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_5301538834954885513+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a9fcf7ef02db98b5c965953c1378d7da22b4612eabc05a029505c9f32623fe4 +size 1291 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_5301538834954885513+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_5301538834954885513+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..5c8d94eea0e4724f335e0257648fe77018a2e042 Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_5301538834954885513+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_5346694134112720644+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_5346694134112720644+e30acd3a/model.hlo_module.pb index 1a8b11f7ea3f8104bfc94568f6e6605b1044b61a..32deb3efdbb0397b82e08f374b8f96e442583ad9 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_5346694134112720644+e30acd3a/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_5346694134112720644+e30acd3a/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:5163c6cbea635d50d6bcef42a476e0c486c1fe477ce65bddb01ef5d613f3ada7 +oid sha256:a716b0a6aff138e9b18726f20aea5a8a8be08483d57ea5115d22e17f1311d348 size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_5346694134112720644+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_5346694134112720644+e30acd3a/model.neff index 49ebd07bab2483eb641ed27190176b7a0bde2a3c..09c49f48abe63695c3f134455678474d5526ed43 100644 Binary files a/neuronxcc-2.21.33363.0+82129205/MODULE_5346694134112720644+e30acd3a/model.neff and b/neuronxcc-2.21.33363.0+82129205/MODULE_5346694134112720644+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_578110665359387607+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_578110665359387607+e30acd3a/model.hlo_module.pb index 08f880bfd2f6bc4dbf4ba0e030ae57400b3644d9..fd5017c8b82cc95d576769b1e547b3981eef419f 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_578110665359387607+e30acd3a/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_578110665359387607+e30acd3a/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9416ee80e28588b7d58a56ed290c42e6942a1b3745ec238b91c7fafbc1f154e5 +oid sha256:3362e8815eac4eea5a1c2086bb6f3fe5428a81dd9b740ead591ffa0f862fb8cd size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_578110665359387607+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_578110665359387607+e30acd3a/model.neff index 0a4b67437bca50e840e4750cd8418b65a6880796..6b8ba0ccc95d838a16c6abb42e3c73fd0a0dbe38 100644 Binary files a/neuronxcc-2.21.33363.0+82129205/MODULE_578110665359387607+e30acd3a/model.neff and b/neuronxcc-2.21.33363.0+82129205/MODULE_578110665359387607+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_6208374896869439318+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_6208374896869439318+e30acd3a/model.hlo_module.pb index b2e45ac79e7cdd5ec4c177fbcf28a2783e9dfbea..6a8294758163c2493cda15c9e06290fd7ae3506d 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_6208374896869439318+e30acd3a/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_6208374896869439318+e30acd3a/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:286cd304747970894823fc06483ba76dfd74ce76d0989e5b2ba815f5c03c200e +oid sha256:969acdd9a8bd1b58487605bd99172caff83afe5f1b6ef1c272feb25a01fbe10a size 1585 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_6208374896869439318+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_6208374896869439318+e30acd3a/model.neff index dd6932da06790795019b38ca937d8c747c2a4efc..5d950f677729a52275fa40d0e45b54998628a22c 100644 Binary files a/neuronxcc-2.21.33363.0+82129205/MODULE_6208374896869439318+e30acd3a/model.neff and b/neuronxcc-2.21.33363.0+82129205/MODULE_6208374896869439318+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_6305938804443382221+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_6305938804443382221+e30acd3a/model.hlo_module.pb index d0f77914ffe027e73ead390ad61bd8c0fc019f22..0836ecda35ebde93846adfc4aeafbd5974116af6 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_6305938804443382221+e30acd3a/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_6305938804443382221+e30acd3a/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:69b9c9469d8eb89302c52a8b5ef28e5dcbefd0187702e88f5bfda4a4752be87d +oid sha256:bd3082d6299da8f09b654a5f2561f6ed683ede7cbf2c47a506960e4dfa0f731c size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_6305938804443382221+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_6305938804443382221+e30acd3a/model.neff index a9c6762bbb9f7cd5a0dcd160bf65e83ad0e93885..bc273a3d2bcb8a4ebd375a70b6fd5cc969fa2024 100644 Binary files a/neuronxcc-2.21.33363.0+82129205/MODULE_6305938804443382221+e30acd3a/model.neff and b/neuronxcc-2.21.33363.0+82129205/MODULE_6305938804443382221+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_6462012722744130561+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_6462012722744130561+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_6462012722744130561+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_6462012722744130561+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_6462012722744130561+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_6462012722744130561+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_6462012722744130561+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..26ec99769d25690b654937173d6d3c8f5096612b --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_6462012722744130561+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5dc3dbee591aa1a897f17043331c7acd2d931e0e3b85106811f7d8dc767a72b6 +size 1291 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_6462012722744130561+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_6462012722744130561+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..64005a018a9506b362a332cb35b3bf6f0eb250e3 Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_6462012722744130561+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_6465053070255633885+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_6465053070255633885+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_6465053070255633885+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_6465053070255633885+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_6465053070255633885+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_6465053070255633885+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_6465053070255633885+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..fc281971bbf0c5b3c61bcbbebf735d8ee19c19f8 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_6465053070255633885+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:637a792157c7a041784c4adb85b5957a8652b936fa3621e51c2818ec36ea4368 +size 1291 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_6465053070255633885+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_6465053070255633885+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..1a48194babfde3111fe2fc609467cdb4db848141 Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_6465053070255633885+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_6601989946514187606+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_6601989946514187606+e30acd3a/model.hlo_module.pb index ee1e423f2f3d8d36a62df3d8f7a6a4b196011bd1..dfd16295ccad9ad6795e5bf891cefe605d3407b3 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_6601989946514187606+e30acd3a/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_6601989946514187606+e30acd3a/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b0b98325b529fcc4a4bee1adf72ca1e7d9f89c8de8b1dcdb957931e7816140f6 +oid sha256:bb11806ad9bc8ab74bf7a70a0537fcc5c83612c7e5866726b78b8a1ad8cc65d4 size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_6601989946514187606+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_6601989946514187606+e30acd3a/model.neff index 6ed9fa6133ad18b6dddcec8ccbd2e6254f5f4cca..715db5269f449775bd4c31b78379af2dd6f1f154 100644 Binary files a/neuronxcc-2.21.33363.0+82129205/MODULE_6601989946514187606+e30acd3a/model.neff and b/neuronxcc-2.21.33363.0+82129205/MODULE_6601989946514187606+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_689110558945142051+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_689110558945142051+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_689110558945142051+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_689110558945142051+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_689110558945142051+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_689110558945142051+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_689110558945142051+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..e8e7142a0bbd6bb961c5605c34c13019e4407ed1 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_689110558945142051+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6de9fb6b895067c8cdb6359762fc6e84f92e321e26c6218ea598903a2774e38f +size 2861 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_689110558945142051+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_689110558945142051+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..4430aaf06a9f394cf8f61f03c5c5491cc3d3d419 Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_689110558945142051+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_6954418380069475056+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_6954418380069475056+e30acd3a/model.hlo_module.pb index cc4867fcc446b41950eb76b3e23b948cabacfbcb..0adba9e814700a38d69a4c042d4c64a57d34bef6 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_6954418380069475056+e30acd3a/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_6954418380069475056+e30acd3a/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:de02a218d743956a2996aaa5bd62b9f1638ffba8fbbee1533b1cdea8c050ea29 +oid sha256:e594846bafe9533de55e918ea8c905a5cf6d650050ca7a6667fffc254d4e2856 size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_6954418380069475056+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_6954418380069475056+e30acd3a/model.neff index 7210dd9abe1bcda21794bd4bf7033265879c1d0c..8270c287c937b89ddb0eef9927eb705c5b915438 100644 Binary files a/neuronxcc-2.21.33363.0+82129205/MODULE_6954418380069475056+e30acd3a/model.neff and b/neuronxcc-2.21.33363.0+82129205/MODULE_6954418380069475056+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_7071522469786365265+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_7071522469786365265+e30acd3a/model.hlo_module.pb index 65cd73c86e8a07ff02487d4536d1f111a13f904e..18265fc32520afff0b71ad9fdd95624957353235 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_7071522469786365265+e30acd3a/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_7071522469786365265+e30acd3a/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:cb0a6b6b9c81d5c6c20c442718dccbf485f40c87a8217af91107a5ab3e0af055 +oid sha256:e6c75e4f4fbb7e64001e956a17320bf8e04e38c442cf7b2926cffdee4ac28151 size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_7071522469786365265+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_7071522469786365265+e30acd3a/model.neff index f18a3a3f7cd6411fd170674e7c0a1428f8d2b954..b7160aaa4822c2986d85e50ae3e143123ae23c3a 100644 Binary files a/neuronxcc-2.21.33363.0+82129205/MODULE_7071522469786365265+e30acd3a/model.neff and b/neuronxcc-2.21.33363.0+82129205/MODULE_7071522469786365265+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_7430361747835832819+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_7430361747835832819+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_7430361747835832819+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_7430361747835832819+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_7430361747835832819+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_7430361747835832819+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_7430361747835832819+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..194fb624fd767e52bddf8e4449084ab2706ccc13 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_7430361747835832819+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4138a7c3f0fd71b471f0e3aebdb6e44687d9d223022b017f398208560c37b8e2 +size 1291 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_7430361747835832819+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_7430361747835832819+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..0e43a00f18a49765656fd396cbeeaddce20fffa7 Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_7430361747835832819+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_748714541699003438+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_748714541699003438+e30acd3a/model.hlo_module.pb index 624a3c1b56463ca0ba1cbc694c1d9b90576442b7..b83ce58c8fe4463e38b7dbc18d871d3f07f5baa0 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_748714541699003438+e30acd3a/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_748714541699003438+e30acd3a/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:f5a94da50ba3ee7f04a09d0f188a7ad5540e359965b908e16572e1a5f6151498 +oid sha256:a809cc81115bdf753052a01e81b7dc159fb080eb7978b8aa629dee8a18578eb6 size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_748714541699003438+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_748714541699003438+e30acd3a/model.neff index 4ba3cebab5f2a48b106da8f4a230731a97916fb8..67fb02b9b43aa91de6a373e0c19636652fcc4f5e 100644 Binary files a/neuronxcc-2.21.33363.0+82129205/MODULE_748714541699003438+e30acd3a/model.neff and b/neuronxcc-2.21.33363.0+82129205/MODULE_748714541699003438+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_7760252933458031364+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_7760252933458031364+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_7760252933458031364+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_7760252933458031364+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_7760252933458031364+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_7760252933458031364+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_7760252933458031364+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..930763f611785216058259fdcc3ef4da892b70ca --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_7760252933458031364+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78272e473bcea1b41467ca24293f499090407a72d5d6dc1e9b04988cb8958178 +size 1291 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_7760252933458031364+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_7760252933458031364+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..39865ba2f9424e08064ddfd6789e3b425a7a750c Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_7760252933458031364+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_780259796876411187+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_780259796876411187+e30acd3a/model.hlo_module.pb index 147c1586aac46ddfe7b367fb4f90a52b1589362e..52cd14423e731314228e47e41c76a7c6589078bf 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_780259796876411187+e30acd3a/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_780259796876411187+e30acd3a/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:4e3874129d23ad1c69d19cc9636edc6f6b0bec7684aaa4058429feb1e7acfc2c +oid sha256:6579b00592526fdafc15c6925475389090455f7ec42bd5e6c1ce1668f87fe02b size 1585 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_780259796876411187+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_780259796876411187+e30acd3a/model.neff index 39542d53bb3961c021aec3d7944bf64223663336..6bceed19ac71b556aa2914349e5f354237fd3d2a 100644 Binary files a/neuronxcc-2.21.33363.0+82129205/MODULE_780259796876411187+e30acd3a/model.neff and b/neuronxcc-2.21.33363.0+82129205/MODULE_780259796876411187+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_788940165194100575+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_788940165194100575+e30acd3a/model.hlo_module.pb index a3d9ab4f7c96a51129b485c987af0c3965fbd2e3..57fab77ef2631b5c5bad91d27bb78b26fcdbf8b2 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_788940165194100575+e30acd3a/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_788940165194100575+e30acd3a/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:12a4a82788fd9c10e258bc78cfac56903ed9e41e56c1b39918ac7a98aa50f857 +oid sha256:40505ede26f5eec04a38b8551d7d050115f239fdc3668526ecfe3853f9189947 size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_788940165194100575+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_788940165194100575+e30acd3a/model.neff index 711b0e81fd87e197987f7da6b59e52c2f83a80c1..4ea197061c91c26e997dfbe99fe3858337cf0e6d 100644 Binary files a/neuronxcc-2.21.33363.0+82129205/MODULE_788940165194100575+e30acd3a/model.neff and b/neuronxcc-2.21.33363.0+82129205/MODULE_788940165194100575+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_8025f9b606fa6335fe08+a32116a7/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_8025f9b606fa6335fe08+a32116a7/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..3c18214665ab208ee16402ace66a8dd081416d1a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_8025f9b606fa6335fe08+a32116a7/compile_flags.json @@ -0,0 +1 @@ +["--target=trn2", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=2", "--logfile=/tmp/nxd_model/context_encoding/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_8025f9b606fa6335fe08+a32116a7/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_8025f9b606fa6335fe08+a32116a7/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_8025f9b606fa6335fe08+a32116a7/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_8025f9b606fa6335fe08+a32116a7/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..823a91a77f54d152e1dc2b1e1fba48a7ac1163a3 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_8025f9b606fa6335fe08+a32116a7/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a8885abad749a70e422301c2e0899870471231329bcede2907602d5ac771047 +size 1289344 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_8025f9b606fa6335fe08+a32116a7/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_8025f9b606fa6335fe08+a32116a7/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..32414a9f5945e6c7cf6017b9758d5928e54f1de4 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_8025f9b606fa6335fe08+a32116a7/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d1c16fde6ef1a8f4b90b0747ca5676210a1df19cc62de7b94b1c0c13b20ae67 +size 728064 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_8093733071045345337+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_8093733071045345337+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_8093733071045345337+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_8093733071045345337+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_8093733071045345337+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_8093733071045345337+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_8093733071045345337+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..a26710e6ec5bc9c45adabd2337dd918aebc4ad65 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_8093733071045345337+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9fa0a0dcad7912b6b0e8ef6a6a1ca26d271370391d98b674bc70c0d5c0c94545 +size 1291 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_8093733071045345337+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_8093733071045345337+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..6a54095a89aefef24704223561f7624cbcad8909 Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_8093733071045345337+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_8432304590411733968+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_8432304590411733968+e30acd3a/model.hlo_module.pb index ea75b72ceb1ffddf1735837bb050ce370fb813af..f41aa27a9b7d1c67708bda46b4f47c87e7f45b4c 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_8432304590411733968+e30acd3a/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_8432304590411733968+e30acd3a/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:81c88ba71326839d9c30573e697266a88ef7c7e6ca153aca44fcb611072884d8 +oid sha256:63aeb84c5055fa2c4ef11a302568a19a4fdae9df5917526ed3b0e367cb06f1b0 size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_8432304590411733968+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_8432304590411733968+e30acd3a/model.neff index 78b3020a0f4b3514d2823af3281b88cb75c28775..9e0ad51be8223ac9858a13ddaa036c0e52ded8b3 100644 Binary files a/neuronxcc-2.21.33363.0+82129205/MODULE_8432304590411733968+e30acd3a/model.neff and b/neuronxcc-2.21.33363.0+82129205/MODULE_8432304590411733968+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_8468241434736974290+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_8468241434736974290+e30acd3a/model.hlo_module.pb index 5ce4a24a3f4ad9ddae0cf6c4f101d0fb719b0485..d16cbd7f1997d9854faae1cf17fcc1aaab7c1b83 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_8468241434736974290+e30acd3a/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_8468241434736974290+e30acd3a/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:924f25eeb83b1f2c854719d98be6e51db203789ac31568689f5bd4aef63dfb9a +oid sha256:2c4eb5109d26aa8a070f987fc9b402b4bfa89dfb9d86a71209ea631ce0227e54 size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_8468241434736974290+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_8468241434736974290+e30acd3a/model.neff index 8cf63b519dd0fc253a5de1381f2e58a41ce898cc..49c79255bb24d9d6d5c49ab22aff529b8f91bd2f 100644 Binary files a/neuronxcc-2.21.33363.0+82129205/MODULE_8468241434736974290+e30acd3a/model.neff and b/neuronxcc-2.21.33363.0+82129205/MODULE_8468241434736974290+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_8476840015321783067+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_8476840015321783067+e30acd3a/model.hlo_module.pb index 1efd6b7dedc83c3704cd1b735e12395887f6da8a..832eb3ec7e15539a99ec76cd73a46ee89e9639a4 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_8476840015321783067+e30acd3a/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_8476840015321783067+e30acd3a/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:e9b5c4ccf12d542b037ab62137b8b394682b100f2c521675c7bf12890efda020 +oid sha256:e9e06bb9b05365bfe6a340f110e8910147209c825be5935ad4382edc00cdb7f9 size 1585 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_8476840015321783067+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_8476840015321783067+e30acd3a/model.neff index f1c785df9c6ff3a021269f572b498971435f8c75..19badfe15d6c8065e93af411cf080adcb2da96bc 100644 Binary files a/neuronxcc-2.21.33363.0+82129205/MODULE_8476840015321783067+e30acd3a/model.neff and b/neuronxcc-2.21.33363.0+82129205/MODULE_8476840015321783067+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_8657275884604457834+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_8657275884604457834+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_8657275884604457834+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_8657275884604457834+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_8657275884604457834+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_8657275884604457834+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_8657275884604457834+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..72b4b6cdc79eb2878d6545c2a1c1c59af7212b4b --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_8657275884604457834+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f18fa528a6945c9c4216e24f009ca2198865c4781c203e938b6c8f641553d4bb +size 2861 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_8657275884604457834+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_8657275884604457834+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..772d9bbf822a72509ac1f2a88c2bb95a1979f3a1 Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_8657275884604457834+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_879201820668420060+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_879201820668420060+e30acd3a/model.hlo_module.pb index a2b43988cc81aa73f757af772d542c413e653e2e..0eb95f18dfc5c9ddcfe9b08371bb982f49dee242 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_879201820668420060+e30acd3a/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_879201820668420060+e30acd3a/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:cef670d6b80a7e4253b327fd39e1d079ac588f85021dabc03613787fe9e15793 +oid sha256:ca65651a228c0d284ad9e9397ccbb88d286a0b8348df1bd94a1203c1d79cf0cd size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_879201820668420060+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_879201820668420060+e30acd3a/model.neff index ba58a8ac545478c73d732c1d8901d02aa7bc55fa..52c5fad470bd024d846a166eb44db0bec052c419 100644 Binary files a/neuronxcc-2.21.33363.0+82129205/MODULE_879201820668420060+e30acd3a/model.neff and b/neuronxcc-2.21.33363.0+82129205/MODULE_879201820668420060+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_8874447663297084929+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_8874447663297084929+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_8874447663297084929+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_8874447663297084929+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_8874447663297084929+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_8874447663297084929+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_8874447663297084929+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..f9ed7eed3fd03bc5f97721d28be29095865281f7 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_8874447663297084929+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0d66898b506f270786d9c6bf4b29a31b0da5e43e4d64fd6ae60f8099c281c52 +size 1146 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_8874447663297084929+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_8874447663297084929+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..545dc9114e665153840cde4b735df785cc9a9de0 Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_8874447663297084929+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_9359742670556022940+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_9359742670556022940+e30acd3a/model.hlo_module.pb index d8aea4a29916e9ee6c3d3cb01dd7040f9449b6e7..92b0b1da6139ef6710b65e7a391ad79462d2bfae 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_9359742670556022940+e30acd3a/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_9359742670556022940+e30acd3a/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:e281a28fd4383e251e58b20244d279c47e2a97ff0e8d2ce7c4cdb5d6ebff3689 +oid sha256:d79f3f08811858666dbe36330c5514a97b0720ed5741fd83751c7c0790112e11 size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_9359742670556022940+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_9359742670556022940+e30acd3a/model.neff index 87eb28e4596daed06413ac0b47e33673f0db962b..e950d9930201e7eba4c9737f0a563adca9912fcb 100644 Binary files a/neuronxcc-2.21.33363.0+82129205/MODULE_9359742670556022940+e30acd3a/model.neff and b/neuronxcc-2.21.33363.0+82129205/MODULE_9359742670556022940+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_9360214757141243910+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_9360214757141243910+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_9360214757141243910+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_9360214757141243910+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_9360214757141243910+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_9360214757141243910+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_9360214757141243910+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..1284546c98ddb8d9020c191ceebbf2c8a89aa21d --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_9360214757141243910+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50c1a6d78b01c6278521150f68bc50079751f4242f26de93361048d11f797e41 +size 1146 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_9360214757141243910+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_9360214757141243910+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..ad18c567566ee18c4d72847f36000dff89df0f05 Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_9360214757141243910+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_9551663534243818596+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_9551663534243818596+e30acd3a/model.hlo_module.pb index 9918fd3fa8009a6648d5eb93e90edc50804acd4c..7b501b50bc4fdc408b325781010ccb1a00d5bda2 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_9551663534243818596+e30acd3a/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_9551663534243818596+e30acd3a/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c3bb8a07961986496e8562aaa6b8e2c95f1a16486d01671b496004968c006d1a +oid sha256:fdeb259c977147f4769a9268dd181b3b4bd7d86384aae41f1c0746dcc522774a size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_9551663534243818596+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_9551663534243818596+e30acd3a/model.neff index 95d02cfd4094e2a2c5d23ca91d65ff927ab9151e..6b91a324a0bdce8ec5741021f6e2b7596d97140c 100644 Binary files a/neuronxcc-2.21.33363.0+82129205/MODULE_9551663534243818596+e30acd3a/model.neff and b/neuronxcc-2.21.33363.0+82129205/MODULE_9551663534243818596+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_9721314421976720364+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_9721314421976720364+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_9721314421976720364+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_9721314421976720364+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_9721314421976720364+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_9721314421976720364+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_9721314421976720364+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..a1d74298b298220682d34cd6669cb432a3aaaa82 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_9721314421976720364+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d0a8bf136bc0f289b5b22a3f5ff3c5b30cd20a9e99cd24bc612701814abcea9 +size 1146 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_9721314421976720364+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_9721314421976720364+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..9a4ca064dff93a34ebf7dcb7e2e916ca6e23f29f Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_9721314421976720364+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_9884039268981168463+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_9884039268981168463+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_9884039268981168463+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_9884039268981168463+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_9884039268981168463+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_9884039268981168463+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_9884039268981168463+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..7dd5d7ac36ab5f04c9a38b0e2823abc8d2e51cf3 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_9884039268981168463+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13babe9b8b4c9ddb62d9e46af56fe1e34b6e9a35d17e697b5b254f8f5b18680c +size 1146 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_9884039268981168463+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_9884039268981168463+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..a20936c0b3ef97ffa2a86aaa5cc2084868271ce3 Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_9884039268981168463+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_a25a39b4c41e8b2cde6e+6170d8e1/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_a25a39b4c41e8b2cde6e+6170d8e1/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..9c277888420f00defd99fc3c102007a98b09199d --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_a25a39b4c41e8b2cde6e+6170d8e1/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/chunked_prefill/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_a25a39b4c41e8b2cde6e+6170d8e1/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_a25a39b4c41e8b2cde6e+6170d8e1/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_a25a39b4c41e8b2cde6e+6170d8e1/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_a25a39b4c41e8b2cde6e+6170d8e1/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..bee35309a6cb1252c8c82b31707070a8684b809e --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_a25a39b4c41e8b2cde6e+6170d8e1/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d99ef17361b13963a81e2e7ebdd2cb8142ebd33c31a1cedfb643ccb7cd1ddfe +size 551782 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_a25a39b4c41e8b2cde6e+6170d8e1/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_a25a39b4c41e8b2cde6e+6170d8e1/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..3a8f39263942ab957534c0a1c6e9c5feed4bcc72 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_a25a39b4c41e8b2cde6e+6170d8e1/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe9f6f6fa8602c292d8bed20681f75a427b10171d68800caa699cb6cc7cf0a8d +size 27464704 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_a8db5771dcb730ef5627+3794e5d6/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_a8db5771dcb730ef5627+3794e5d6/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..a74904a6596f71ac43cf3b8a9d6981f785fd9b02 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_a8db5771dcb730ef5627+3794e5d6/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--enable-saturate-infinity", "--auto-cast=none", "--model-type=transformer", "-O1", "--logfile=/tmp/nxdi_test_4b161061-7f6e-4061-bc2a-a55b5eb3a0a0/compiler_workdir/NeuronRMSNorm/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_a8db5771dcb730ef5627+3794e5d6/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_a8db5771dcb730ef5627+3794e5d6/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_a8db5771dcb730ef5627+3794e5d6/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_a8db5771dcb730ef5627+3794e5d6/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..6a2752c25c9f7e1092e2b55c010694e168610ce3 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_a8db5771dcb730ef5627+3794e5d6/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c774c6626fc91684e924b843c1fe807dadbbac6d8a8e19443663b43c13eac35 +size 1165 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_a8db5771dcb730ef5627+3794e5d6/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_a8db5771dcb730ef5627+3794e5d6/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..204d2be3ceae0da925266b4a981c4bd5e4526379 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_a8db5771dcb730ef5627+3794e5d6/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54f79c1536082e2fe6152d9be7d83f91813cbfffebec4a1d27ccb43eaa5c333c +size 103424 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_a8db5771dcb730ef5627+3794e5d6/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_a8db5771dcb730ef5627+3794e5d6/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..87ff861c07175fc6e9a27fb2369fbd7e1c5150ef --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_a8db5771dcb730ef5627+3794e5d6/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30bdc0c454dde2f3cfa630e975b39e14e117272950d115ad8cbd37001c4521d0 +size 104320 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_a91a06f2317ad34aad7f+ac10809c/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_a91a06f2317ad34aad7f+ac10809c/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..7d1678bf25666438bbebf65702a2233ae75c43c9 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_a91a06f2317ad34aad7f+ac10809c/compile_flags.json @@ -0,0 +1 @@ +["--target=trn2", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=2", "--logfile=/tmp/nxd_model/token_generation/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_a91a06f2317ad34aad7f+ac10809c/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_a91a06f2317ad34aad7f+ac10809c/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_a91a06f2317ad34aad7f+ac10809c/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_a91a06f2317ad34aad7f+ac10809c/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..821867f9b57e790440bf1c70dd0ec6d4c99e136c --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_a91a06f2317ad34aad7f+ac10809c/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f410eb8efec7853dce1d94bb5ba1679004696d458e302bbd8f359e02b86d306 +size 1576973 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_a91a06f2317ad34aad7f+ac10809c/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_a91a06f2317ad34aad7f+ac10809c/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..a45d4ead9afe36c072f136564255873ddeb460f4 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_a91a06f2317ad34aad7f+ac10809c/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd3f10d47e5ebdf00ca1b509d0aed43071b2dc5aa7b2fe3dcb0d2c0232982ac3 +size 769024 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_a91a06f2317ad34aad7f+ac10809c/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_a91a06f2317ad34aad7f+ac10809c/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..f637ea5ca3db363f57e37e3a84fdfa27332f31cc --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_a91a06f2317ad34aad7f+ac10809c/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38f3d708cc001e84251b07820eeab5216ff1b14738d308e7147f1cfe293151da +size 776820 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_bfde8ebf354636b209da+24129607/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_bfde8ebf354636b209da+24129607/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..836724f44545ce0dedda1521fd4c623a6ea8ec72 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_bfde8ebf354636b209da+24129607/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_bfde8ebf354636b209da+24129607/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_bfde8ebf354636b209da+24129607/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_bfde8ebf354636b209da+24129607/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_bfde8ebf354636b209da+24129607/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..7c5ced31ead1acb88758f209d98d6d6c718a90df --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_bfde8ebf354636b209da+24129607/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7792147eb96b7e159bc72f89bfa69844127e4c3aceed9e23bcdbbe9342af30a +size 83504 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_bfde8ebf354636b209da+24129607/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_bfde8ebf354636b209da+24129607/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..59fc1023d6d1408b445a82b4d6ce56168e7eae30 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_bfde8ebf354636b209da+24129607/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66628980cd693bdb1a1f4a3e93d46c48bb44dd7a0a43beb9ad7ccaa071283b8e +size 287744 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_c30315f06032f1c043d1+30e2d3d0/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_c30315f06032f1c043d1+30e2d3d0/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..a608847b5b7c7589901688944261f327d166d856 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_c30315f06032f1c043d1+30e2d3d0/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--enable-saturate-infinity", "--auto-cast=none", "--model-type=transformer", "-O1", "--logfile=/tmp/nxdi_test_7dca4664-63a1-4ce5-838c-d756e034b781/compiler_workdir/DecoderLayerWrapper/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_c30315f06032f1c043d1+30e2d3d0/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_c30315f06032f1c043d1+30e2d3d0/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_c30315f06032f1c043d1+30e2d3d0/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_c30315f06032f1c043d1+30e2d3d0/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..b050545e85d1adc68c37499eadab4b93c066a5c3 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_c30315f06032f1c043d1+30e2d3d0/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6b705d66437ed91a243401b8b01711b8337e3147746669a22b30b46f47feefa +size 29532 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_c30315f06032f1c043d1+30e2d3d0/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_c30315f06032f1c043d1+30e2d3d0/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..be94c2e504a72601af3958019dfa33584967e55b --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_c30315f06032f1c043d1+30e2d3d0/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9327b0cf663169129312c56e28032d97b57ad07be158488c396c5768db33c8f0 +size 328704 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_c30315f06032f1c043d1+30e2d3d0/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_c30315f06032f1c043d1+30e2d3d0/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..48e4e1c3398897492324b776b63bcd8b61fcc300 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_c30315f06032f1c043d1+30e2d3d0/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d723a14cf28dd8650c580bba5fae254fdfc1bbaa4667c63693989bde05c37fe +size 334452 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_cb2d4884f03167cab578+08d8be6b/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_cb2d4884f03167cab578+08d8be6b/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..b7e90d7a747ea0f95e15b1eff101fcacc848fdb2 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_cb2d4884f03167cab578+08d8be6b/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--enable-saturate-infinity", "--auto-cast=none", "--model-type=transformer", "-O1", "--logfile=/tmp/nxdi_test_fd4491e6-6dda-4f11-8c11-fafbddfe8378/compiler_workdir/SoftmaxNoMask/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_cb2d4884f03167cab578+08d8be6b/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_cb2d4884f03167cab578+08d8be6b/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_cb2d4884f03167cab578+08d8be6b/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_cb2d4884f03167cab578+08d8be6b/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..c213570f630857303e7b0ec653018546c02dc983 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_cb2d4884f03167cab578+08d8be6b/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5efb0ea01dc0241314f91e19cbd9be551d1a66e7dbadd7cd4d6473d6b7d4b99a +size 3881 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_cb2d4884f03167cab578+08d8be6b/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_cb2d4884f03167cab578+08d8be6b/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..61deafb7809f40ba5047fb7c4ea5789d8b8045ae Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_cb2d4884f03167cab578+08d8be6b/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_d8153f52c9c3889b4a06+652be344/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_d8153f52c9c3889b4a06+652be344/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..20264c77913a95273f6d6a80cee28cf77cbbf722 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_d8153f52c9c3889b4a06+652be344/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--enable-saturate-infinity", "--auto-cast=none", "--model-type=transformer", "-O1", "--logfile=/tmp/nxdi_test_13cb7918-0109-4210-ba6d-b589588ec400/compiler_workdir/Llama3RotaryEmbedding/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_d8153f52c9c3889b4a06+652be344/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_d8153f52c9c3889b4a06+652be344/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_d8153f52c9c3889b4a06+652be344/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_d8153f52c9c3889b4a06+652be344/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..f1e2473c54cffac949ecf31d3b6ec636c290545b --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_d8153f52c9c3889b4a06+652be344/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4a29d4cf27aec9af90e53324eff9ee69e033679482f4016a9dd3e5416c7c68a +size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_d8153f52c9c3889b4a06+652be344/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_d8153f52c9c3889b4a06+652be344/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..9e4a527aa58d75f956cc51947678771939a8aa41 Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_d8153f52c9c3889b4a06+652be344/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_df184b2f6028b6fccfdc+db16d357/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_df184b2f6028b6fccfdc+db16d357/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..c08d745741b85526c5ceecf2c1ba3415aca4c487 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_df184b2f6028b6fccfdc+db16d357/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--enable-saturate-infinity", "--auto-cast=none", "--model-type=transformer", "-O1", "--logfile=/tmp/nxdi_test_4eb027fd-2a4a-476e-ae2b-a826fd7885b9/compiler_workdir/DecoderLayerWrapper/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_df184b2f6028b6fccfdc+db16d357/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_df184b2f6028b6fccfdc+db16d357/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_df184b2f6028b6fccfdc+db16d357/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_df184b2f6028b6fccfdc+db16d357/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..307f90c8e8aa2efa59b5a7f04944e13f8a7e1b5f --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_df184b2f6028b6fccfdc+db16d357/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc96f7fb7fbf64514a818a779dd383411b8c502b328094192490c454e498a825 +size 14480 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_df184b2f6028b6fccfdc+db16d357/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_df184b2f6028b6fccfdc+db16d357/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..9e9c211b157c6d9ed67635bb3c66949456d5a4ed --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_df184b2f6028b6fccfdc+db16d357/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32f0120d4c1c0c8a37cfe82160688c2c81242ff27f87ac763983f8aca5bde845 +size 267264 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_df184b2f6028b6fccfdc+db16d357/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_df184b2f6028b6fccfdc+db16d357/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..93bebe6a1be22e000a93e3c7550effccc21b650b --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_df184b2f6028b6fccfdc+db16d357/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7cd02511c3689298813481d436d72ed4e32d62425cdb11606d1a82eb53ec3174 +size 272962 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_e737e0fdb56bf5bd26fc+a02c3a36/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_e737e0fdb56bf5bd26fc+a02c3a36/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..5726abc7d1d8c52fa95bc7919439a23a23fe3b9a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_e737e0fdb56bf5bd26fc+a02c3a36/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_e737e0fdb56bf5bd26fc+a02c3a36/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_e737e0fdb56bf5bd26fc+a02c3a36/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_e737e0fdb56bf5bd26fc+a02c3a36/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_e737e0fdb56bf5bd26fc+a02c3a36/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..7b4eefbd2651e1756e05dd96945b7e9399439438 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_e737e0fdb56bf5bd26fc+a02c3a36/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ca0e174781faf7dc336281f381d288b7d27dd3c52243716f097166fd70848a3 +size 86102 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_e737e0fdb56bf5bd26fc+a02c3a36/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_e737e0fdb56bf5bd26fc+a02c3a36/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..a358438e3102c677b6ec594594156e3399277773 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_e737e0fdb56bf5bd26fc+a02c3a36/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:663ebced910d4bdb605134a998b97ea4ddc5a73f5d07363842e83bc2651377f7 +size 277504 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_e737e0fdb56bf5bd26fc+a02c3a36/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_e737e0fdb56bf5bd26fc+a02c3a36/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..14dc157b88ba946b3acf09ea60e91f9a6cc7afb2 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_e737e0fdb56bf5bd26fc+a02c3a36/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e36580620d6308d2d7cdeadf8bd1f4c76d1e7afd6569a0c7ea922c8de742c81d +size 285717 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_ef4584e237468f2869e3+dd1b78ca/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_ef4584e237468f2869e3+dd1b78ca/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..2fcf50214e0db220836dde2f642031d7f481da3c --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_ef4584e237468f2869e3+dd1b78ca/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--enable-saturate-infinity", "--auto-cast=none", "--model-type=transformer", "-O1", "--logfile=/tmp/nxdi_test_8d411022-31d7-4f30-8410-c0801d071c7e/compiler_workdir/NeuronLlamaMLP/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_ef4584e237468f2869e3+dd1b78ca/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_ef4584e237468f2869e3+dd1b78ca/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_ef4584e237468f2869e3+dd1b78ca/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_ef4584e237468f2869e3+dd1b78ca/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..6da2cba66863fc471486cc2a5da22b16c00d6480 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_ef4584e237468f2869e3+dd1b78ca/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:993f99d2d09d34bd152af4c7f96a1e6e1d8788e1cd4aefb845c601d2f4d5fcfb +size 1931 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_ef4584e237468f2869e3+dd1b78ca/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_ef4584e237468f2869e3+dd1b78ca/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..88fb3731d26d3491414fbe6bd32d588fc6fb14b9 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_ef4584e237468f2869e3+dd1b78ca/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfe6768677cc5a016e88709e1d02c93fa46894cb3392440c29779a2a5c538a40 +size 134144 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_ef4584e237468f2869e3+dd1b78ca/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_ef4584e237468f2869e3+dd1b78ca/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..1b710cff895a0daf1539d3f83394991455e94a01 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_ef4584e237468f2869e3+dd1b78ca/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b11b25be44d197cffcd3a6bff0704df01754fcde47abf616594476eba8e7a918 +size 136222 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_fb23d3cbf7cf9571e3f2+0338459e/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_fb23d3cbf7cf9571e3f2+0338459e/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..93af01c40742a3dacacebd2f305104176392fc3a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_fb23d3cbf7cf9571e3f2+0338459e/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--enable-saturate-infinity", "--auto-cast=none", "--model-type=transformer", "-O1", "--logfile=/tmp/nxdi_test_cca1606a-ed8d-4999-abee-e5cd5f1c6759/compiler_workdir/AttentionModelWrapper/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_fb23d3cbf7cf9571e3f2+0338459e/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_fb23d3cbf7cf9571e3f2+0338459e/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_fb23d3cbf7cf9571e3f2+0338459e/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_fb23d3cbf7cf9571e3f2+0338459e/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..8203a5aa5acd37ae7e6d6839b35c7438ee9e48fd --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_fb23d3cbf7cf9571e3f2+0338459e/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0eb674f0ac78f8d22ded7c755c983de3edb92563308d60b734d19e694f489568 +size 11280 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_fb23d3cbf7cf9571e3f2+0338459e/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_fb23d3cbf7cf9571e3f2+0338459e/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..99daf3f93e16042790a104e1d9e40d5b5c7f5682 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_fb23d3cbf7cf9571e3f2+0338459e/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5347af44f340fcb45523c3366cd2ee525692f86a9f18cb0c1110442e6cefff1 +size 1444864 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_fb23d3cbf7cf9571e3f2+0338459e/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_fb23d3cbf7cf9571e3f2+0338459e/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..32fd48ca87fa7d0f5f8594894df978573f9a6e66 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_fb23d3cbf7cf9571e3f2+0338459e/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:472ef4af8a7fea050dbdfaefc64347c9d906532ff058203559b8f86a680a8b03 +size 1447845