diff --git a/.gitattributes b/.gitattributes index 321c203fa5210ce89b49c8fffc1cfbcc1c6c0da2..fd4f36d8f30386ce5a3f523de3d36bb11dd779db 100644 --- a/.gitattributes +++ b/.gitattributes @@ -5402,3 +5402,28 @@ neuronxcc-2.21.18209.0+043b1bf7/MODULE_e7235732a32fbac73c61+24129607/model.neff neuronxcc-2.21.18209.0+043b1bf7/MODULE_0efef6046521fed2cd76+24129607/model.neff filter=lfs diff=lfs merge=lfs -text neuronxcc-2.21.18209.0+043b1bf7/MODULE_7eab73a0314d91031486+a02c3a36/model.neff filter=lfs diff=lfs merge=lfs -text neuronxcc-2.21.18209.0+043b1bf7/MODULE_7eab73a0314d91031486+a02c3a36/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_3e60ddce17a65ac4ee68+24129607/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_410ef55a3aca5cd80fc8+24129607/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_457b87eb09461f794651+24129607/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_62abb2454c6da8d57ad5+a02c3a36/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_62abb2454c6da8d57ad5+a02c3a36/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_73587bc7122ba5a81758+80d05c3f/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_73587bc7122ba5a81758+80d05c3f/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_75329916c4da1120954c+6e4949b4/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_7c590ab98f45f8a8dd15+283df001/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_8eedc4b0995b3a9b6f52+677eeb9d/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_944763b36d810f4af582+24129607/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_b23271513f9095bde4db+2dde74c7/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_b23271513f9095bde4db+2dde74c7/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_bdf25cde1a48d420319c+a02c3a36/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_bdf25cde1a48d420319c+a02c3a36/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_c6ce9281df2387ad44c8+a02c3a36/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_c6ce9281df2387ad44c8+a02c3a36/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_ccb75cdf21908f3399fe+a02c3a36/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_ccb75cdf21908f3399fe+a02c3a36/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_ccd99eedd56f698b9cb3+24129607/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_cde3417e6918fabff4a7+a02c3a36/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_cde3417e6918fabff4a7+a02c3a36/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_f52fe8e88daf6dc9619a+24129607/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_fef9240b8fbfaca895ba+a02c3a36/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_fef9240b8fbfaca895ba+a02c3a36/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_3e60ddce17a65ac4ee68+24129607/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_3e60ddce17a65ac4ee68+24129607/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..836724f44545ce0dedda1521fd4c623a6ea8ec72 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_3e60ddce17a65ac4ee68+24129607/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_3e60ddce17a65ac4ee68+24129607/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_3e60ddce17a65ac4ee68+24129607/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_3e60ddce17a65ac4ee68+24129607/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_3e60ddce17a65ac4ee68+24129607/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..4db3f296bd83d447bf1608e9a2abc1112c1684ca --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_3e60ddce17a65ac4ee68+24129607/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:daa56f4ac44a9f5ef0c2bea00b070484c64f869b2f270f64ad0216a1b10a8a45 +size 82772 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_3e60ddce17a65ac4ee68+24129607/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_3e60ddce17a65ac4ee68+24129607/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..bad8e0ebaca175db701ae6fa6d664aff01e4e670 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_3e60ddce17a65ac4ee68+24129607/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a84198eb5174b5d745494fc9e45169601f49709a6a5320ffdd138cc9bccc5bb9 +size 267264 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_410ef55a3aca5cd80fc8+24129607/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_410ef55a3aca5cd80fc8+24129607/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..836724f44545ce0dedda1521fd4c623a6ea8ec72 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_410ef55a3aca5cd80fc8+24129607/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_410ef55a3aca5cd80fc8+24129607/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_410ef55a3aca5cd80fc8+24129607/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_410ef55a3aca5cd80fc8+24129607/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_410ef55a3aca5cd80fc8+24129607/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..5dfbfb6e23f85722a9218c297816fc53499e67b6 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_410ef55a3aca5cd80fc8+24129607/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c3a49dd72fdb5d2a07cca8e30e0036959275a194da4ffc5cad20247ce22ac7d +size 81516 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_410ef55a3aca5cd80fc8+24129607/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_410ef55a3aca5cd80fc8+24129607/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..329f0e8066f3fbce454ce202a958987b8b5af818 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_410ef55a3aca5cd80fc8+24129607/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a89e463f13e66b5411c6caf9fecb046931fdef9f43e787a5949136f485effee5 +size 267264 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_457b87eb09461f794651+24129607/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_457b87eb09461f794651+24129607/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..836724f44545ce0dedda1521fd4c623a6ea8ec72 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_457b87eb09461f794651+24129607/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_457b87eb09461f794651+24129607/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_457b87eb09461f794651+24129607/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_457b87eb09461f794651+24129607/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_457b87eb09461f794651+24129607/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..ee4854bfbf3c9fa7b307290410c69cb59e5924dc --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_457b87eb09461f794651+24129607/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:032cb1b65501aaae18875d59644fa8d7dc0ef0e7ccdb6a34cf00604c98766f80 +size 90382 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_457b87eb09461f794651+24129607/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_457b87eb09461f794651+24129607/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..1567294c167558f3a78c96d8856155b45142dbaf --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_457b87eb09461f794651+24129607/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0f7f9a4b0511f5fff458088bc15eedbac4e70b22e05674c404dd8372df9f40d +size 359424 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_62abb2454c6da8d57ad5+a02c3a36/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_62abb2454c6da8d57ad5+a02c3a36/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..5726abc7d1d8c52fa95bc7919439a23a23fe3b9a --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_62abb2454c6da8d57ad5+a02c3a36/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_62abb2454c6da8d57ad5+a02c3a36/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_62abb2454c6da8d57ad5+a02c3a36/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_62abb2454c6da8d57ad5+a02c3a36/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_62abb2454c6da8d57ad5+a02c3a36/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..f9aac85f572373187ed5932ede47f59a7a91323f --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_62abb2454c6da8d57ad5+a02c3a36/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0902b9467e36affd529236be99c466bb326eb59e56e6b6414b2bde17d7913ac8 +size 676474 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_62abb2454c6da8d57ad5+a02c3a36/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_62abb2454c6da8d57ad5+a02c3a36/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..790da0ab1f5977b55b6a260e9a4ce50408e21e30 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_62abb2454c6da8d57ad5+a02c3a36/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f875cdc83e9e466901d31a5a2cab15b29d58c59f5dd8325e69bb6dccbbda3f0 +size 543744 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_62abb2454c6da8d57ad5+a02c3a36/wrapped_neff.hlo b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_62abb2454c6da8d57ad5+a02c3a36/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..e82cc85e3749341e817fe8bd66016c138bf3b7a6 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_62abb2454c6da8d57ad5+a02c3a36/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c3d561ca45029346d1af7ef232c45d4624a60a4a45ed8fcf578276f5413e3b4 +size 563380 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_73587bc7122ba5a81758+80d05c3f/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_73587bc7122ba5a81758+80d05c3f/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..3d7d85cd3d975162683053faa369dcc6259604af --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_73587bc7122ba5a81758+80d05c3f/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--enable-saturate-infinity", "--enable-mixed-precision-accumulation", "--model-type", "transformer", "-O1", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2", "--auto-cast=none", "--internal-enable-dge-levels", "vector_dynamic_offsets", "--logfile=/tmp/nxd_model/token_generation/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_73587bc7122ba5a81758+80d05c3f/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_73587bc7122ba5a81758+80d05c3f/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_73587bc7122ba5a81758+80d05c3f/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_73587bc7122ba5a81758+80d05c3f/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..2117dab3e3ed8caad749b8256ab430c591d3b72a --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_73587bc7122ba5a81758+80d05c3f/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec57d9d2f9d9be197ad88a58ece6b14b0ccab97c121b8d20cc9512558ddf6562 +size 70276 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_73587bc7122ba5a81758+80d05c3f/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_73587bc7122ba5a81758+80d05c3f/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..00050102b50b61178e5b107dfa0845eef9d2e62d --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_73587bc7122ba5a81758+80d05c3f/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d03bfcd38bb928f707074efc6d8334f29bad554a85f578ef492fffd998cc449 +size 277504 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_73587bc7122ba5a81758+80d05c3f/wrapped_neff.hlo b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_73587bc7122ba5a81758+80d05c3f/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..5acbe77c7a1af3080007fd9f470f85f98f5532f4 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_73587bc7122ba5a81758+80d05c3f/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c73570dafd81045c71e660922cf27117ae4a9abe994ccbf168245c732561931 +size 289571 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_75329916c4da1120954c+6e4949b4/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_75329916c4da1120954c+6e4949b4/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..2ad69cd01383a682715fed6c7faaf92a72533ca6 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_75329916c4da1120954c+6e4949b4/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--enable-saturate-infinity", "--enable-mixed-precision-accumulation", "--model-type", "transformer", "-O1", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2", "--auto-cast=none", "--internal-enable-dge-levels", "vector_dynamic_offsets", "--logfile=/tmp/nxd_model/context_encoding/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_75329916c4da1120954c+6e4949b4/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_75329916c4da1120954c+6e4949b4/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_75329916c4da1120954c+6e4949b4/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_75329916c4da1120954c+6e4949b4/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..46e89a7399c6f3036064b053dd6e6165f99886ab --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_75329916c4da1120954c+6e4949b4/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6126e0b2e546e6ea64244384b3f3fc8553a6e38d382d288bc90c252603b8574a +size 84807 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_75329916c4da1120954c+6e4949b4/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_75329916c4da1120954c+6e4949b4/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..0a0852c37c0b10d02bb110ae486b811c3ee0704e --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_75329916c4da1120954c+6e4949b4/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd0b72deee8d8cecef0d0a0d4f0a0d75be605dd01327107f58cb3b8505601818 +size 646144 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_7c590ab98f45f8a8dd15+283df001/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_7c590ab98f45f8a8dd15+283df001/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..58fbf6b9366d9e28d7f19321e85acd4cd96c0614 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_7c590ab98f45f8a8dd15+283df001/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--enable-saturate-infinity", "--enable-mixed-precision-accumulation", "--model-type", "transformer", "-O1", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2", "--auto-cast=none", "--internal-enable-dge-levels", "vector_dynamic_offsets", "--internal-hlo2tensorizer-options=--verify-hlo=true", "--logfile=/tmp/nxd_model/context_encoding/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_7c590ab98f45f8a8dd15+283df001/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_7c590ab98f45f8a8dd15+283df001/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_7c590ab98f45f8a8dd15+283df001/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_7c590ab98f45f8a8dd15+283df001/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..db0761a06cea881029c7bd23354b6750900aa774 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_7c590ab98f45f8a8dd15+283df001/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:054c5055b65405714e51c64f753a419433ec87fb494bf2753f8927c2cda60cdc +size 97794 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_7c590ab98f45f8a8dd15+283df001/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_7c590ab98f45f8a8dd15+283df001/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..3ed25c2b05de4c550e7e41c037bcb98240c46060 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_7c590ab98f45f8a8dd15+283df001/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8c9717599d7021b2458d728e241605922aa39c7b088ead7d9f8ab786a689d35 +size 410624 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_8eedc4b0995b3a9b6f52+677eeb9d/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_8eedc4b0995b3a9b6f52+677eeb9d/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..ae7e0c6790082c43cd145aae8cc7e3cc89e15ca8 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_8eedc4b0995b3a9b6f52+677eeb9d/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/speculation_model/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_8eedc4b0995b3a9b6f52+677eeb9d/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_8eedc4b0995b3a9b6f52+677eeb9d/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_8eedc4b0995b3a9b6f52+677eeb9d/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_8eedc4b0995b3a9b6f52+677eeb9d/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..e1d47503a6147d6660f78d4a89f05f4657bfe8b7 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_8eedc4b0995b3a9b6f52+677eeb9d/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7707ed593b1cd987d6610a983e0d581ebae6f51eba46aec434d58c14dd2eec6 +size 415213 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_8eedc4b0995b3a9b6f52+677eeb9d/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_8eedc4b0995b3a9b6f52+677eeb9d/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..5e22af70765864c9cb532fa4e556020cad48d3b5 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_8eedc4b0995b3a9b6f52+677eeb9d/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0afbee815fd022f48138e1c33b6adcd4e9a12da17c3b370770df12fff20f333d +size 3666944 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_944763b36d810f4af582+24129607/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_944763b36d810f4af582+24129607/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..836724f44545ce0dedda1521fd4c623a6ea8ec72 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_944763b36d810f4af582+24129607/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_944763b36d810f4af582+24129607/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_944763b36d810f4af582+24129607/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_944763b36d810f4af582+24129607/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_944763b36d810f4af582+24129607/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..2490c1fe7fef9d747c24ae4daa81eb948a183fc1 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_944763b36d810f4af582+24129607/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba30bac1303e4d846c40c65f8e4d8a644794b6964038372ff73e155714762bdc +size 83504 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_944763b36d810f4af582+24129607/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_944763b36d810f4af582+24129607/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..aa7787229422a521ee88ffab91063a4ff9051db6 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_944763b36d810f4af582+24129607/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d34c0e1077854da0117de707ddcc47a359ca54642890a60a9dc23e35000db3d9 +size 328704 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_b23271513f9095bde4db+2dde74c7/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_b23271513f9095bde4db+2dde74c7/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..a7a40c022faf4beb0fb20246d9c1f9c8f32c6900 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_b23271513f9095bde4db+2dde74c7/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--enable-saturate-infinity", "--enable-mixed-precision-accumulation", "--model-type", "transformer", "-O1", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2", "--auto-cast=none", "--internal-enable-dge-levels", "vector_dynamic_offsets", "--internal-hlo2tensorizer-options=--verify-hlo=true", "--logfile=/tmp/nxd_model/token_generation/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_b23271513f9095bde4db+2dde74c7/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_b23271513f9095bde4db+2dde74c7/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_b23271513f9095bde4db+2dde74c7/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_b23271513f9095bde4db+2dde74c7/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..727fe2caac58854e2f659732c11b6b5473ac4505 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_b23271513f9095bde4db+2dde74c7/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6596d3769509c9146ae4a3975d1c70c2eb236f1527bf8cab5cf9306c4300289f +size 89555 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_b23271513f9095bde4db+2dde74c7/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_b23271513f9095bde4db+2dde74c7/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..4f426ff78d24933fd8e7418496876bfd7f0131a6 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_b23271513f9095bde4db+2dde74c7/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f683c6d672910c5813fea24b4cdef7463c8dcc13c839e420ccd3fb53def6438 +size 369664 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_b23271513f9095bde4db+2dde74c7/wrapped_neff.hlo b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_b23271513f9095bde4db+2dde74c7/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..31907e70305f4abb3642216cbfe6bbb05b6126d0 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_b23271513f9095bde4db+2dde74c7/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5eae6e28efdf471c154f8e069ca68f73d8182aaad545f342d9d4f7521e6959a +size 379362 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_bdf25cde1a48d420319c+a02c3a36/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_bdf25cde1a48d420319c+a02c3a36/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..5726abc7d1d8c52fa95bc7919439a23a23fe3b9a --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_bdf25cde1a48d420319c+a02c3a36/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_bdf25cde1a48d420319c+a02c3a36/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_bdf25cde1a48d420319c+a02c3a36/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_bdf25cde1a48d420319c+a02c3a36/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_bdf25cde1a48d420319c+a02c3a36/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..be8215e4db02a98e7c7d9a9b026367f5b42a91ea --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_bdf25cde1a48d420319c+a02c3a36/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20ed0858162f8fc2c58bc4c23d0925dbeda5897dae0889f87758206676394f4e +size 81843 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_bdf25cde1a48d420319c+a02c3a36/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_bdf25cde1a48d420319c+a02c3a36/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..bd1954dfb9915f0dc20bce50396e451d7f2af36c --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_bdf25cde1a48d420319c+a02c3a36/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc30bd13387891165e0c53839527b8fa393cb3a2e107b87e63b4710591baac38 +size 246784 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_bdf25cde1a48d420319c+a02c3a36/wrapped_neff.hlo b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_bdf25cde1a48d420319c+a02c3a36/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..f9684684f27c1ec2395f7b7923ef9d5e9797439e --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_bdf25cde1a48d420319c+a02c3a36/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a20c64f7bc1c18e70785750a133eb0d75a560c11a0201aa2a8bce49830e0bdf4 +size 255104 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_c6ce9281df2387ad44c8+a02c3a36/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_c6ce9281df2387ad44c8+a02c3a36/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..5726abc7d1d8c52fa95bc7919439a23a23fe3b9a --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_c6ce9281df2387ad44c8+a02c3a36/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_c6ce9281df2387ad44c8+a02c3a36/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_c6ce9281df2387ad44c8+a02c3a36/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_c6ce9281df2387ad44c8+a02c3a36/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_c6ce9281df2387ad44c8+a02c3a36/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..71a45b2e71496cd9a4651b67356cd1c41ba41ef9 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_c6ce9281df2387ad44c8+a02c3a36/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db7ebbb9e2aa4d3c3d4667f098e18faa9ed0a231c9831e73c8118bfad21264ad +size 91147 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_c6ce9281df2387ad44c8+a02c3a36/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_c6ce9281df2387ad44c8+a02c3a36/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..8b619127554153c20689a665fae4e2bc7363fecd --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_c6ce9281df2387ad44c8+a02c3a36/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bda38ac5105c744179690ac05af1193054d38008d20286ed4555985a8267b298 +size 277504 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_c6ce9281df2387ad44c8+a02c3a36/wrapped_neff.hlo b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_c6ce9281df2387ad44c8+a02c3a36/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..39c6f0ed0ac58b309432e0e4c9017f2f57cb1139 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_c6ce9281df2387ad44c8+a02c3a36/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8be8db5635b2c87ad1a9aff1f217c6147916f9d7818d491af7d13512c5755fc +size 289031 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_ccb75cdf21908f3399fe+a02c3a36/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_ccb75cdf21908f3399fe+a02c3a36/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..5726abc7d1d8c52fa95bc7919439a23a23fe3b9a --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_ccb75cdf21908f3399fe+a02c3a36/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_ccb75cdf21908f3399fe+a02c3a36/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_ccb75cdf21908f3399fe+a02c3a36/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_ccb75cdf21908f3399fe+a02c3a36/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_ccb75cdf21908f3399fe+a02c3a36/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..61972ab77477b19dee312608af414e380c48b7e9 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_ccb75cdf21908f3399fe+a02c3a36/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:613e342a683da59642c46d2dc2e949301ad5e16ba24ad1cf98df935a5a3b8b2a +size 380010 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_ccb75cdf21908f3399fe+a02c3a36/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_ccb75cdf21908f3399fe+a02c3a36/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..f9872a41729e0042fcd9ca5f56b6272be39245d8 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_ccb75cdf21908f3399fe+a02c3a36/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1dc13537a29845ae9653e2df3bbdbe13b2c14916c3c4b6dca06898a3f4ed160 +size 1926144 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_ccb75cdf21908f3399fe+a02c3a36/wrapped_neff.hlo b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_ccb75cdf21908f3399fe+a02c3a36/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..e806f4183519f695f48c5dfa442a135f5a693f9a --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_ccb75cdf21908f3399fe+a02c3a36/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e1e789174212b2012815c7365bc0507ac612891375291574eb975850d855f8d +size 2019200 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_ccd99eedd56f698b9cb3+24129607/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_ccd99eedd56f698b9cb3+24129607/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..836724f44545ce0dedda1521fd4c623a6ea8ec72 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_ccd99eedd56f698b9cb3+24129607/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_ccd99eedd56f698b9cb3+24129607/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_ccd99eedd56f698b9cb3+24129607/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_ccd99eedd56f698b9cb3+24129607/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_ccd99eedd56f698b9cb3+24129607/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..c954f65885fbf67996673a116e3777ee791b82dc --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_ccd99eedd56f698b9cb3+24129607/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d167b7fc9794adb3af4bedd335c8d928c11cd023681a9cc51494d42f7eba8fbe +size 392910 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_ccd99eedd56f698b9cb3+24129607/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_ccd99eedd56f698b9cb3+24129607/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..814e9ffc3443b0934ba2a20d001979a970febc0a --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_ccd99eedd56f698b9cb3+24129607/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:609536f634c0448a35378ba532255f25cfa7457c37b6e6fad0eaa61603143937 +size 41626624 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_cde3417e6918fabff4a7+a02c3a36/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_cde3417e6918fabff4a7+a02c3a36/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..5726abc7d1d8c52fa95bc7919439a23a23fe3b9a --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_cde3417e6918fabff4a7+a02c3a36/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_cde3417e6918fabff4a7+a02c3a36/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_cde3417e6918fabff4a7+a02c3a36/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_cde3417e6918fabff4a7+a02c3a36/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_cde3417e6918fabff4a7+a02c3a36/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..3b28dfdd4b213537b2dea5c6bcc967e9c9762156 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_cde3417e6918fabff4a7+a02c3a36/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d61ac2165fde7772e8d3035b0f89b50beec5e0d305548cbacc624eefa9452d3 +size 82753 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_cde3417e6918fabff4a7+a02c3a36/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_cde3417e6918fabff4a7+a02c3a36/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..7ef75b0074fa4ec73095a81a2758a1f5a2e7c0bf --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_cde3417e6918fabff4a7+a02c3a36/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cea17f8986a267e3fa86b63e8c8a3b106afafd0e5478426eb521569c64665576 +size 277504 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_cde3417e6918fabff4a7+a02c3a36/wrapped_neff.hlo b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_cde3417e6918fabff4a7+a02c3a36/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..16cadf15bed8b8d64673c72339abc3c4194888e0 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_cde3417e6918fabff4a7+a02c3a36/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17c67194a4d9db74cf7f5199cb56c0e38b74ec8d65e8dfdd5ebd0aea8b3e739e +size 285854 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_f52fe8e88daf6dc9619a+24129607/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_f52fe8e88daf6dc9619a+24129607/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..836724f44545ce0dedda1521fd4c623a6ea8ec72 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_f52fe8e88daf6dc9619a+24129607/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_f52fe8e88daf6dc9619a+24129607/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_f52fe8e88daf6dc9619a+24129607/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_f52fe8e88daf6dc9619a+24129607/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_f52fe8e88daf6dc9619a+24129607/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..2a4957642a3a55f6c5ddc59adb81100baeaf9d1a --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_f52fe8e88daf6dc9619a+24129607/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6fe1533083be685e04908eaafd5dd3e002ff344b3624f4b42176f7d99ff3d634 +size 694128 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_f52fe8e88daf6dc9619a+24129607/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_f52fe8e88daf6dc9619a+24129607/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..809f033697d5a18c3701ca99bfe27ec5ed1bad6f --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_f52fe8e88daf6dc9619a+24129607/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18e13cd939c298758f20aaf4407e494542df6666b7f2e2818bcd2ea3b787b3cf +size 625664 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_fef9240b8fbfaca895ba+a02c3a36/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_fef9240b8fbfaca895ba+a02c3a36/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..5726abc7d1d8c52fa95bc7919439a23a23fe3b9a --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_fef9240b8fbfaca895ba+a02c3a36/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_fef9240b8fbfaca895ba+a02c3a36/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_fef9240b8fbfaca895ba+a02c3a36/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_fef9240b8fbfaca895ba+a02c3a36/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_fef9240b8fbfaca895ba+a02c3a36/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..64028cc78541c1833466a343e251d2e19d025203 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_fef9240b8fbfaca895ba+a02c3a36/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e70386c0d4c7acaf312dfe4908f119fe46d817ab3d82394d549c5ed84707d551 +size 80382 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_fef9240b8fbfaca895ba+a02c3a36/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_fef9240b8fbfaca895ba+a02c3a36/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..577ea088f274c56a1b2394ab7d36e27fcf8d79ca --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_fef9240b8fbfaca895ba+a02c3a36/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3d927af378381473500e96b89325a170bb270599aced0a24b611864951f8ece +size 216064 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_fef9240b8fbfaca895ba+a02c3a36/wrapped_neff.hlo b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_fef9240b8fbfaca895ba+a02c3a36/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..ab538e3d9aea6f0151927e1e511d70b44ceb1e3b --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_fef9240b8fbfaca895ba+a02c3a36/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f09b0dee89c9253473b3aa6925920c0db08b1a94e9ba7c9d75329c5d81491d0c +size 224412