diff --git a/.gitattributes b/.gitattributes index d290e81c2e493ba288aa5d05b0ee509e6725837b..6671aeee1a4eecb2ab0b9eeff8acfb71b76b2b7f 100644 --- a/.gitattributes +++ b/.gitattributes @@ -15707,3 +15707,171 @@ neuronxcc-2.21.33363.0+82129205/MODULE_abb8078c9a8dfd146600+cc7a6cdd/model.neff neuronxcc-2.21.33363.0+82129205/MODULE_abb8078c9a8dfd146600+cc7a6cdd/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text neuronxcc-2.21.33363.0+82129205/MODULE_fc182b60fb9656608ef0+6695fbd9/model.neff filter=lfs diff=lfs merge=lfs -text neuronxcc-2.21.33363.0+82129205/MODULE_fc182b60fb9656608ef0+6695fbd9/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_0654da519a1110a6aad4+ad9e832d/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_06e58c7a469128c652b5+ad9e832d/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_3cb9043f67e6b5a9acbf+ad9e832d/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_4262eabf33a3b2c61448+617f6939/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_4262eabf33a3b2c61448+617f6939/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_454cbfa5310f70cadd4c+617f6939/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_454cbfa5310f70cadd4c+617f6939/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_4b55e4f26a3acec8be46+617f6939/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_4b55e4f26a3acec8be46+617f6939/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_5122ddbc31f7f615af79+617f6939/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_5122ddbc31f7f615af79+617f6939/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_57d02543ed097317eb38+ad9e832d/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_6df16d281c8d34e7b8c8+ad9e832d/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_7776165b0d0d23f46d32+ad9e832d/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_8926597e9069871b192d+ad9e832d/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_8d519e024abae9bbf305+617f6939/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_8d519e024abae9bbf305+617f6939/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_9a73716a575cb3cb95df+ad9e832d/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_b3fcf757bda6afe1679e+ad9e832d/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_da7e97c0c4b45f3b3821+ad9e832d/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_de35c230ea0abd3360a7+617f6939/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_de35c230ea0abd3360a7+617f6939/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_eacd5f9beef23723ae4a+617f6939/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_eacd5f9beef23723ae4a+617f6939/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_f8b4f545fd646928f740+ad9e832d/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_fede9e304a150a635925+617f6939/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_fede9e304a150a635925+617f6939/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_03563a07b466ff1a7583+24129607/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_0a11d2377319957aa7b1+87e73322/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_0a11d2377319957aa7b1+87e73322/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_0cc2b44bb9cd283b1eeb+5c07cd07/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_0cc2b44bb9cd283b1eeb+5c07cd07/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_0e63a0b6e1742e1fdb32+24129607/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_1351bde3344f209ba8a1+24129607/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_137f98143cdeb07dab7d+a02c3a36/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_137f98143cdeb07dab7d+a02c3a36/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_15024025e6662a62c755+3da4118c/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_15024025e6662a62c755+3da4118c/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_1b7d34902916e968eb1d+af8e51ae/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_1b7d34902916e968eb1d+af8e51ae/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_1d4bedf0c37a53b47737+a02c3a36/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_1d4bedf0c37a53b47737+a02c3a36/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_1de326760d7a62df783b+a02c3a36/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_1de326760d7a62df783b+a02c3a36/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_20ded251b25e18aad5b0+24129607/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_21ce3b68a9e0797a477c+24129607/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_2505e14f043060847cbf+a02c3a36/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_2505e14f043060847cbf+a02c3a36/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_26fe13069f0a9e99f32e+24129607/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_2a2a4bab1649c00a577f+a02c3a36/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_2a2a4bab1649c00a577f+a02c3a36/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_2a8eca8e0378831dfed0+f9f8d9f2/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_2a8eca8e0378831dfed0+f9f8d9f2/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_2be35f469d98437fb988+a02c3a36/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_2be35f469d98437fb988+a02c3a36/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_2facf9e355669579de43+24129607/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_31e31b6f47afb89b553b+bafdbdde/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_31e31b6f47afb89b553b+bafdbdde/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_32a1f486b38c93d2cf79+aefc65cb/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_32a1f486b38c93d2cf79+aefc65cb/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_35a63695aeefa2d44798+24129607/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_415b25e4e1c1a1ab8cc6+a02c3a36/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_415b25e4e1c1a1ab8cc6+a02c3a36/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_4247663625e2eaeb4fab+a02c3a36/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_4247663625e2eaeb4fab+a02c3a36/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_437a9e154e0cc794398f+0da03933/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_437a9e154e0cc794398f+0da03933/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_49b427a31f505e15551a+ec51c92c/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_49b427a31f505e15551a+ec51c92c/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_5321c1b69979af5581ee+a02c3a36/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_5321c1b69979af5581ee+a02c3a36/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_54dce09f6a5327de2511+fe16c4be/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_54dce09f6a5327de2511+fe16c4be/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_628b6d34444473fad038+a02c3a36/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_628b6d34444473fad038+a02c3a36/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_68b856b391a016dcfb36+94f624bf/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_68b856b391a016dcfb36+94f624bf/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_69ce67073ba646143ed4+24129607/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_6b045be69220451cd35c+a02c3a36/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_6b045be69220451cd35c+a02c3a36/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_6cc68373d81858239a08+24129607/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_6dd858f775c0a9002ded+8f459db2/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_6dd858f775c0a9002ded+8f459db2/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_73021bd2bcd85d0ae281+bafdbdde/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_73021bd2bcd85d0ae281+bafdbdde/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_77f1b8fbe51833738f1c+24129607/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_7ac33c003364730bb8e0+e4ea82eb/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_7ac33c003364730bb8e0+e4ea82eb/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_7b28cd1e3dc6bc844fa3+24129607/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_7c2638502a7538102290+a02c3a36/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_7c2638502a7538102290+a02c3a36/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_7d7829b80b30c6a8366e+82a94d75/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_7d7829b80b30c6a8366e+82a94d75/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_7f4b070326c197aa68db+a02c3a36/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_7f4b070326c197aa68db+a02c3a36/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_8040971574bb1f40a771+eb6614ba/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_8040971574bb1f40a771+eb6614ba/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_818bc30ba0942fe4c3d6+24129607/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_82cabaf7b1369e971e5c+5e080832/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_82cabaf7b1369e971e5c+5e080832/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_862f4269950d182a7b0b+bceffd01/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_862f4269950d182a7b0b+bceffd01/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_8976186fc1a14a570398+24129607/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_8e3aecb3518895a4ebd0+a02c3a36/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_8e3aecb3518895a4ebd0+a02c3a36/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_8f63e2da128b2efd447e+a02c3a36/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_8f63e2da128b2efd447e+a02c3a36/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_9312fb1868a91c85e16a+24129607/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_96198b429c7161961ae8+a02c3a36/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_96198b429c7161961ae8+a02c3a36/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_97d05358399518e4efee+a02c3a36/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_97d05358399518e4efee+a02c3a36/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_9a0754abf83f7bc78b7d+098c44e3/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_9a0754abf83f7bc78b7d+098c44e3/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_9b81a779cf3ae3a12644+149cbfff/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_9b81a779cf3ae3a12644+149cbfff/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_9f3d72fade252307a3fc+a02c3a36/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_9f3d72fade252307a3fc+a02c3a36/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_a0467b8b82934a24d142+a02c3a36/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_a0467b8b82934a24d142+a02c3a36/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_aa3ef3e7a5cba473337f+1dee5e5e/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_aa3ef3e7a5cba473337f+1dee5e5e/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_ab1b160b3d8fa09ed76e+a02c3a36/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_ab1b160b3d8fa09ed76e+a02c3a36/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_ad7c8ac474ec4bdeae52+24129607/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_adf2c812522e586cea39+24129607/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_b0d91b1607c7df83fc7f+a02c3a36/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_b0d91b1607c7df83fc7f+a02c3a36/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_b1cd3aa0106a6921386d+a02c3a36/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_b1cd3aa0106a6921386d+a02c3a36/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_bb3cafc9659e6ad373c7+24129607/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_bc57576bbc26e14097b8+24129607/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_bdefd4948bd161bfec05+24129607/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_c47d987826f446f9955b+a02c3a36/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_c47d987826f446f9955b+a02c3a36/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_c9952f69ef9cfc495903+a02c3a36/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_c9952f69ef9cfc495903+a02c3a36/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_cbda8a59038c9c5ffc17+a02c3a36/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_cbda8a59038c9c5ffc17+a02c3a36/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_ccc2d4abbb67d5b7286f+a02c3a36/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_ccc2d4abbb67d5b7286f+a02c3a36/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_ce1ed82235621875fbad+eef3363a/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_ce1ed82235621875fbad+eef3363a/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_ce8e893faf0f99f6c70b+f0422fe3/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_ce8e893faf0f99f6c70b+f0422fe3/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_d053e5a2bdf45f8b64ef+a02c3a36/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_d053e5a2bdf45f8b64ef+a02c3a36/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_d1b92df9d7d3f05023d5+6df9a02b/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_d1b92df9d7d3f05023d5+6df9a02b/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_d557da6777202c62f6c1+a02c3a36/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_d557da6777202c62f6c1+a02c3a36/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_d5ee7d5ab32cdaaa0ee0+677eeb9d/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_d97f2a797158f5574518+24129607/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_dc7fcef2e19ad392688a+24129607/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_de64a5eb66d5e73e20ff+ee6b6593/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_de64a5eb66d5e73e20ff+ee6b6593/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_e5486eb6f3f1a553b5f8+ecd1b333/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_e5486eb6f3f1a553b5f8+ecd1b333/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_e54f2eec2036cfaa2527+a02c3a36/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_e54f2eec2036cfaa2527+a02c3a36/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_eadbca4e425481d07426+24129607/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_ebda959e0a7e1b1b3d41+24129607/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_ed0ddf13430a2a717168+24129607/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_f03f06a24a40a8dbe7e1+24129607/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_fcaa5220788f46dccc4f+a02c3a36/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_fcaa5220788f46dccc4f+a02c3a36/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_fd44e24d672157f0bc14+a02c3a36/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_fd44e24d672157f0bc14+a02c3a36/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_0654da519a1110a6aad4+ad9e832d/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_0654da519a1110a6aad4+ad9e832d/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..0a2078b3647f01aa3165babe7ccfb751b4575e61 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_0654da519a1110a6aad4+ad9e832d/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "--lnc=1", "-O1", "--internal-hlo2tensorizer-options= --modular-flow-mac-threshold=10 --verify-hlo=true", "--logfile=/tmp/nxd_model/context_encoding_model/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_0654da519a1110a6aad4+ad9e832d/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_0654da519a1110a6aad4+ad9e832d/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_0654da519a1110a6aad4+ad9e832d/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_0654da519a1110a6aad4+ad9e832d/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..033a3c160aea38ed1ce2c6ecd425e82dabc56f35 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_0654da519a1110a6aad4+ad9e832d/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17c096a64f827fc570914bd877c33bb2b6d4b1afd2313a82e249d70da338f146 +size 936785 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_0654da519a1110a6aad4+ad9e832d/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_0654da519a1110a6aad4+ad9e832d/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..93cea20c893eac7f1037814357d28e3ec70664e9 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_0654da519a1110a6aad4+ad9e832d/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c15732a812350a3a27aeace7738a30c6027911be1dc5e6a5d896ff890d7c00e +size 11561984 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_06e58c7a469128c652b5+ad9e832d/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_06e58c7a469128c652b5+ad9e832d/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..0a2078b3647f01aa3165babe7ccfb751b4575e61 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_06e58c7a469128c652b5+ad9e832d/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "--lnc=1", "-O1", "--internal-hlo2tensorizer-options= --modular-flow-mac-threshold=10 --verify-hlo=true", "--logfile=/tmp/nxd_model/context_encoding_model/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_06e58c7a469128c652b5+ad9e832d/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_06e58c7a469128c652b5+ad9e832d/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_06e58c7a469128c652b5+ad9e832d/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_06e58c7a469128c652b5+ad9e832d/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..e0943ef035bd1d2e138715ba528f22ca245971aa --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_06e58c7a469128c652b5+ad9e832d/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05c5f09f68c1912103423eeb9d56a58404f0c6fdddbe1816e7c33073e659a2cb +size 726384 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_06e58c7a469128c652b5+ad9e832d/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_06e58c7a469128c652b5+ad9e832d/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..a183e9e0ca626c678a9fac19b2d5d39716d679c0 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_06e58c7a469128c652b5+ad9e832d/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d68ad0966b1e9e7ea97f6212f6275741342159f8b013adca888b4ed2564a7a4c +size 492544 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_3cb9043f67e6b5a9acbf+ad9e832d/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_3cb9043f67e6b5a9acbf+ad9e832d/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..0a2078b3647f01aa3165babe7ccfb751b4575e61 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_3cb9043f67e6b5a9acbf+ad9e832d/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "--lnc=1", "-O1", "--internal-hlo2tensorizer-options= --modular-flow-mac-threshold=10 --verify-hlo=true", "--logfile=/tmp/nxd_model/context_encoding_model/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_3cb9043f67e6b5a9acbf+ad9e832d/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_3cb9043f67e6b5a9acbf+ad9e832d/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_3cb9043f67e6b5a9acbf+ad9e832d/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_3cb9043f67e6b5a9acbf+ad9e832d/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..32b013409a941cf46d07cce124a70f5da656ea3e --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_3cb9043f67e6b5a9acbf+ad9e832d/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb5bd8e78159ccce3eae8b4e36beb1bc30d66f673c8c4d01b80e818f0e5483cf +size 678558 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_3cb9043f67e6b5a9acbf+ad9e832d/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_3cb9043f67e6b5a9acbf+ad9e832d/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..773bc27d5766de4c0d694a9bd50bc0b890d634c4 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_3cb9043f67e6b5a9acbf+ad9e832d/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93a4c486f03a6855de565b9571babfa47a4f214c4242a94445cc972c72dfedf5 +size 1659904 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_4262eabf33a3b2c61448+617f6939/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_4262eabf33a3b2c61448+617f6939/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..107cebd2dc9223d7d557c2256bdd494131263beb --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_4262eabf33a3b2c61448+617f6939/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=1 --vectorize-strided-dma ", "--lnc=1", "-O2", "--internal-hlo2tensorizer-options=--verify-hlo=true", "--logfile=/tmp/nxd_model/token_generation_model/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_4262eabf33a3b2c61448+617f6939/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_4262eabf33a3b2c61448+617f6939/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_4262eabf33a3b2c61448+617f6939/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_4262eabf33a3b2c61448+617f6939/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..49baea80168635c616246ed36cd39939c16fd63f --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_4262eabf33a3b2c61448+617f6939/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76aa5bdd9171b91554e3461102196b55b4a8f7453a965cdc9e9c89b9746deda7 +size 747576 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_4262eabf33a3b2c61448+617f6939/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_4262eabf33a3b2c61448+617f6939/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..096af15f33e0b0ef8ed4ff4b14ed7590f5967289 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_4262eabf33a3b2c61448+617f6939/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:405817d784b623c7bc20cb7ce54f7d65ed8a737226de9755f081bf73b10c95e0 +size 3113984 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_4262eabf33a3b2c61448+617f6939/wrapped_neff.hlo b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_4262eabf33a3b2c61448+617f6939/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..2b912a0167fbe7142343127b8299dfa951c8d350 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_4262eabf33a3b2c61448+617f6939/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95fb219447af7158351ee48861dbcfbffd673c4fb243778edef7c658333a80f0 +size 3299472 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_454cbfa5310f70cadd4c+617f6939/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_454cbfa5310f70cadd4c+617f6939/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..107cebd2dc9223d7d557c2256bdd494131263beb --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_454cbfa5310f70cadd4c+617f6939/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=1 --vectorize-strided-dma ", "--lnc=1", "-O2", "--internal-hlo2tensorizer-options=--verify-hlo=true", "--logfile=/tmp/nxd_model/token_generation_model/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_454cbfa5310f70cadd4c+617f6939/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_454cbfa5310f70cadd4c+617f6939/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_454cbfa5310f70cadd4c+617f6939/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_454cbfa5310f70cadd4c+617f6939/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..85de4563a8a26b1586e5f1bc560873a827ce0d5e --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_454cbfa5310f70cadd4c+617f6939/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eaac8a0d1057bbcaaf5fc3dc85fa7699af59ddc07c1c26435640d6112acceff2 +size 378947 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_454cbfa5310f70cadd4c+617f6939/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_454cbfa5310f70cadd4c+617f6939/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..eadb87407b46ba1a83fd4d4f6ac8d1b7bc8aa8a7 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_454cbfa5310f70cadd4c+617f6939/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f24564b3a426253a6c9a58a73a9dedf7df1bb3c4ae4f9c3029d426f107c9c7b4 +size 1926144 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_454cbfa5310f70cadd4c+617f6939/wrapped_neff.hlo b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_454cbfa5310f70cadd4c+617f6939/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..c9dfbc44d8ca8feac4fbca9301a4228500fce41f --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_454cbfa5310f70cadd4c+617f6939/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7485e701ed5c6302ee1967ad86e7d57db68d08f66dca5344c6ee9783377ef51 +size 2000256 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_4b55e4f26a3acec8be46+617f6939/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_4b55e4f26a3acec8be46+617f6939/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..107cebd2dc9223d7d557c2256bdd494131263beb --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_4b55e4f26a3acec8be46+617f6939/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=1 --vectorize-strided-dma ", "--lnc=1", "-O2", "--internal-hlo2tensorizer-options=--verify-hlo=true", "--logfile=/tmp/nxd_model/token_generation_model/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_4b55e4f26a3acec8be46+617f6939/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_4b55e4f26a3acec8be46+617f6939/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_4b55e4f26a3acec8be46+617f6939/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_4b55e4f26a3acec8be46+617f6939/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..6ffd5c27ec279bad5c57820a34203f50291ca6af --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_4b55e4f26a3acec8be46+617f6939/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c69e83428c93f3412168937e1df467dd69d10ef46e9576f1fcb96de906e1a86 +size 382812 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_4b55e4f26a3acec8be46+617f6939/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_4b55e4f26a3acec8be46+617f6939/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..76346e1992e6c459e78824649d4ed94ff63e13de --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_4b55e4f26a3acec8be46+617f6939/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76209c24a04f98926f0cfe3fb63de3d27ef082dcdb30d4fec9ee2de7c5f18d37 +size 3032064 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_4b55e4f26a3acec8be46+617f6939/wrapped_neff.hlo b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_4b55e4f26a3acec8be46+617f6939/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..69a404e3399cec1a7f6a2b2e0f9c53b58a4a07d0 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_4b55e4f26a3acec8be46+617f6939/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca1eb5edafa963dab3105d66b6044e615664da9c73f0a1a998f7ea8ae9ba07b7 +size 3106169 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_5122ddbc31f7f615af79+617f6939/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_5122ddbc31f7f615af79+617f6939/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..107cebd2dc9223d7d557c2256bdd494131263beb --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_5122ddbc31f7f615af79+617f6939/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=1 --vectorize-strided-dma ", "--lnc=1", "-O2", "--internal-hlo2tensorizer-options=--verify-hlo=true", "--logfile=/tmp/nxd_model/token_generation_model/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_5122ddbc31f7f615af79+617f6939/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_5122ddbc31f7f615af79+617f6939/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_5122ddbc31f7f615af79+617f6939/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_5122ddbc31f7f615af79+617f6939/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..2be4392d71eb255773052f55d30aca80803ae9da --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_5122ddbc31f7f615af79+617f6939/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d430b5a352b7fbee3742c299062adfd10f1232b12cd924c52e979764a23e3f8 +size 382348 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_5122ddbc31f7f615af79+617f6939/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_5122ddbc31f7f615af79+617f6939/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..50a21cbd45dec18d38125d1b40efd8cd10bfbe4a --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_5122ddbc31f7f615af79+617f6939/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e24de20088f1002f739a76dff410698f254aab56f4dbdd8cdd5e85d2770eaa7c +size 2049024 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_5122ddbc31f7f615af79+617f6939/wrapped_neff.hlo b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_5122ddbc31f7f615af79+617f6939/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..a2cf63bca4e60ff783a6ff491ffe6c8204584691 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_5122ddbc31f7f615af79+617f6939/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f5ca74126a5794dacf54743b1bbfd785f5eb4f45e34cb5f0280e864eeb78a0a +size 2123112 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_57d02543ed097317eb38+ad9e832d/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_57d02543ed097317eb38+ad9e832d/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..0a2078b3647f01aa3165babe7ccfb751b4575e61 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_57d02543ed097317eb38+ad9e832d/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "--lnc=1", "-O1", "--internal-hlo2tensorizer-options= --modular-flow-mac-threshold=10 --verify-hlo=true", "--logfile=/tmp/nxd_model/context_encoding_model/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_57d02543ed097317eb38+ad9e832d/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_57d02543ed097317eb38+ad9e832d/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_57d02543ed097317eb38+ad9e832d/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_57d02543ed097317eb38+ad9e832d/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..98a0eb078e834bbea63f34d77c4177812f2646e7 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_57d02543ed097317eb38+ad9e832d/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7889bc62e8dcef2a8de07ab0712acd532c2d6f207defd057f42dc19a58a0dc7 +size 983272 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_57d02543ed097317eb38+ad9e832d/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_57d02543ed097317eb38+ad9e832d/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..992b8d984d843e77980e78f52221080d1ca4d2db --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_57d02543ed097317eb38+ad9e832d/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fee37fa3f3fd8eb8db0f8f866970dfdccc1d45a71c42a03a5da62f6ff16ea6a2 +size 11981824 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_6df16d281c8d34e7b8c8+ad9e832d/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_6df16d281c8d34e7b8c8+ad9e832d/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..0a2078b3647f01aa3165babe7ccfb751b4575e61 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_6df16d281c8d34e7b8c8+ad9e832d/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "--lnc=1", "-O1", "--internal-hlo2tensorizer-options= --modular-flow-mac-threshold=10 --verify-hlo=true", "--logfile=/tmp/nxd_model/context_encoding_model/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_6df16d281c8d34e7b8c8+ad9e832d/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_6df16d281c8d34e7b8c8+ad9e832d/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_6df16d281c8d34e7b8c8+ad9e832d/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_6df16d281c8d34e7b8c8+ad9e832d/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..3dcca1bf5f9cbc646524144e057427d5291670e3 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_6df16d281c8d34e7b8c8+ad9e832d/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97fb1218b3b85f5e1750c92b0b95e18b2f0fff0dbe607f1c8307ff625175c782 +size 598800 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_6df16d281c8d34e7b8c8+ad9e832d/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_6df16d281c8d34e7b8c8+ad9e832d/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..44f3f4a748c62a36e424976ed93569601e89bf39 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_6df16d281c8d34e7b8c8+ad9e832d/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:789d0cd4da08ab7421274e55250c231edd04c5dab1294fedc165ce26e13ef622 +size 297984 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_7081ad26fb8bc6748c94+ad9e832d/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_7081ad26fb8bc6748c94+ad9e832d/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..0a2078b3647f01aa3165babe7ccfb751b4575e61 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_7081ad26fb8bc6748c94+ad9e832d/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "--lnc=1", "-O1", "--internal-hlo2tensorizer-options= --modular-flow-mac-threshold=10 --verify-hlo=true", "--logfile=/tmp/nxd_model/context_encoding_model/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_7081ad26fb8bc6748c94+ad9e832d/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_7081ad26fb8bc6748c94+ad9e832d/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..a9b8170860dbfac96824d84279b7aab38beb982c --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_7081ad26fb8bc6748c94+ad9e832d/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e488a3bbddf55f2468ac5482fad6f32a0393da0f909dd6cc75613aafcc5268d6 +size 933493 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_7081ad26fb8bc6748c94+ad9e832d/model.log b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_7081ad26fb8bc6748c94+ad9e832d/model.log new file mode 100644 index 0000000000000000000000000000000000000000..f3562fc98970c1d54e6df8d4490bb5b19a8792a7 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_7081ad26fb8bc6748c94+ad9e832d/model.log @@ -0,0 +1 @@ +Failed compilation with ['neuronx-cc', 'compile', '--framework=XLA', '/tmp/nxd_model/context_encoding_model/_tp0_bk0/model.MODULE_7081ad26fb8bc6748c94+ad9e832d.hlo_module.pb', '--output', '/tmp/nxd_model/context_encoding_model/_tp0_bk0/model.MODULE_7081ad26fb8bc6748c94+ad9e832d.neff', '--target=trn1', '--auto-cast=none', '--model-type=transformer', '--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ', '--lnc=1', '-O1', '--internal-hlo2tensorizer-options= --modular-flow-mac-threshold=10 --verify-hlo=true', '--logfile=/tmp/nxd_model/context_encoding_model/_tp0_bk0/log-neuron-cc.txt', '--verbose=35']: \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_7776165b0d0d23f46d32+ad9e832d/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_7776165b0d0d23f46d32+ad9e832d/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..0a2078b3647f01aa3165babe7ccfb751b4575e61 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_7776165b0d0d23f46d32+ad9e832d/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "--lnc=1", "-O1", "--internal-hlo2tensorizer-options= --modular-flow-mac-threshold=10 --verify-hlo=true", "--logfile=/tmp/nxd_model/context_encoding_model/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_7776165b0d0d23f46d32+ad9e832d/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_7776165b0d0d23f46d32+ad9e832d/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_7776165b0d0d23f46d32+ad9e832d/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_7776165b0d0d23f46d32+ad9e832d/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..a0a394984ab83eaab4946ea0f58d3875c167f7e3 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_7776165b0d0d23f46d32+ad9e832d/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e7683c211dc0af38826ebf6230b77d074a161cee9ec7cb1479cbed80886141d +size 879322 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_7776165b0d0d23f46d32+ad9e832d/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_7776165b0d0d23f46d32+ad9e832d/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..c73f711019ed832f56b83317f517d5d887ff85d7 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_7776165b0d0d23f46d32+ad9e832d/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:359e60c0c6954b4b1e41353841731e1af857fcdfae77175beede8434fa5b0b4f +size 11664384 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_8926597e9069871b192d+ad9e832d/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_8926597e9069871b192d+ad9e832d/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..0a2078b3647f01aa3165babe7ccfb751b4575e61 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_8926597e9069871b192d+ad9e832d/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "--lnc=1", "-O1", "--internal-hlo2tensorizer-options= --modular-flow-mac-threshold=10 --verify-hlo=true", "--logfile=/tmp/nxd_model/context_encoding_model/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_8926597e9069871b192d+ad9e832d/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_8926597e9069871b192d+ad9e832d/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_8926597e9069871b192d+ad9e832d/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_8926597e9069871b192d+ad9e832d/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..563dbd41e22b2d8421294f7d016cf1ae0dcdf7ae --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_8926597e9069871b192d+ad9e832d/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e997c4e79e96cbcb32a125f0d039e049ef9db52977baa2ba2ff1c61cc44f8728 +size 472299 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_8926597e9069871b192d+ad9e832d/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_8926597e9069871b192d+ad9e832d/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..b2095c9af54431f7d4f654d7ddfc9c86cfbf034d --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_8926597e9069871b192d+ad9e832d/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f6f412e048ddcb9a23fa9f92216ff3eeeb3eeeb78a0c4c5aada3c1962097b44 +size 8203264 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_8d519e024abae9bbf305+617f6939/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_8d519e024abae9bbf305+617f6939/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..107cebd2dc9223d7d557c2256bdd494131263beb --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_8d519e024abae9bbf305+617f6939/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=1 --vectorize-strided-dma ", "--lnc=1", "-O2", "--internal-hlo2tensorizer-options=--verify-hlo=true", "--logfile=/tmp/nxd_model/token_generation_model/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_8d519e024abae9bbf305+617f6939/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_8d519e024abae9bbf305+617f6939/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_8d519e024abae9bbf305+617f6939/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_8d519e024abae9bbf305+617f6939/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..0b8c33e2e7c1d1b9330847cb73628d679127be33 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_8d519e024abae9bbf305+617f6939/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5071a7599bf37c6e189b6187158a0179ccca7462c9dffd2a1c7bd8018789229d +size 764473 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_8d519e024abae9bbf305+617f6939/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_8d519e024abae9bbf305+617f6939/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..7990b30da2e371c4d37b0c5be7928172d6d53c8b --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_8d519e024abae9bbf305+617f6939/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:314b069eebb2613c82e93cdce1a0e1e98cc3f8b83d87c475b1be547e9b715902 +size 8397824 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_8d519e024abae9bbf305+617f6939/wrapped_neff.hlo b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_8d519e024abae9bbf305+617f6939/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..d4485069ba89101c40bf15ec54f58ae495bf7bde --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_8d519e024abae9bbf305+617f6939/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc685dbef59db678dce409552323ab8686c2f8181be35c3a56d908b079d65c6b +size 8583322 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_9a73716a575cb3cb95df+ad9e832d/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_9a73716a575cb3cb95df+ad9e832d/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..0a2078b3647f01aa3165babe7ccfb751b4575e61 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_9a73716a575cb3cb95df+ad9e832d/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "--lnc=1", "-O1", "--internal-hlo2tensorizer-options= --modular-flow-mac-threshold=10 --verify-hlo=true", "--logfile=/tmp/nxd_model/context_encoding_model/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_9a73716a575cb3cb95df+ad9e832d/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_9a73716a575cb3cb95df+ad9e832d/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_9a73716a575cb3cb95df+ad9e832d/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_9a73716a575cb3cb95df+ad9e832d/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..1e0f3a0c35f1f9afe8e66526c13abe2371e65fdb --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_9a73716a575cb3cb95df+ad9e832d/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a62f6d9bc9df3e2de19505d67e63c54515ab460fea5371f2c82e9e8d3c67322b +size 467299 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_9a73716a575cb3cb95df+ad9e832d/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_9a73716a575cb3cb95df+ad9e832d/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..3087ede30df6c7904780408e81c352cddd41179d --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_9a73716a575cb3cb95df+ad9e832d/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b4934ab602c98cf48c3c0047ec8bdd1706da17f5f5e7e9542e04045911cfeb3 +size 4363264 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_b3fcf757bda6afe1679e+ad9e832d/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_b3fcf757bda6afe1679e+ad9e832d/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..0a2078b3647f01aa3165babe7ccfb751b4575e61 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_b3fcf757bda6afe1679e+ad9e832d/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "--lnc=1", "-O1", "--internal-hlo2tensorizer-options= --modular-flow-mac-threshold=10 --verify-hlo=true", "--logfile=/tmp/nxd_model/context_encoding_model/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_b3fcf757bda6afe1679e+ad9e832d/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_b3fcf757bda6afe1679e+ad9e832d/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_b3fcf757bda6afe1679e+ad9e832d/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_b3fcf757bda6afe1679e+ad9e832d/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..3d35a5b7f9d6c9e9d2b2166ccd7c67a322118cc8 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_b3fcf757bda6afe1679e+ad9e832d/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb0b4a58bc33a450116485bdc97c80db38b76b6cf227f1a396467a16f8a24120 +size 463666 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_b3fcf757bda6afe1679e+ad9e832d/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_b3fcf757bda6afe1679e+ad9e832d/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..021bc3b27b57510caa6aeaa257373abe8ebe838b --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_b3fcf757bda6afe1679e+ad9e832d/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed1635305f59594bb96729057bfbd84fefd31db1795f3e1248314ef8e7b6e273 +size 3953664 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_da7e97c0c4b45f3b3821+ad9e832d/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_da7e97c0c4b45f3b3821+ad9e832d/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..0a2078b3647f01aa3165babe7ccfb751b4575e61 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_da7e97c0c4b45f3b3821+ad9e832d/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "--lnc=1", "-O1", "--internal-hlo2tensorizer-options= --modular-flow-mac-threshold=10 --verify-hlo=true", "--logfile=/tmp/nxd_model/context_encoding_model/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_da7e97c0c4b45f3b3821+ad9e832d/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_da7e97c0c4b45f3b3821+ad9e832d/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_da7e97c0c4b45f3b3821+ad9e832d/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_da7e97c0c4b45f3b3821+ad9e832d/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..a50971fc5aca4d68e0e14f3369929a6bc58ea002 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_da7e97c0c4b45f3b3821+ad9e832d/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67a1aedb62ddf41c80dc68cc5012e85a308184096cc91161a0b8c3722ed7e519 +size 667112 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_da7e97c0c4b45f3b3821+ad9e832d/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_da7e97c0c4b45f3b3821+ad9e832d/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..013c20fb441e4bffe04047c54deac8280cac2356 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_da7e97c0c4b45f3b3821+ad9e832d/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c8b0200b2ad3b8eab8b71726ba5c3f59f83e8e5fb23c82e56699848db128fce +size 451584 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_de35c230ea0abd3360a7+617f6939/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_de35c230ea0abd3360a7+617f6939/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..107cebd2dc9223d7d557c2256bdd494131263beb --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_de35c230ea0abd3360a7+617f6939/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=1 --vectorize-strided-dma ", "--lnc=1", "-O2", "--internal-hlo2tensorizer-options=--verify-hlo=true", "--logfile=/tmp/nxd_model/token_generation_model/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_de35c230ea0abd3360a7+617f6939/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_de35c230ea0abd3360a7+617f6939/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_de35c230ea0abd3360a7+617f6939/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_de35c230ea0abd3360a7+617f6939/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..791cfcd0632b9c313c830562f527ebd73e00604f --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_de35c230ea0abd3360a7+617f6939/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:005f593253160ac83985c31e41ad06d4e8ef8abb217eabd8f83f8616b96d0fcc +size 623022 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_de35c230ea0abd3360a7+617f6939/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_de35c230ea0abd3360a7+617f6939/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..630d9f9446e62f3ccef908478dce73153464bfc2 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_de35c230ea0abd3360a7+617f6939/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c9ddd19d822c930094daf4f23fe71ba2ef0752147d8d2f02c968f84b64b932a +size 1537024 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_de35c230ea0abd3360a7+617f6939/wrapped_neff.hlo b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_de35c230ea0abd3360a7+617f6939/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..003284dff45a8c830fab2e5a925545d4d69e417e --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_de35c230ea0abd3360a7+617f6939/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:777da8f3b00fbf3c274133ae4405c17c52d5d2942b92d8423bc02639d1b597f5 +size 1720482 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_eacd5f9beef23723ae4a+617f6939/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_eacd5f9beef23723ae4a+617f6939/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..107cebd2dc9223d7d557c2256bdd494131263beb --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_eacd5f9beef23723ae4a+617f6939/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=1 --vectorize-strided-dma ", "--lnc=1", "-O2", "--internal-hlo2tensorizer-options=--verify-hlo=true", "--logfile=/tmp/nxd_model/token_generation_model/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_eacd5f9beef23723ae4a+617f6939/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_eacd5f9beef23723ae4a+617f6939/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_eacd5f9beef23723ae4a+617f6939/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_eacd5f9beef23723ae4a+617f6939/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..92935257f68c4868ee22289df0b02b9bc9184bf8 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_eacd5f9beef23723ae4a+617f6939/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b6e644ce4a647575cac6ee8a2b724e7eeddce2a15d81873dcb06658ee9b43c2 +size 374121 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_eacd5f9beef23723ae4a+617f6939/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_eacd5f9beef23723ae4a+617f6939/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..1a4b0d304f46d736f7b099bd7182b9663b23389e --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_eacd5f9beef23723ae4a+617f6939/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27888041c8321fa7821e9e2462fa24906b92a55403e477ad4270efcf29f80abf +size 1117184 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_eacd5f9beef23723ae4a+617f6939/wrapped_neff.hlo b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_eacd5f9beef23723ae4a+617f6939/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..f1be8b54518143719e0c3eb60828b4ac84901da1 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_eacd5f9beef23723ae4a+617f6939/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79f4497b6c14d756912c64bdf11a914fbeeea99ea086717893013947ddb15959 +size 1209802 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_f8b4f545fd646928f740+ad9e832d/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_f8b4f545fd646928f740+ad9e832d/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..0a2078b3647f01aa3165babe7ccfb751b4575e61 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_f8b4f545fd646928f740+ad9e832d/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "--lnc=1", "-O1", "--internal-hlo2tensorizer-options= --modular-flow-mac-threshold=10 --verify-hlo=true", "--logfile=/tmp/nxd_model/context_encoding_model/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_f8b4f545fd646928f740+ad9e832d/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_f8b4f545fd646928f740+ad9e832d/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_f8b4f545fd646928f740+ad9e832d/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_f8b4f545fd646928f740+ad9e832d/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..d043f2b3418e69ff03a62fd1d19a89b9ab1b52e6 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_f8b4f545fd646928f740+ad9e832d/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a4ab156514485dbf5d74db2535e84136a07f17752c578320af5984844defbff +size 468446 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_f8b4f545fd646928f740+ad9e832d/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_f8b4f545fd646928f740+ad9e832d/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..3a5516c40c36be97003df94e78b1c693d72651a1 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_f8b4f545fd646928f740+ad9e832d/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa6791c3341dd45d1cdf2724e98350fb7b1b08c8198db84fcd650b33c04117b0 +size 22252544 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_fede9e304a150a635925+617f6939/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_fede9e304a150a635925+617f6939/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..107cebd2dc9223d7d557c2256bdd494131263beb --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_fede9e304a150a635925+617f6939/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=1 --vectorize-strided-dma ", "--lnc=1", "-O2", "--internal-hlo2tensorizer-options=--verify-hlo=true", "--logfile=/tmp/nxd_model/token_generation_model/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_fede9e304a150a635925+617f6939/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_fede9e304a150a635925+617f6939/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_fede9e304a150a635925+617f6939/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_fede9e304a150a635925+617f6939/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..f6d50735d68bf785de4fd88218365ab2d919aaed --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_fede9e304a150a635925+617f6939/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7707b4ae5ae2b0aafdac9c76d4726c1969cbe176743da0ce7d7ad494ae57b7f +size 743609 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_fede9e304a150a635925+617f6939/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_fede9e304a150a635925+617f6939/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..8e21a64fecfb0790a14e390e0d88988684ddd8c2 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_fede9e304a150a635925+617f6939/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1816edc19a32a1152161f05f69ee58a6289d6a4bef3c10b547245abd13e8333 +size 2970624 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_fede9e304a150a635925+617f6939/wrapped_neff.hlo b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_fede9e304a150a635925+617f6939/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..e6b4f2b453b4ec4002802ae7ed464099ba3ac948 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_fede9e304a150a635925+617f6939/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41cca0b61d997d19bcb4eb7bf9d5d2b64b1e0ed7c572644b2097d98b1b2c918b +size 3155208 diff --git a/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev2/llama/meta-llama/Llama-3.1-8B-Instruct/3f2788536ce52a84f6c0.json b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev2/llama/meta-llama/Llama-3.1-8B-Instruct/3f2788536ce52a84f6c0.json new file mode 100644 index 0000000000000000000000000000000000000000..9ee756b0da4477bf7e484e42424a21ce6d33e981 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev2/llama/meta-llama/Llama-3.1-8B-Instruct/3f2788536ce52a84f6c0.json @@ -0,0 +1,62 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "meta-llama/Llama-3.1-8B-Instruct", + "_task": "text-generation", + "architectures": [ + "LlamaForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "dtype": "bfloat16", + "head_dim": 128, + "hidden_act": "silu", + "hidden_size": 4096, + "initializer_range": 0.02, + "intermediate_size": 14336, + "max_position_embeddings": 131072, + "mlp_bias": false, + "model_type": "llama", + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "batch_size": 1, + "capacity_factor": null, + "checkpoint_id": "meta-llama/Llama-3.1-8B-Instruct", + "checkpoint_revision": "0e9e39f249a16976918f6564b8830bc894c89659", + "continuous_batching": false, + "ep_degree": 1, + "fused_qkv": true, + "glu_mlp": true, + "local_ranks_size": 8, + "max_batch_size": 1, + "max_context_length": 16384, + "max_topk": 256, + "n_active_tokens": 16384, + "neuronxcc_version": "2.21.33363.0+82129205", + "on_device_sampling": true, + "optimum_neuron_version": "0.4.3.dev2", + "output_logits": false, + "pp_degree": 1, + "sequence_length": 16384, + "speculation_length": 0, + "start_rank_id": 0, + "target": "trn1", + "torch_dtype": "bfloat16", + "tp_degree": 8 + }, + "num_attention_heads": 32, + "num_hidden_layers": 32, + "num_key_value_heads": 8, + "pretraining_tp": 1, + "rms_norm_eps": 1e-05, + "rope_scaling": { + "factor": 8.0, + "high_freq_factor": 4.0, + "low_freq_factor": 1.0, + "original_max_position_embeddings": 8192, + "rope_type": "llama3" + }, + "rope_theta": 500000.0, + "tie_word_embeddings": false, + "use_cache": true, + "vocab_size": 128256 +} \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/granite/hf-internal-testing/tiny-random-GraniteForCausalLM/822b61c3a021502bf290.json b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/granite/hf-internal-testing/tiny-random-GraniteForCausalLM/822b61c3a021502bf290.json new file mode 100644 index 0000000000000000000000000000000000000000..953b4852a148dbf9c10eca4aeb1d5038a06e96a3 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/granite/hf-internal-testing/tiny-random-GraniteForCausalLM/822b61c3a021502bf290.json @@ -0,0 +1,59 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "hf-internal-testing/tiny-random-GraniteForCausalLM", + "_task": "text-generation", + "architectures": [ + "GraniteForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "attention_multiplier": 1.0, + "dtype": "float32", + "embedding_multiplier": 1.0, + "hidden_act": "silu", + "hidden_size": 32, + "initializer_range": 0.02, + "intermediate_size": 64, + "logits_scaling": 1.0, + "max_position_embeddings": 2048, + "mlp_bias": false, + "model_type": "granite", + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "batch_size": 1, + "capacity_factor": null, + "checkpoint_id": "hf-internal-testing/tiny-random-GraniteForCausalLM", + "checkpoint_revision": "c3074ebc0ac2fe545305f5e5f6cce2cc9b2aa0c5", + "continuous_batching": false, + "ep_degree": 1, + "fused_qkv": true, + "glu_mlp": true, + "local_ranks_size": 2, + "max_batch_size": 1, + "max_context_length": 1024, + "max_topk": 256, + "n_active_tokens": 1024, + "neuronxcc_version": "2.21.33363.0+82129205", + "on_device_sampling": true, + "optimum_neuron_version": "0.4.3.dev3", + "output_logits": false, + "pp_degree": 1, + "sequence_length": 1024, + "sequence_parallel_enabled": false, + "speculation_length": 0, + "start_rank_id": 0, + "target": "trn1", + "torch_dtype": "float32", + "tp_degree": 2 + }, + "num_attention_heads": 4, + "num_hidden_layers": 2, + "num_key_value_heads": 4, + "residual_multiplier": 1.0, + "rms_norm_eps": 1e-06, + "rope_scaling": null, + "rope_theta": 10000.0, + "tie_word_embeddings": false, + "use_cache": true, + "vocab_size": 49152 +} \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/granite/ibm-granite/granite-3.1-2b-instruct/063d011f2046f1d6b411.json b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/granite/ibm-granite/granite-3.1-2b-instruct/063d011f2046f1d6b411.json new file mode 100644 index 0000000000000000000000000000000000000000..c91f637b45bdc3cd8b8a58af1ee5456613ec82b0 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/granite/ibm-granite/granite-3.1-2b-instruct/063d011f2046f1d6b411.json @@ -0,0 +1,58 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "ibm-granite/granite-3.1-2b-instruct", + "_task": "text-generation", + "architectures": [ + "GraniteForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.1, + "attention_multiplier": 0.015625, + "dtype": "bfloat16", + "embedding_multiplier": 12.0, + "hidden_act": "silu", + "hidden_size": 2048, + "initializer_range": 0.02, + "intermediate_size": 8192, + "logits_scaling": 8.0, + "max_position_embeddings": 131072, + "mlp_bias": false, + "model_type": "granite", + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "batch_size": 4, + "capacity_factor": null, + "checkpoint_id": "ibm-granite/granite-3.1-2b-instruct", + "checkpoint_revision": "bbc2aed595bd38bd770263dc3ab831db9794441d", + "continuous_batching": true, + "ep_degree": 1, + "fused_qkv": true, + "glu_mlp": true, + "local_ranks_size": 2, + "max_batch_size": 4, + "max_context_length": 4096, + "max_topk": 256, + "n_active_tokens": 4096, + "neuronxcc_version": "2.21.33363.0+82129205", + "on_device_sampling": true, + "optimum_neuron_version": "0.4.3.dev3", + "output_logits": false, + "pp_degree": 1, + "sequence_length": 4096, + "speculation_length": 0, + "start_rank_id": 0, + "target": "trn1", + "torch_dtype": "bfloat16", + "tp_degree": 2 + }, + "num_attention_heads": 32, + "num_hidden_layers": 40, + "num_key_value_heads": 8, + "residual_multiplier": 0.22, + "rms_norm_eps": 1e-05, + "rope_scaling": null, + "rope_theta": 5000000.0, + "tie_word_embeddings": true, + "use_cache": true, + "vocab_size": 49155 +} \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/granite/ibm-granite/granite-3.1-2b-instruct/dd07030f54079f7dc586.json b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/granite/ibm-granite/granite-3.1-2b-instruct/dd07030f54079f7dc586.json new file mode 100644 index 0000000000000000000000000000000000000000..d0b4453a3a705b7c62c3dfdcff64413a3229921c --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/granite/ibm-granite/granite-3.1-2b-instruct/dd07030f54079f7dc586.json @@ -0,0 +1,59 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "ibm-granite/granite-3.1-2b-instruct", + "_task": "text-generation", + "architectures": [ + "GraniteForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.1, + "attention_multiplier": 0.015625, + "dtype": "bfloat16", + "embedding_multiplier": 12.0, + "hidden_act": "silu", + "hidden_size": 2048, + "initializer_range": 0.02, + "intermediate_size": 8192, + "logits_scaling": 8.0, + "max_position_embeddings": 131072, + "mlp_bias": false, + "model_type": "granite", + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "batch_size": 4, + "capacity_factor": null, + "checkpoint_id": "ibm-granite/granite-3.1-2b-instruct", + "checkpoint_revision": "bbc2aed595bd38bd770263dc3ab831db9794441d", + "continuous_batching": true, + "ep_degree": 1, + "fused_qkv": true, + "glu_mlp": true, + "local_ranks_size": 2, + "max_batch_size": 4, + "max_context_length": 4096, + "max_topk": 256, + "n_active_tokens": 4096, + "neuronxcc_version": "2.21.33363.0+82129205", + "on_device_sampling": true, + "optimum_neuron_version": "0.4.3.dev3", + "output_logits": false, + "pp_degree": 1, + "sequence_length": 4096, + "sequence_parallel_enabled": false, + "speculation_length": 0, + "start_rank_id": 0, + "target": "trn1", + "torch_dtype": "bfloat16", + "tp_degree": 2 + }, + "num_attention_heads": 32, + "num_hidden_layers": 40, + "num_key_value_heads": 8, + "residual_multiplier": 0.22, + "rms_norm_eps": 1e-05, + "rope_scaling": null, + "rope_theta": 5000000.0, + "tie_word_embeddings": true, + "use_cache": true, + "vocab_size": 49155 +} \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/llama/llamafactory/tiny-random-Llama-3/9587f75fe03d32199424.json b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/llama/llamafactory/tiny-random-Llama-3/9587f75fe03d32199424.json new file mode 100644 index 0000000000000000000000000000000000000000..5c414e0515e4652370454d3942e3ee7b2bc1a2d8 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/llama/llamafactory/tiny-random-Llama-3/9587f75fe03d32199424.json @@ -0,0 +1,63 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "llamafactory/tiny-random-Llama-3", + "_task": "text-generation", + "architectures": [ + "LlamaForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "dtype": "float16", + "head_dim": 4, + "hidden_act": "silu", + "hidden_size": 16, + "initializer_range": 0.02, + "intermediate_size": 64, + "max_position_embeddings": 131072, + "mlp_bias": false, + "model_type": "llama", + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "batch_size": 1, + "capacity_factor": null, + "checkpoint_id": "llamafactory/tiny-random-Llama-3", + "checkpoint_revision": "bf2a2e3bf199ad2ee96f02a3c00246c608db22a8", + "continuous_batching": false, + "ep_degree": 1, + "fused_qkv": true, + "glu_mlp": true, + "local_ranks_size": 2, + "max_batch_size": 1, + "max_context_length": 1024, + "max_topk": 256, + "n_active_tokens": 1024, + "neuronxcc_version": "2.21.33363.0+82129205", + "on_device_sampling": true, + "optimum_neuron_version": "0.4.3.dev3", + "output_logits": false, + "pp_degree": 1, + "sequence_length": 1024, + "sequence_parallel_enabled": false, + "speculation_length": 0, + "start_rank_id": 0, + "target": "trn1", + "torch_dtype": "float16", + "tp_degree": 2 + }, + "num_attention_heads": 4, + "num_hidden_layers": 2, + "num_key_value_heads": 4, + "pretraining_tp": 1, + "rms_norm_eps": 1e-05, + "rope_scaling": { + "factor": 8.0, + "high_freq_factor": 4.0, + "low_freq_factor": 1.0, + "original_max_position_embeddings": 8192, + "rope_type": "llama3" + }, + "rope_theta": 500000.0, + "tie_word_embeddings": false, + "use_cache": true, + "vocab_size": 128256 +} \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/llama/meta-llama/Llama-3.1-8B-Instruct/0451dd4ad8e23b64aa0c.json b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/llama/meta-llama/Llama-3.1-8B-Instruct/0451dd4ad8e23b64aa0c.json new file mode 100644 index 0000000000000000000000000000000000000000..57b0c8ef0e89dfcf24119b497faf000c71083e49 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/llama/meta-llama/Llama-3.1-8B-Instruct/0451dd4ad8e23b64aa0c.json @@ -0,0 +1,63 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "meta-llama/Llama-3.1-8B-Instruct", + "_task": "text-generation", + "architectures": [ + "LlamaForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "dtype": "bfloat16", + "head_dim": 128, + "hidden_act": "silu", + "hidden_size": 4096, + "initializer_range": 0.02, + "intermediate_size": 14336, + "max_position_embeddings": 131072, + "mlp_bias": false, + "model_type": "llama", + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "batch_size": 1, + "capacity_factor": null, + "checkpoint_id": "meta-llama/Llama-3.1-8B-Instruct", + "checkpoint_revision": "0e9e39f249a16976918f6564b8830bc894c89659", + "continuous_batching": false, + "ep_degree": 1, + "fused_qkv": true, + "glu_mlp": true, + "local_ranks_size": 2, + "max_batch_size": 1, + "max_context_length": 4096, + "max_topk": 256, + "n_active_tokens": 4096, + "neuronxcc_version": "2.21.33363.0+82129205", + "on_device_sampling": true, + "optimum_neuron_version": "0.4.3.dev3", + "output_logits": false, + "pp_degree": 1, + "sequence_length": 4096, + "sequence_parallel_enabled": true, + "speculation_length": 0, + "start_rank_id": 0, + "target": "trn1", + "torch_dtype": "bfloat16", + "tp_degree": 2 + }, + "num_attention_heads": 32, + "num_hidden_layers": 32, + "num_key_value_heads": 8, + "pretraining_tp": 1, + "rms_norm_eps": 1e-05, + "rope_scaling": { + "factor": 8.0, + "high_freq_factor": 4.0, + "low_freq_factor": 1.0, + "original_max_position_embeddings": 8192, + "rope_type": "llama3" + }, + "rope_theta": 500000.0, + "tie_word_embeddings": false, + "use_cache": true, + "vocab_size": 128256 +} \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/llama/meta-llama/Llama-3.1-8B-Instruct/837dd017e8ae4530668c.json b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/llama/meta-llama/Llama-3.1-8B-Instruct/837dd017e8ae4530668c.json new file mode 100644 index 0000000000000000000000000000000000000000..eacd6923727a653d98d2647649dea9eca38f4d13 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/llama/meta-llama/Llama-3.1-8B-Instruct/837dd017e8ae4530668c.json @@ -0,0 +1,63 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "meta-llama/Llama-3.1-8B-Instruct", + "_task": "text-generation", + "architectures": [ + "LlamaForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "dtype": "bfloat16", + "head_dim": 128, + "hidden_act": "silu", + "hidden_size": 4096, + "initializer_range": 0.02, + "intermediate_size": 14336, + "max_position_embeddings": 131072, + "mlp_bias": false, + "model_type": "llama", + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "batch_size": 1, + "capacity_factor": null, + "checkpoint_id": "meta-llama/Llama-3.1-8B-Instruct", + "checkpoint_revision": "0e9e39f249a16976918f6564b8830bc894c89659", + "continuous_batching": false, + "ep_degree": 1, + "fused_qkv": true, + "glu_mlp": true, + "local_ranks_size": 8, + "max_batch_size": 1, + "max_context_length": 16384, + "max_topk": 256, + "n_active_tokens": 16384, + "neuronxcc_version": "2.21.33363.0+82129205", + "on_device_sampling": false, + "optimum_neuron_version": "0.4.3.dev3", + "output_logits": false, + "pp_degree": 1, + "sequence_length": 16384, + "sequence_parallel_enabled": false, + "speculation_length": 0, + "start_rank_id": 0, + "target": "trn1", + "torch_dtype": "bfloat16", + "tp_degree": 8 + }, + "num_attention_heads": 32, + "num_hidden_layers": 32, + "num_key_value_heads": 8, + "pretraining_tp": 1, + "rms_norm_eps": 1e-05, + "rope_scaling": { + "factor": 8.0, + "high_freq_factor": 4.0, + "low_freq_factor": 1.0, + "original_max_position_embeddings": 8192, + "rope_type": "llama3" + }, + "rope_theta": 500000.0, + "tie_word_embeddings": false, + "use_cache": true, + "vocab_size": 128256 +} \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/llama/meta-llama/Llama-3.1-8B-Instruct/a36d353642d325c5397f.json b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/llama/meta-llama/Llama-3.1-8B-Instruct/a36d353642d325c5397f.json new file mode 100644 index 0000000000000000000000000000000000000000..b6cb5c9878246185d850718290292e714c23ff33 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/llama/meta-llama/Llama-3.1-8B-Instruct/a36d353642d325c5397f.json @@ -0,0 +1,63 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "meta-llama/Llama-3.1-8B-Instruct", + "_task": "text-generation", + "architectures": [ + "LlamaForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "dtype": "bfloat16", + "head_dim": 128, + "hidden_act": "silu", + "hidden_size": 4096, + "initializer_range": 0.02, + "intermediate_size": 14336, + "max_position_embeddings": 131072, + "mlp_bias": false, + "model_type": "llama", + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "batch_size": 1, + "capacity_factor": null, + "checkpoint_id": "meta-llama/Llama-3.1-8B-Instruct", + "checkpoint_revision": "0e9e39f249a16976918f6564b8830bc894c89659", + "continuous_batching": false, + "ep_degree": 1, + "fused_qkv": true, + "glu_mlp": true, + "local_ranks_size": 8, + "max_batch_size": 1, + "max_context_length": 16384, + "max_topk": 256, + "n_active_tokens": 16384, + "neuronxcc_version": "2.21.33363.0+82129205", + "on_device_sampling": false, + "optimum_neuron_version": "0.4.3.dev3", + "output_logits": false, + "pp_degree": 1, + "sequence_length": 16384, + "sequence_parallel_enabled": true, + "speculation_length": 0, + "start_rank_id": 0, + "target": "trn1", + "torch_dtype": "bfloat16", + "tp_degree": 8 + }, + "num_attention_heads": 32, + "num_hidden_layers": 32, + "num_key_value_heads": 8, + "pretraining_tp": 1, + "rms_norm_eps": 1e-05, + "rope_scaling": { + "factor": 8.0, + "high_freq_factor": 4.0, + "low_freq_factor": 1.0, + "original_max_position_embeddings": 8192, + "rope_type": "llama3" + }, + "rope_theta": 500000.0, + "tie_word_embeddings": false, + "use_cache": true, + "vocab_size": 128256 +} \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/llama/meta-llama/Llama-3.1-8B-Instruct/cfdcd4c75495aba1f95d.json b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/llama/meta-llama/Llama-3.1-8B-Instruct/cfdcd4c75495aba1f95d.json new file mode 100644 index 0000000000000000000000000000000000000000..0be835ccb4574668bdcbad446e495e4ff967e8d9 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/llama/meta-llama/Llama-3.1-8B-Instruct/cfdcd4c75495aba1f95d.json @@ -0,0 +1,63 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "meta-llama/Llama-3.1-8B-Instruct", + "_task": "text-generation", + "architectures": [ + "LlamaForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "dtype": "bfloat16", + "head_dim": 128, + "hidden_act": "silu", + "hidden_size": 4096, + "initializer_range": 0.02, + "intermediate_size": 14336, + "max_position_embeddings": 131072, + "mlp_bias": false, + "model_type": "llama", + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "batch_size": 1, + "capacity_factor": null, + "checkpoint_id": "meta-llama/Llama-3.1-8B-Instruct", + "checkpoint_revision": "0e9e39f249a16976918f6564b8830bc894c89659", + "continuous_batching": false, + "ep_degree": 1, + "fused_qkv": true, + "glu_mlp": true, + "local_ranks_size": 2, + "max_batch_size": 1, + "max_context_length": 4096, + "max_topk": 256, + "n_active_tokens": 4096, + "neuronxcc_version": "2.21.33363.0+82129205", + "on_device_sampling": false, + "optimum_neuron_version": "0.4.3.dev3", + "output_logits": false, + "pp_degree": 1, + "sequence_length": 4096, + "sequence_parallel_enabled": true, + "speculation_length": 0, + "start_rank_id": 0, + "target": "trn1", + "torch_dtype": "bfloat16", + "tp_degree": 2 + }, + "num_attention_heads": 32, + "num_hidden_layers": 32, + "num_key_value_heads": 8, + "pretraining_tp": 1, + "rms_norm_eps": 1e-05, + "rope_scaling": { + "factor": 8.0, + "high_freq_factor": 4.0, + "low_freq_factor": 1.0, + "original_max_position_embeddings": 8192, + "rope_type": "llama3" + }, + "rope_theta": 500000.0, + "tie_word_embeddings": false, + "use_cache": true, + "vocab_size": 128256 +} \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/llama/unsloth/Llama-3.2-1B-Instruct/0fef0800e360b8e2aa85.json b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/llama/unsloth/Llama-3.2-1B-Instruct/0fef0800e360b8e2aa85.json new file mode 100644 index 0000000000000000000000000000000000000000..1176d2993637727e30b887f0d66cad7e9c14d8d6 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/llama/unsloth/Llama-3.2-1B-Instruct/0fef0800e360b8e2aa85.json @@ -0,0 +1,64 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "unsloth/Llama-3.2-1B-Instruct", + "_task": "text-generation", + "architectures": [ + "LlamaForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "dtype": "bfloat16", + "head_dim": 64, + "hidden_act": "silu", + "hidden_size": 2048, + "initializer_range": 0.02, + "intermediate_size": 8192, + "max_position_embeddings": 131072, + "mlp_bias": false, + "model_type": "llama", + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "batch_size": 1, + "capacity_factor": null, + "checkpoint_id": "unsloth/Llama-3.2-1B-Instruct", + "checkpoint_revision": "5a8abab4a5d6f164389b1079fb721cfab8d7126c", + "continuous_batching": false, + "ep_degree": 1, + "fused_qkv": true, + "glu_mlp": true, + "local_ranks_size": 2, + "max_batch_size": 1, + "max_context_length": 16384, + "max_topk": 256, + "n_active_tokens": 16384, + "neuronxcc_version": "2.21.33363.0+82129205", + "on_device_sampling": false, + "optimum_neuron_version": "0.4.3.dev3", + "output_logits": false, + "pp_degree": 1, + "sequence_length": 16384, + "sequence_parallel_enabled": true, + "speculation_length": 0, + "start_rank_id": 0, + "target": "trn1", + "torch_dtype": "bfloat16", + "tp_degree": 2 + }, + "num_attention_heads": 32, + "num_hidden_layers": 16, + "num_key_value_heads": 8, + "pretraining_tp": 1, + "rms_norm_eps": 1e-05, + "rope_scaling": { + "factor": 32.0, + "high_freq_factor": 4.0, + "low_freq_factor": 1.0, + "original_max_position_embeddings": 8192, + "rope_type": "llama3" + }, + "rope_theta": 500000.0, + "tie_word_embeddings": true, + "unsloth_fixed": true, + "use_cache": true, + "vocab_size": 128256 +} \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/llama/unsloth/Llama-3.2-1B-Instruct/2b6b32ab110a36e51b85.json b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/llama/unsloth/Llama-3.2-1B-Instruct/2b6b32ab110a36e51b85.json new file mode 100644 index 0000000000000000000000000000000000000000..adb047ad6ab16f2b640eb5437e4a239f15131d55 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/llama/unsloth/Llama-3.2-1B-Instruct/2b6b32ab110a36e51b85.json @@ -0,0 +1,64 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "unsloth/Llama-3.2-1B-Instruct", + "_task": "text-generation", + "architectures": [ + "LlamaForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "dtype": "bfloat16", + "head_dim": 64, + "hidden_act": "silu", + "hidden_size": 2048, + "initializer_range": 0.02, + "intermediate_size": 8192, + "max_position_embeddings": 131072, + "mlp_bias": false, + "model_type": "llama", + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "batch_size": 4, + "capacity_factor": null, + "checkpoint_id": "unsloth/Llama-3.2-1B-Instruct", + "checkpoint_revision": "5a8abab4a5d6f164389b1079fb721cfab8d7126c", + "continuous_batching": true, + "ep_degree": 1, + "fused_qkv": true, + "glu_mlp": true, + "local_ranks_size": 2, + "max_batch_size": 4, + "max_context_length": 4096, + "max_topk": 256, + "n_active_tokens": 4096, + "neuronxcc_version": "2.21.33363.0+82129205", + "on_device_sampling": true, + "optimum_neuron_version": "0.4.3.dev3", + "output_logits": false, + "pp_degree": 1, + "sequence_length": 4096, + "sequence_parallel_enabled": true, + "speculation_length": 0, + "start_rank_id": 0, + "target": "trn1", + "torch_dtype": "bfloat16", + "tp_degree": 2 + }, + "num_attention_heads": 32, + "num_hidden_layers": 16, + "num_key_value_heads": 8, + "pretraining_tp": 1, + "rms_norm_eps": 1e-05, + "rope_scaling": { + "factor": 32.0, + "high_freq_factor": 4.0, + "low_freq_factor": 1.0, + "original_max_position_embeddings": 8192, + "rope_type": "llama3" + }, + "rope_theta": 500000.0, + "tie_word_embeddings": true, + "unsloth_fixed": true, + "use_cache": true, + "vocab_size": 128256 +} \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/llama/unsloth/Llama-3.2-1B-Instruct/80315139ffb2eb77db25.json b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/llama/unsloth/Llama-3.2-1B-Instruct/80315139ffb2eb77db25.json new file mode 100644 index 0000000000000000000000000000000000000000..54731d14ef8f780b8a6b77e5036cc8937bb0de8d --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/llama/unsloth/Llama-3.2-1B-Instruct/80315139ffb2eb77db25.json @@ -0,0 +1,64 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "unsloth/Llama-3.2-1B-Instruct", + "_task": "text-generation", + "architectures": [ + "LlamaForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "dtype": "bfloat16", + "head_dim": 64, + "hidden_act": "silu", + "hidden_size": 2048, + "initializer_range": 0.02, + "intermediate_size": 8192, + "max_position_embeddings": 131072, + "mlp_bias": false, + "model_type": "llama", + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "batch_size": 1, + "capacity_factor": null, + "checkpoint_id": "unsloth/Llama-3.2-1B-Instruct", + "checkpoint_revision": null, + "continuous_batching": false, + "ep_degree": 1, + "fused_qkv": false, + "glu_mlp": true, + "local_ranks_size": 2, + "max_batch_size": 1, + "max_context_length": 4096, + "max_topk": 256, + "n_active_tokens": 4096, + "neuronxcc_version": "2.21.33363.0+82129205", + "on_device_sampling": false, + "optimum_neuron_version": "0.4.3.dev3", + "output_logits": false, + "pp_degree": 1, + "sequence_length": 4096, + "sequence_parallel_enabled": false, + "speculation_length": 5, + "start_rank_id": 0, + "target": "trn1", + "torch_dtype": "bfloat16", + "tp_degree": 2 + }, + "num_attention_heads": 32, + "num_hidden_layers": 16, + "num_key_value_heads": 8, + "pretraining_tp": 1, + "rms_norm_eps": 1e-05, + "rope_scaling": { + "factor": 32.0, + "high_freq_factor": 4.0, + "low_freq_factor": 1.0, + "original_max_position_embeddings": 8192, + "rope_type": "llama3" + }, + "rope_theta": 500000.0, + "tie_word_embeddings": true, + "unsloth_fixed": true, + "use_cache": true, + "vocab_size": 128256 +} \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/llama/unsloth/Llama-3.2-1B-Instruct/94df3810f4ff25f21be1.json b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/llama/unsloth/Llama-3.2-1B-Instruct/94df3810f4ff25f21be1.json new file mode 100644 index 0000000000000000000000000000000000000000..2cae3a27f52268a52e85dc611f3cd7de9eb6a3cf --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/llama/unsloth/Llama-3.2-1B-Instruct/94df3810f4ff25f21be1.json @@ -0,0 +1,64 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "unsloth/Llama-3.2-1B-Instruct", + "_task": "text-generation", + "architectures": [ + "LlamaForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "dtype": "bfloat16", + "head_dim": 64, + "hidden_act": "silu", + "hidden_size": 2048, + "initializer_range": 0.02, + "intermediate_size": 8192, + "max_position_embeddings": 131072, + "mlp_bias": false, + "model_type": "llama", + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "batch_size": 4, + "capacity_factor": null, + "checkpoint_id": "unsloth/Llama-3.2-1B-Instruct", + "checkpoint_revision": "5a8abab4a5d6f164389b1079fb721cfab8d7126c", + "continuous_batching": true, + "ep_degree": 1, + "fused_qkv": true, + "glu_mlp": true, + "local_ranks_size": 2, + "max_batch_size": 4, + "max_context_length": 4096, + "max_topk": 256, + "n_active_tokens": 4096, + "neuronxcc_version": "2.21.33363.0+82129205", + "on_device_sampling": true, + "optimum_neuron_version": "0.4.3.dev3", + "output_logits": false, + "pp_degree": 1, + "sequence_length": 4096, + "sequence_parallel_enabled": false, + "speculation_length": 0, + "start_rank_id": 0, + "target": "trn1", + "torch_dtype": "bfloat16", + "tp_degree": 2 + }, + "num_attention_heads": 32, + "num_hidden_layers": 16, + "num_key_value_heads": 8, + "pretraining_tp": 1, + "rms_norm_eps": 1e-05, + "rope_scaling": { + "factor": 32.0, + "high_freq_factor": 4.0, + "low_freq_factor": 1.0, + "original_max_position_embeddings": 8192, + "rope_type": "llama3" + }, + "rope_theta": 500000.0, + "tie_word_embeddings": true, + "unsloth_fixed": true, + "use_cache": true, + "vocab_size": 128256 +} \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/llama/unsloth/Llama-3.2-1B-Instruct/98b3fa9a890ef0e1f391.json b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/llama/unsloth/Llama-3.2-1B-Instruct/98b3fa9a890ef0e1f391.json new file mode 100644 index 0000000000000000000000000000000000000000..7e96121ea85f2a51c8013ab3a71f96a7eb38d9d2 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/llama/unsloth/Llama-3.2-1B-Instruct/98b3fa9a890ef0e1f391.json @@ -0,0 +1,64 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "unsloth/Llama-3.2-1B-Instruct", + "_task": "text-generation", + "architectures": [ + "LlamaForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "dtype": "bfloat16", + "head_dim": 64, + "hidden_act": "silu", + "hidden_size": 2048, + "initializer_range": 0.02, + "intermediate_size": 8192, + "max_position_embeddings": 131072, + "mlp_bias": false, + "model_type": "llama", + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "batch_size": 1, + "capacity_factor": null, + "checkpoint_id": "unsloth/Llama-3.2-1B-Instruct", + "checkpoint_revision": "5a8abab4a5d6f164389b1079fb721cfab8d7126c", + "continuous_batching": false, + "ep_degree": 1, + "fused_qkv": true, + "glu_mlp": true, + "local_ranks_size": 2, + "max_batch_size": 1, + "max_context_length": 4096, + "max_topk": 256, + "n_active_tokens": 4096, + "neuronxcc_version": "2.21.33363.0+82129205", + "on_device_sampling": true, + "optimum_neuron_version": "0.4.3.dev3", + "output_logits": false, + "pp_degree": 1, + "sequence_length": 4096, + "sequence_parallel_enabled": false, + "speculation_length": 0, + "start_rank_id": 0, + "target": "trn1", + "torch_dtype": "bfloat16", + "tp_degree": 2 + }, + "num_attention_heads": 32, + "num_hidden_layers": 16, + "num_key_value_heads": 8, + "pretraining_tp": 1, + "rms_norm_eps": 1e-05, + "rope_scaling": { + "factor": 32.0, + "high_freq_factor": 4.0, + "low_freq_factor": 1.0, + "original_max_position_embeddings": 8192, + "rope_type": "llama3" + }, + "rope_theta": 500000.0, + "tie_word_embeddings": true, + "unsloth_fixed": true, + "use_cache": true, + "vocab_size": 128256 +} \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/llama/unsloth/Llama-3.2-1B-Instruct/a6f67c366d986ef4b636.json b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/llama/unsloth/Llama-3.2-1B-Instruct/a6f67c366d986ef4b636.json new file mode 100644 index 0000000000000000000000000000000000000000..b0c6f88746d3fa626bf974d2ae730cd1a72c8e0b --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/llama/unsloth/Llama-3.2-1B-Instruct/a6f67c366d986ef4b636.json @@ -0,0 +1,64 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "unsloth/Llama-3.2-1B-Instruct", + "_task": "text-generation", + "architectures": [ + "LlamaForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "dtype": "bfloat16", + "head_dim": 64, + "hidden_act": "silu", + "hidden_size": 2048, + "initializer_range": 0.02, + "intermediate_size": 8192, + "max_position_embeddings": 131072, + "mlp_bias": false, + "model_type": "llama", + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "batch_size": 1, + "capacity_factor": null, + "checkpoint_id": "unsloth/Llama-3.2-1B-Instruct", + "checkpoint_revision": "5a8abab4a5d6f164389b1079fb721cfab8d7126c", + "continuous_batching": false, + "ep_degree": 1, + "fused_qkv": true, + "glu_mlp": true, + "local_ranks_size": 2, + "max_batch_size": 1, + "max_context_length": 16384, + "max_topk": 256, + "n_active_tokens": 16384, + "neuronxcc_version": "2.21.33363.0+82129205", + "on_device_sampling": false, + "optimum_neuron_version": "0.4.3.dev3", + "output_logits": false, + "pp_degree": 1, + "sequence_length": 16384, + "sequence_parallel_enabled": false, + "speculation_length": 0, + "start_rank_id": 0, + "target": "trn1", + "torch_dtype": "bfloat16", + "tp_degree": 2 + }, + "num_attention_heads": 32, + "num_hidden_layers": 16, + "num_key_value_heads": 8, + "pretraining_tp": 1, + "rms_norm_eps": 1e-05, + "rope_scaling": { + "factor": 32.0, + "high_freq_factor": 4.0, + "low_freq_factor": 1.0, + "original_max_position_embeddings": 8192, + "rope_type": "llama3" + }, + "rope_theta": 500000.0, + "tie_word_embeddings": true, + "unsloth_fixed": true, + "use_cache": true, + "vocab_size": 128256 +} \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/llama/unsloth/Llama-3.2-1B-Instruct/c87e429d1d13a13279bd.json b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/llama/unsloth/Llama-3.2-1B-Instruct/c87e429d1d13a13279bd.json new file mode 100644 index 0000000000000000000000000000000000000000..2aa821b22dab835c81f1b78ebb8532c9f9e7ea86 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/llama/unsloth/Llama-3.2-1B-Instruct/c87e429d1d13a13279bd.json @@ -0,0 +1,64 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "unsloth/Llama-3.2-1B-Instruct", + "_task": "text-generation", + "architectures": [ + "LlamaForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "dtype": "bfloat16", + "head_dim": 64, + "hidden_act": "silu", + "hidden_size": 2048, + "initializer_range": 0.02, + "intermediate_size": 8192, + "max_position_embeddings": 131072, + "mlp_bias": false, + "model_type": "llama", + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "batch_size": 1, + "capacity_factor": null, + "checkpoint_id": "unsloth/Llama-3.2-1B-Instruct", + "checkpoint_revision": "5a8abab4a5d6f164389b1079fb721cfab8d7126c", + "continuous_batching": false, + "ep_degree": 1, + "fused_qkv": true, + "glu_mlp": true, + "local_ranks_size": 2, + "max_batch_size": 1, + "max_context_length": 4096, + "max_topk": 256, + "n_active_tokens": 4096, + "neuronxcc_version": "2.21.33363.0+82129205", + "on_device_sampling": false, + "optimum_neuron_version": "0.4.3.dev3", + "output_logits": false, + "pp_degree": 1, + "sequence_length": 4096, + "sequence_parallel_enabled": true, + "speculation_length": 0, + "start_rank_id": 0, + "target": "trn1", + "torch_dtype": "bfloat16", + "tp_degree": 2 + }, + "num_attention_heads": 32, + "num_hidden_layers": 16, + "num_key_value_heads": 8, + "pretraining_tp": 1, + "rms_norm_eps": 1e-05, + "rope_scaling": { + "factor": 32.0, + "high_freq_factor": 4.0, + "low_freq_factor": 1.0, + "original_max_position_embeddings": 8192, + "rope_type": "llama3" + }, + "rope_theta": 500000.0, + "tie_word_embeddings": true, + "unsloth_fixed": true, + "use_cache": true, + "vocab_size": 128256 +} \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/llama/unsloth/Llama-3.2-1B-Instruct/cfe0f6333cc973602102.json b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/llama/unsloth/Llama-3.2-1B-Instruct/cfe0f6333cc973602102.json new file mode 100644 index 0000000000000000000000000000000000000000..0f3c9e78e9674d89f6387f5aec6ecfbc8a933449 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/llama/unsloth/Llama-3.2-1B-Instruct/cfe0f6333cc973602102.json @@ -0,0 +1,64 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "unsloth/Llama-3.2-1B-Instruct", + "_task": "text-generation", + "architectures": [ + "LlamaForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "dtype": "bfloat16", + "head_dim": 64, + "hidden_act": "silu", + "hidden_size": 2048, + "initializer_range": 0.02, + "intermediate_size": 8192, + "max_position_embeddings": 131072, + "mlp_bias": false, + "model_type": "llama", + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "batch_size": 1, + "capacity_factor": null, + "checkpoint_id": "unsloth/Llama-3.2-1B-Instruct", + "checkpoint_revision": "5a8abab4a5d6f164389b1079fb721cfab8d7126c", + "continuous_batching": false, + "ep_degree": 1, + "fused_qkv": true, + "glu_mlp": true, + "local_ranks_size": 2, + "max_batch_size": 1, + "max_context_length": 4096, + "max_topk": 256, + "n_active_tokens": 4096, + "neuronxcc_version": "2.21.33363.0+82129205", + "on_device_sampling": false, + "optimum_neuron_version": "0.4.3.dev3", + "output_logits": false, + "pp_degree": 1, + "sequence_length": 4096, + "sequence_parallel_enabled": false, + "speculation_length": 0, + "start_rank_id": 0, + "target": "trn1", + "torch_dtype": "bfloat16", + "tp_degree": 2 + }, + "num_attention_heads": 32, + "num_hidden_layers": 16, + "num_key_value_heads": 8, + "pretraining_tp": 1, + "rms_norm_eps": 1e-05, + "rope_scaling": { + "factor": 32.0, + "high_freq_factor": 4.0, + "low_freq_factor": 1.0, + "original_max_position_embeddings": 8192, + "rope_type": "llama3" + }, + "rope_theta": 500000.0, + "tie_word_embeddings": true, + "unsloth_fixed": true, + "use_cache": true, + "vocab_size": 128256 +} \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/llama/unsloth/Llama-3.2-1B-Instruct/e75d2005d39261b7d1d8.json b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/llama/unsloth/Llama-3.2-1B-Instruct/e75d2005d39261b7d1d8.json new file mode 100644 index 0000000000000000000000000000000000000000..414e12ffe0e80f2374f0def3ca2478102205f4f7 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/llama/unsloth/Llama-3.2-1B-Instruct/e75d2005d39261b7d1d8.json @@ -0,0 +1,64 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "unsloth/Llama-3.2-1B-Instruct", + "_task": "text-generation", + "architectures": [ + "LlamaForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "dtype": "bfloat16", + "head_dim": 64, + "hidden_act": "silu", + "hidden_size": 2048, + "initializer_range": 0.02, + "intermediate_size": 8192, + "max_position_embeddings": 131072, + "mlp_bias": false, + "model_type": "llama", + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "batch_size": 1, + "capacity_factor": null, + "checkpoint_id": "unsloth/Llama-3.2-1B-Instruct", + "checkpoint_revision": "5a8abab4a5d6f164389b1079fb721cfab8d7126c", + "continuous_batching": false, + "ep_degree": 1, + "fused_qkv": true, + "glu_mlp": true, + "local_ranks_size": 2, + "max_batch_size": 1, + "max_context_length": 4096, + "max_topk": 256, + "n_active_tokens": 4096, + "neuronxcc_version": "2.21.33363.0+82129205", + "on_device_sampling": true, + "optimum_neuron_version": "0.4.3.dev3", + "output_logits": false, + "pp_degree": 1, + "sequence_length": 4096, + "sequence_parallel_enabled": true, + "speculation_length": 0, + "start_rank_id": 0, + "target": "trn1", + "torch_dtype": "bfloat16", + "tp_degree": 2 + }, + "num_attention_heads": 32, + "num_hidden_layers": 16, + "num_key_value_heads": 8, + "pretraining_tp": 1, + "rms_norm_eps": 1e-05, + "rope_scaling": { + "factor": 32.0, + "high_freq_factor": 4.0, + "low_freq_factor": 1.0, + "original_max_position_embeddings": 8192, + "rope_type": "llama3" + }, + "rope_theta": 500000.0, + "tie_word_embeddings": true, + "unsloth_fixed": true, + "use_cache": true, + "vocab_size": 128256 +} \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/llama/unsloth/Llama-3.2-1B-Instruct/ea31be52d67b5f045068.json b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/llama/unsloth/Llama-3.2-1B-Instruct/ea31be52d67b5f045068.json new file mode 100644 index 0000000000000000000000000000000000000000..9df8e0febae6828621c923ae3cce1267a1a83351 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/llama/unsloth/Llama-3.2-1B-Instruct/ea31be52d67b5f045068.json @@ -0,0 +1,64 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "unsloth/Llama-3.2-1B-Instruct", + "_task": "text-generation", + "architectures": [ + "LlamaForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "dtype": "bfloat16", + "head_dim": 64, + "hidden_act": "silu", + "hidden_size": 2048, + "initializer_range": 0.02, + "intermediate_size": 8192, + "max_position_embeddings": 131072, + "mlp_bias": false, + "model_type": "llama", + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "batch_size": 1, + "capacity_factor": null, + "checkpoint_id": "unsloth/Llama-3.2-1B-Instruct", + "checkpoint_revision": null, + "continuous_batching": false, + "ep_degree": 1, + "fused_qkv": false, + "glu_mlp": true, + "local_ranks_size": 2, + "max_batch_size": 1, + "max_context_length": 4096, + "max_topk": 256, + "n_active_tokens": 4096, + "neuronxcc_version": "2.21.33363.0+82129205", + "on_device_sampling": false, + "optimum_neuron_version": "0.4.3.dev3", + "output_logits": false, + "pp_degree": 1, + "sequence_length": 4096, + "sequence_parallel_enabled": false, + "speculation_length": 0, + "start_rank_id": 0, + "target": "trn1", + "torch_dtype": "bfloat16", + "tp_degree": 2 + }, + "num_attention_heads": 32, + "num_hidden_layers": 16, + "num_key_value_heads": 8, + "pretraining_tp": 1, + "rms_norm_eps": 1e-05, + "rope_scaling": { + "factor": 32.0, + "high_freq_factor": 4.0, + "low_freq_factor": 1.0, + "original_max_position_embeddings": 8192, + "rope_type": "llama3" + }, + "rope_theta": 500000.0, + "tie_word_embeddings": true, + "unsloth_fixed": true, + "use_cache": true, + "vocab_size": 128256 +} \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/llama4_text/tiny-random/llama-4/663adc121ad6f0bf6c41.json b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/llama4_text/tiny-random/llama-4/663adc121ad6f0bf6c41.json new file mode 100644 index 0000000000000000000000000000000000000000..4c08759982b036f55f8dde88b082e3ea0236d4ac --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/llama4_text/tiny-random/llama-4/663adc121ad6f0bf6c41.json @@ -0,0 +1,82 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "tiny-random/llama-4", + "_task": "text-generation", + "attention_bias": false, + "attention_chunk_size": 128, + "attention_dropout": 0.0, + "attn_scale": 0.1, + "attn_temperature_tuning": 4, + "cache_implementation": "hybrid", + "dtype": "bfloat16", + "floor_scale": 8192, + "for_llm_compressor": false, + "head_dim": 32, + "hidden_act": "silu", + "hidden_size": 32, + "initializer_range": 0.02, + "interleave_moe_layer_step": 2, + "intermediate_size": 64, + "intermediate_size_mlp": 128, + "layer_types": [ + "chunked_attention", + "chunked_attention", + "chunked_attention", + "full_attention" + ], + "max_position_embeddings": 1048576, + "model_type": "llama4_text", + "moe_layers": [ + 1, + 3 + ], + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "batch_size": 1, + "capacity_factor": null, + "checkpoint_id": "tiny-random/llama-4", + "checkpoint_revision": "9e716f5d4d1ffe0a44a15f46f4a12b840439aba4", + "continuous_batching": false, + "ep_degree": 1, + "fused_qkv": false, + "glu_mlp": true, + "local_ranks_size": 2, + "max_batch_size": 1, + "max_context_length": 1024, + "max_topk": 256, + "n_active_tokens": 1024, + "neuronxcc_version": "2.21.33363.0+82129205", + "on_device_sampling": true, + "optimum_neuron_version": "0.4.3.dev3", + "output_logits": false, + "pp_degree": 1, + "sequence_length": 1024, + "sequence_parallel_enabled": false, + "speculation_length": 0, + "start_rank_id": 0, + "target": "trn1", + "torch_dtype": "bfloat16", + "tp_degree": 2 + }, + "no_rope_layers": [ + 1, + 1, + 1, + 0 + ], + "num_attention_heads": 1, + "num_experts_per_tok": 1, + "num_hidden_layers": 4, + "num_key_value_heads": 1, + "num_local_experts": 8, + "output_router_logits": false, + "rms_norm_eps": 1e-05, + "rope_scaling": null, + "rope_theta": 500000.0, + "router_aux_loss_coef": 0.001, + "router_jitter_noise": 0.0, + "tie_word_embeddings": true, + "use_cache": true, + "use_qk_norm": true, + "vocab_size": 202048 +} \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/mixtral/dacorvo/Mixtral-tiny/2115b9307dea032bae46.json b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/mixtral/dacorvo/Mixtral-tiny/2115b9307dea032bae46.json new file mode 100644 index 0000000000000000000000000000000000000000..2618688721dbf26e95a54b4080c355d4a2d418a2 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/mixtral/dacorvo/Mixtral-tiny/2115b9307dea032bae46.json @@ -0,0 +1,58 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "dacorvo/Mixtral-tiny", + "_task": "text-generation", + "architectures": [ + "MixtralForCausalLM" + ], + "attention_dropout": 0.0, + "dtype": "float16", + "head_dim": 32, + "hidden_act": "silu", + "hidden_size": 1024, + "initializer_range": 0.02, + "intermediate_size": 3584, + "max_position_embeddings": 1024, + "model_type": "mixtral", + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "batch_size": 1, + "capacity_factor": null, + "checkpoint_id": "dacorvo/Mixtral-tiny", + "checkpoint_revision": "c557ba205ddff6ea911f4719e0d543d6c08356b6", + "continuous_batching": false, + "ep_degree": 1, + "fused_qkv": false, + "glu_mlp": true, + "local_ranks_size": 2, + "max_batch_size": 1, + "max_context_length": 1024, + "max_topk": 256, + "n_active_tokens": 1024, + "neuronxcc_version": "2.21.33363.0+82129205", + "on_device_sampling": false, + "optimum_neuron_version": "0.4.3.dev3", + "output_logits": false, + "pp_degree": 1, + "sequence_length": 1024, + "speculation_length": 0, + "start_rank_id": 0, + "target": "trn1", + "torch_dtype": "float16", + "tp_degree": 2 + }, + "num_attention_heads": 32, + "num_experts_per_tok": 2, + "num_hidden_layers": 2, + "num_key_value_heads": 8, + "num_local_experts": 8, + "output_router_logits": false, + "rms_norm_eps": 1e-05, + "rope_theta": 10000.0, + "router_aux_loss_coef": 0.001, + "router_jitter_noise": 0.0, + "sliding_window": 4096, + "tie_word_embeddings": false, + "use_cache": true, + "vocab_size": 32000 +} \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/mixtral/dacorvo/Mixtral-tiny/6c78d4e7067fedb8c6d8.json b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/mixtral/dacorvo/Mixtral-tiny/6c78d4e7067fedb8c6d8.json new file mode 100644 index 0000000000000000000000000000000000000000..6531218cdfc5fcfd5f3ea2c92614d4d5a0e1ccb5 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/mixtral/dacorvo/Mixtral-tiny/6c78d4e7067fedb8c6d8.json @@ -0,0 +1,59 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "dacorvo/Mixtral-tiny", + "_task": "text-generation", + "architectures": [ + "MixtralForCausalLM" + ], + "attention_dropout": 0.0, + "dtype": "float16", + "head_dim": 32, + "hidden_act": "silu", + "hidden_size": 1024, + "initializer_range": 0.02, + "intermediate_size": 3584, + "max_position_embeddings": 1024, + "model_type": "mixtral", + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "batch_size": 1, + "capacity_factor": null, + "checkpoint_id": "dacorvo/Mixtral-tiny", + "checkpoint_revision": "c557ba205ddff6ea911f4719e0d543d6c08356b6", + "continuous_batching": false, + "ep_degree": 1, + "fused_qkv": false, + "glu_mlp": true, + "local_ranks_size": 2, + "max_batch_size": 1, + "max_context_length": 1024, + "max_topk": 256, + "n_active_tokens": 1024, + "neuronxcc_version": "2.21.33363.0+82129205", + "on_device_sampling": false, + "optimum_neuron_version": "0.4.3.dev3", + "output_logits": false, + "pp_degree": 1, + "sequence_length": 1024, + "sequence_parallel_enabled": false, + "speculation_length": 0, + "start_rank_id": 0, + "target": "trn1", + "torch_dtype": "float16", + "tp_degree": 2 + }, + "num_attention_heads": 32, + "num_experts_per_tok": 2, + "num_hidden_layers": 2, + "num_key_value_heads": 8, + "num_local_experts": 8, + "output_router_logits": false, + "rms_norm_eps": 1e-05, + "rope_theta": 10000.0, + "router_aux_loss_coef": 0.001, + "router_jitter_noise": 0.0, + "sliding_window": 4096, + "tie_word_embeddings": false, + "use_cache": true, + "vocab_size": 32000 +} \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/phi3/microsoft/Phi-3-mini-4k-instruct/606cd550f76180b896b7.json b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/phi3/microsoft/Phi-3-mini-4k-instruct/606cd550f76180b896b7.json new file mode 100644 index 0000000000000000000000000000000000000000..0551d94eb085b9c070ac05c943bc3a7d8746d896 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/phi3/microsoft/Phi-3-mini-4k-instruct/606cd550f76180b896b7.json @@ -0,0 +1,63 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "microsoft/Phi-3-mini-4k-instruct", + "_task": "text-generation", + "architectures": [ + "Phi3ForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "auto_map": { + "AutoConfig": "configuration_phi3.Phi3Config", + "AutoModelForCausalLM": "modeling_phi3.Phi3ForCausalLM" + }, + "dtype": "bfloat16", + "embd_pdrop": 0.0, + "hidden_act": "silu", + "hidden_size": 3072, + "initializer_range": 0.02, + "intermediate_size": 8192, + "max_position_embeddings": 4096, + "model_type": "phi3", + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "batch_size": 4, + "capacity_factor": null, + "checkpoint_id": "microsoft/Phi-3-mini-4k-instruct", + "checkpoint_revision": "f39ac1d28e925b323eae81227eaba4464caced4e", + "continuous_batching": true, + "ep_degree": 1, + "fused_qkv": true, + "glu_mlp": true, + "local_ranks_size": 2, + "max_batch_size": 4, + "max_context_length": 4096, + "max_topk": 256, + "n_active_tokens": 4096, + "neuronxcc_version": "2.21.33363.0+82129205", + "on_device_sampling": true, + "optimum_neuron_version": "0.4.3.dev3", + "output_logits": false, + "pp_degree": 1, + "sequence_length": 4096, + "sequence_parallel_enabled": false, + "speculation_length": 0, + "start_rank_id": 0, + "target": "trn1", + "torch_dtype": "bfloat16", + "tp_degree": 2 + }, + "num_attention_heads": 32, + "num_hidden_layers": 32, + "num_key_value_heads": 32, + "original_max_position_embeddings": 4096, + "partial_rotary_factor": 1.0, + "resid_pdrop": 0.0, + "rms_norm_eps": 1e-05, + "rope_scaling": null, + "rope_theta": 10000.0, + "sliding_window": 2047, + "tie_word_embeddings": false, + "use_cache": true, + "vocab_size": 32064 +} \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/phi3/microsoft/Phi-3-mini-4k-instruct/7a02cab53063011b4bcd.json b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/phi3/microsoft/Phi-3-mini-4k-instruct/7a02cab53063011b4bcd.json new file mode 100644 index 0000000000000000000000000000000000000000..bb6303771722427d2e2534559b4d6352dc101fe9 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/phi3/microsoft/Phi-3-mini-4k-instruct/7a02cab53063011b4bcd.json @@ -0,0 +1,62 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "microsoft/Phi-3-mini-4k-instruct", + "_task": "text-generation", + "architectures": [ + "Phi3ForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "auto_map": { + "AutoConfig": "configuration_phi3.Phi3Config", + "AutoModelForCausalLM": "modeling_phi3.Phi3ForCausalLM" + }, + "dtype": "bfloat16", + "embd_pdrop": 0.0, + "hidden_act": "silu", + "hidden_size": 3072, + "initializer_range": 0.02, + "intermediate_size": 8192, + "max_position_embeddings": 4096, + "model_type": "phi3", + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "batch_size": 4, + "capacity_factor": null, + "checkpoint_id": "microsoft/Phi-3-mini-4k-instruct", + "checkpoint_revision": "f39ac1d28e925b323eae81227eaba4464caced4e", + "continuous_batching": true, + "ep_degree": 1, + "fused_qkv": true, + "glu_mlp": true, + "local_ranks_size": 2, + "max_batch_size": 4, + "max_context_length": 4096, + "max_topk": 256, + "n_active_tokens": 4096, + "neuronxcc_version": "2.21.33363.0+82129205", + "on_device_sampling": true, + "optimum_neuron_version": "0.4.3.dev3", + "output_logits": false, + "pp_degree": 1, + "sequence_length": 4096, + "speculation_length": 0, + "start_rank_id": 0, + "target": "trn1", + "torch_dtype": "bfloat16", + "tp_degree": 2 + }, + "num_attention_heads": 32, + "num_hidden_layers": 32, + "num_key_value_heads": 32, + "original_max_position_embeddings": 4096, + "partial_rotary_factor": 1.0, + "resid_pdrop": 0.0, + "rms_norm_eps": 1e-05, + "rope_scaling": null, + "rope_theta": 10000.0, + "sliding_window": 2047, + "tie_word_embeddings": false, + "use_cache": true, + "vocab_size": 32064 +} \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/phi3/yujiepan/phi-4-tiny-random/9830c1de6c2e8faed0c8.json b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/phi3/yujiepan/phi-4-tiny-random/9830c1de6c2e8faed0c8.json new file mode 100644 index 0000000000000000000000000000000000000000..6eb10d1cf9056c8c5895ea3b4365ba6c8d7a40ab --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/phi3/yujiepan/phi-4-tiny-random/9830c1de6c2e8faed0c8.json @@ -0,0 +1,60 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "yujiepan/phi-4-tiny-random", + "_task": "text-generation", + "architectures": [ + "Phi3ForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "auto_map": {}, + "dtype": "bfloat16", + "embd_pdrop": 0.0, + "hidden_act": "silu", + "hidden_size": 16, + "initializer_range": 0.02, + "intermediate_size": 32, + "max_position_embeddings": 16384, + "model_type": "phi3", + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "batch_size": 1, + "capacity_factor": null, + "checkpoint_id": "yujiepan/phi-4-tiny-random", + "checkpoint_revision": "18a9a1168dc97ac6d128f811925670c275610f5a", + "continuous_batching": false, + "ep_degree": 1, + "fused_qkv": true, + "glu_mlp": true, + "local_ranks_size": 2, + "max_batch_size": 1, + "max_context_length": 1024, + "max_topk": 256, + "n_active_tokens": 1024, + "neuronxcc_version": "2.21.33363.0+82129205", + "on_device_sampling": true, + "optimum_neuron_version": "0.4.3.dev3", + "output_logits": false, + "pp_degree": 1, + "sequence_length": 1024, + "sequence_parallel_enabled": false, + "speculation_length": 0, + "start_rank_id": 0, + "target": "trn1", + "torch_dtype": "bfloat16", + "tp_degree": 2 + }, + "num_attention_heads": 2, + "num_hidden_layers": 2, + "num_key_value_heads": 1, + "original_max_position_embeddings": 16384, + "partial_rotary_factor": 1.0, + "resid_pdrop": 0.0, + "rms_norm_eps": 1e-05, + "rope_scaling": null, + "rope_theta": 250000, + "sliding_window": null, + "tie_word_embeddings": false, + "use_cache": true, + "vocab_size": 100352 +} \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/qwen2/Qwen/Qwen2.5-0.5B/49a52397959b42823ec6.json b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/qwen2/Qwen/Qwen2.5-0.5B/49a52397959b42823ec6.json new file mode 100644 index 0000000000000000000000000000000000000000..e1d2745b21a07ca824f61059821dabd06dcaeec3 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/qwen2/Qwen/Qwen2.5-0.5B/49a52397959b42823ec6.json @@ -0,0 +1,82 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "Qwen/Qwen2.5-0.5B", + "_task": "text-generation", + "architectures": [ + "Qwen2ForCausalLM" + ], + "attention_dropout": 0.0, + "dtype": "bfloat16", + "hidden_act": "silu", + "hidden_size": 896, + "initializer_range": 0.02, + "intermediate_size": 4864, + "layer_types": [ + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention" + ], + "max_position_embeddings": 32768, + "max_window_layers": 24, + "model_type": "qwen2", + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "batch_size": 4, + "capacity_factor": null, + "checkpoint_id": "Qwen/Qwen2.5-0.5B", + "checkpoint_revision": "060db6499f32faf8b98477b0a26969ef7d8b9987", + "continuous_batching": true, + "ep_degree": 1, + "fused_qkv": false, + "glu_mlp": true, + "local_ranks_size": 2, + "max_batch_size": 4, + "max_context_length": 4096, + "max_topk": 256, + "n_active_tokens": 4096, + "neuronxcc_version": "2.21.33363.0+82129205", + "on_device_sampling": false, + "optimum_neuron_version": "0.4.3.dev3", + "output_logits": false, + "pp_degree": 1, + "sequence_length": 4096, + "speculation_length": 0, + "start_rank_id": 0, + "target": "trn1", + "torch_dtype": "bfloat16", + "tp_degree": 2 + }, + "num_attention_heads": 14, + "num_hidden_layers": 24, + "num_key_value_heads": 2, + "rms_norm_eps": 1e-06, + "rope_scaling": null, + "rope_theta": 1000000.0, + "sliding_window": null, + "tie_word_embeddings": true, + "use_cache": true, + "use_mrope": false, + "use_sliding_window": false, + "vocab_size": 151936 +} \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/qwen2/Qwen/Qwen2.5-0.5B/cf30894023926ebec49a.json b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/qwen2/Qwen/Qwen2.5-0.5B/cf30894023926ebec49a.json new file mode 100644 index 0000000000000000000000000000000000000000..16a5f6696925c17cdd881834106f8f659e1db2bb --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/qwen2/Qwen/Qwen2.5-0.5B/cf30894023926ebec49a.json @@ -0,0 +1,83 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "Qwen/Qwen2.5-0.5B", + "_task": "text-generation", + "architectures": [ + "Qwen2ForCausalLM" + ], + "attention_dropout": 0.0, + "dtype": "bfloat16", + "hidden_act": "silu", + "hidden_size": 896, + "initializer_range": 0.02, + "intermediate_size": 4864, + "layer_types": [ + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention" + ], + "max_position_embeddings": 32768, + "max_window_layers": 24, + "model_type": "qwen2", + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "batch_size": 4, + "capacity_factor": null, + "checkpoint_id": "Qwen/Qwen2.5-0.5B", + "checkpoint_revision": "060db6499f32faf8b98477b0a26969ef7d8b9987", + "continuous_batching": true, + "ep_degree": 1, + "fused_qkv": false, + "glu_mlp": true, + "local_ranks_size": 2, + "max_batch_size": 4, + "max_context_length": 4096, + "max_topk": 256, + "n_active_tokens": 4096, + "neuronxcc_version": "2.21.33363.0+82129205", + "on_device_sampling": false, + "optimum_neuron_version": "0.4.3.dev3", + "output_logits": false, + "pp_degree": 1, + "sequence_length": 4096, + "sequence_parallel_enabled": false, + "speculation_length": 0, + "start_rank_id": 0, + "target": "trn1", + "torch_dtype": "bfloat16", + "tp_degree": 2 + }, + "num_attention_heads": 14, + "num_hidden_layers": 24, + "num_key_value_heads": 2, + "rms_norm_eps": 1e-06, + "rope_scaling": null, + "rope_theta": 1000000.0, + "sliding_window": null, + "tie_word_embeddings": true, + "use_cache": true, + "use_mrope": false, + "use_sliding_window": false, + "vocab_size": 151936 +} \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/qwen2/yujiepan/qwen2.5-128k-tiny-random/d2ffa119e8a8f246f65e.json b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/qwen2/yujiepan/qwen2.5-128k-tiny-random/d2ffa119e8a8f246f65e.json new file mode 100644 index 0000000000000000000000000000000000000000..5ffa20032c4158f27561ddc4b2d5ceed0ad2a415 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/qwen2/yujiepan/qwen2.5-128k-tiny-random/d2ffa119e8a8f246f65e.json @@ -0,0 +1,65 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "yujiepan/qwen2.5-128k-tiny-random", + "_task": "text-generation", + "architectures": [ + "Qwen2ForCausalLM" + ], + "attention_dropout": 0.0, + "dtype": "bfloat16", + "hidden_act": "silu", + "hidden_size": 8, + "initializer_range": 0.02, + "intermediate_size": 16, + "layer_types": [ + "full_attention", + "full_attention" + ], + "max_position_embeddings": 32768, + "max_window_layers": 1, + "model_type": "qwen2", + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "batch_size": 1, + "capacity_factor": null, + "checkpoint_id": "yujiepan/qwen2.5-128k-tiny-random", + "checkpoint_revision": "c8296d4ca3f87782876d2382fbb6481d1beb8ef0", + "continuous_batching": false, + "ep_degree": 1, + "fused_qkv": false, + "glu_mlp": true, + "local_ranks_size": 2, + "max_batch_size": 1, + "max_context_length": 1024, + "max_topk": 256, + "n_active_tokens": 1024, + "neuronxcc_version": "2.21.33363.0+82129205", + "on_device_sampling": true, + "optimum_neuron_version": "0.4.3.dev3", + "output_logits": false, + "pp_degree": 1, + "sequence_length": 1024, + "sequence_parallel_enabled": false, + "speculation_length": 0, + "start_rank_id": 0, + "target": "trn1", + "torch_dtype": "bfloat16", + "tp_degree": 2 + }, + "num_attention_heads": 4, + "num_hidden_layers": 2, + "num_key_value_heads": 2, + "rms_norm_eps": 1e-06, + "rope_scaling": { + "factor": 4.0, + "original_max_position_embeddings": 32768, + "rope_type": "yarn", + "type": "yarn" + }, + "rope_theta": 1000000.0, + "sliding_window": null, + "tie_word_embeddings": false, + "use_cache": true, + "use_sliding_window": false, + "vocab_size": 152064 +} \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/qwen3/Qwen/Qwen3-0.6B/19b1a0628bd4d98a32cd.json b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/qwen3/Qwen/Qwen3-0.6B/19b1a0628bd4d98a32cd.json new file mode 100644 index 0000000000000000000000000000000000000000..0c204b14b0f41f261aaa07a9d5fa1020098ae0b8 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/qwen3/Qwen/Qwen3-0.6B/19b1a0628bd4d98a32cd.json @@ -0,0 +1,87 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "Qwen/Qwen3-0.6B", + "_task": "text-generation", + "architectures": [ + "Qwen3ForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "dtype": "bfloat16", + "head_dim": 128, + "hidden_act": "silu", + "hidden_size": 1024, + "initializer_range": 0.02, + "intermediate_size": 3072, + "layer_types": [ + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention" + ], + "max_position_embeddings": 40960, + "max_window_layers": 28, + "model_type": "qwen3", + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "batch_size": 4, + "capacity_factor": null, + "checkpoint_id": "Qwen/Qwen3-0.6B", + "checkpoint_revision": "c1899de289a04d12100db370d81485cdf75e47ca", + "continuous_batching": true, + "ep_degree": 1, + "fused_qkv": true, + "glu_mlp": true, + "local_ranks_size": 2, + "max_batch_size": 4, + "max_context_length": 4096, + "max_topk": 256, + "n_active_tokens": 4096, + "neuronxcc_version": "2.21.33363.0+82129205", + "on_device_sampling": false, + "optimum_neuron_version": "0.4.3.dev3", + "output_logits": false, + "pp_degree": 1, + "sequence_length": 4096, + "speculation_length": 0, + "start_rank_id": 0, + "target": "trn1", + "torch_dtype": "bfloat16", + "tp_degree": 2 + }, + "num_attention_heads": 16, + "num_hidden_layers": 28, + "num_key_value_heads": 8, + "rms_norm_eps": 1e-06, + "rope_scaling": null, + "rope_theta": 1000000, + "sliding_window": null, + "tie_word_embeddings": true, + "use_cache": true, + "use_sliding_window": false, + "vocab_size": 151936 +} \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/qwen3/Qwen/Qwen3-0.6B/b07ee07074b519837e2e.json b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/qwen3/Qwen/Qwen3-0.6B/b07ee07074b519837e2e.json new file mode 100644 index 0000000000000000000000000000000000000000..aacadb32d28bd56305f643c2218c34ea8534bece --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/qwen3/Qwen/Qwen3-0.6B/b07ee07074b519837e2e.json @@ -0,0 +1,88 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "Qwen/Qwen3-0.6B", + "_task": "text-generation", + "architectures": [ + "Qwen3ForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "dtype": "bfloat16", + "head_dim": 128, + "hidden_act": "silu", + "hidden_size": 1024, + "initializer_range": 0.02, + "intermediate_size": 3072, + "layer_types": [ + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention" + ], + "max_position_embeddings": 40960, + "max_window_layers": 28, + "model_type": "qwen3", + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "batch_size": 4, + "capacity_factor": null, + "checkpoint_id": "Qwen/Qwen3-0.6B", + "checkpoint_revision": "c1899de289a04d12100db370d81485cdf75e47ca", + "continuous_batching": true, + "ep_degree": 1, + "fused_qkv": true, + "glu_mlp": true, + "local_ranks_size": 2, + "max_batch_size": 4, + "max_context_length": 4096, + "max_topk": 256, + "n_active_tokens": 4096, + "neuronxcc_version": "2.21.33363.0+82129205", + "on_device_sampling": false, + "optimum_neuron_version": "0.4.3.dev3", + "output_logits": false, + "pp_degree": 1, + "sequence_length": 4096, + "sequence_parallel_enabled": false, + "speculation_length": 0, + "start_rank_id": 0, + "target": "trn1", + "torch_dtype": "bfloat16", + "tp_degree": 2 + }, + "num_attention_heads": 16, + "num_hidden_layers": 28, + "num_key_value_heads": 8, + "rms_norm_eps": 1e-06, + "rope_scaling": null, + "rope_theta": 1000000, + "sliding_window": null, + "tie_word_embeddings": true, + "use_cache": true, + "use_sliding_window": false, + "vocab_size": 151936 +} \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/qwen3_moe/optimum-internal-testing/tiny-random-qwen3_moe/35684b74302809c36482.json b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/qwen3_moe/optimum-internal-testing/tiny-random-qwen3_moe/35684b74302809c36482.json new file mode 100644 index 0000000000000000000000000000000000000000..f9c23f3f9471ee957c95e9178095bf9a849cc358 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/qwen3_moe/optimum-internal-testing/tiny-random-qwen3_moe/35684b74302809c36482.json @@ -0,0 +1,66 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "optimum-internal-testing/tiny-random-qwen3_moe", + "_task": "text-generation", + "architectures": [ + "Qwen3MoeForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "decoder_sparse_step": 2, + "dtype": "float32", + "head_dim": 32, + "hidden_act": "silu", + "hidden_size": 64, + "initializer_range": 0.02, + "intermediate_size": 128, + "max_position_embeddings": 40960, + "max_window_layers": 1, + "mlp_only_layers": [], + "model_type": "qwen3_moe", + "moe_intermediate_size": 128, + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "batch_size": 1, + "capacity_factor": null, + "checkpoint_id": "optimum-internal-testing/tiny-random-qwen3_moe", + "checkpoint_revision": "e0230be2839556b44b7400a233c73c74b4abb7af", + "continuous_batching": false, + "ep_degree": 1, + "fused_qkv": false, + "glu_mlp": true, + "local_ranks_size": 2, + "max_batch_size": 1, + "max_context_length": 1024, + "max_topk": 256, + "n_active_tokens": 1024, + "neuronxcc_version": "2.21.33363.0+82129205", + "on_device_sampling": true, + "optimum_neuron_version": "0.4.3.dev3", + "output_logits": false, + "pp_degree": 1, + "sequence_length": 1024, + "sequence_parallel_enabled": false, + "speculation_length": 0, + "start_rank_id": 0, + "target": "trn1", + "torch_dtype": "float32", + "tp_degree": 2 + }, + "norm_topk_prob": true, + "num_attention_heads": 2, + "num_experts": 8, + "num_experts_per_tok": 2, + "num_hidden_layers": 2, + "num_key_value_heads": 1, + "output_router_logits": false, + "rms_norm_eps": 1e-06, + "rope_scaling": null, + "rope_theta": 1000000.0, + "router_aux_loss_coef": 0.001, + "sliding_window": null, + "tie_word_embeddings": true, + "use_cache": true, + "use_sliding_window": false, + "vocab_size": 151936 +} \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/smollm3/HuggingFaceTB/SmolLM3-3B/0d500de1edebf543a09c.json b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/smollm3/HuggingFaceTB/SmolLM3-3B/0d500de1edebf543a09c.json new file mode 100644 index 0000000000000000000000000000000000000000..31996dd74634e70765c7a97f116b806cbaeeafc4 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/smollm3/HuggingFaceTB/SmolLM3-3B/0d500de1edebf543a09c.json @@ -0,0 +1,135 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "HuggingFaceTB/SmolLM3-3B", + "_task": "text-generation", + "architectures": [ + "SmolLM3ForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "dtype": "bfloat16", + "hidden_act": "silu", + "hidden_size": 2048, + "initializer_range": 0.02, + "intermediate_size": 11008, + "layer_types": [ + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention" + ], + "max_position_embeddings": 65536, + "max_window_layers": 28, + "mlp_bias": false, + "model_type": "smollm3", + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "batch_size": 4, + "capacity_factor": null, + "checkpoint_id": "HuggingFaceTB/SmolLM3-3B", + "checkpoint_revision": "a07cc9a04f16550a088caea529712d1d335b0ac1", + "continuous_batching": true, + "ep_degree": 1, + "fused_qkv": true, + "glu_mlp": true, + "local_ranks_size": 2, + "max_batch_size": 4, + "max_context_length": 4096, + "max_topk": 256, + "n_active_tokens": 4096, + "neuronxcc_version": "2.21.33363.0+82129205", + "on_device_sampling": true, + "optimum_neuron_version": "0.4.3.dev3", + "output_logits": false, + "pp_degree": 1, + "sequence_length": 4096, + "sequence_parallel_enabled": false, + "speculation_length": 0, + "start_rank_id": 0, + "target": "trn1", + "torch_dtype": "bfloat16", + "tp_degree": 2 + }, + "no_rope_layer_interval": 4, + "no_rope_layers": [ + 1, + 1, + 1, + 0, + 1, + 1, + 1, + 0, + 1, + 1, + 1, + 0, + 1, + 1, + 1, + 0, + 1, + 1, + 1, + 0, + 1, + 1, + 1, + 0, + 1, + 1, + 1, + 0, + 1, + 1, + 1, + 0, + 1, + 1, + 1, + 0 + ], + "num_attention_heads": 16, + "num_hidden_layers": 36, + "num_key_value_heads": 4, + "pretraining_tp": 2, + "rms_norm_eps": 1e-06, + "rope_scaling": null, + "rope_theta": 5000000.0, + "sliding_window": null, + "use_cache": false, + "use_sliding_window": false, + "vocab_size": 128256 +} \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/smollm3/HuggingFaceTB/SmolLM3-3B/9a47a3a9f135594c847d.json b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/smollm3/HuggingFaceTB/SmolLM3-3B/9a47a3a9f135594c847d.json new file mode 100644 index 0000000000000000000000000000000000000000..7f62300262e7600b998c6e2f2367f65a901d70ff --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/smollm3/HuggingFaceTB/SmolLM3-3B/9a47a3a9f135594c847d.json @@ -0,0 +1,135 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "HuggingFaceTB/SmolLM3-3B", + "_task": "text-generation", + "architectures": [ + "SmolLM3ForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "dtype": "bfloat16", + "hidden_act": "silu", + "hidden_size": 2048, + "initializer_range": 0.02, + "intermediate_size": 11008, + "layer_types": [ + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention" + ], + "max_position_embeddings": 65536, + "max_window_layers": 28, + "mlp_bias": false, + "model_type": "smollm3", + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "batch_size": 1, + "capacity_factor": null, + "checkpoint_id": "HuggingFaceTB/SmolLM3-3B", + "checkpoint_revision": "a07cc9a04f16550a088caea529712d1d335b0ac1", + "continuous_batching": false, + "ep_degree": 1, + "fused_qkv": true, + "glu_mlp": true, + "local_ranks_size": 2, + "max_batch_size": 1, + "max_context_length": 1024, + "max_topk": 256, + "n_active_tokens": 1024, + "neuronxcc_version": "2.21.33363.0+82129205", + "on_device_sampling": true, + "optimum_neuron_version": "0.4.3.dev3", + "output_logits": false, + "pp_degree": 1, + "sequence_length": 1024, + "sequence_parallel_enabled": false, + "speculation_length": 0, + "start_rank_id": 0, + "target": "trn1", + "torch_dtype": "bfloat16", + "tp_degree": 2 + }, + "no_rope_layer_interval": 4, + "no_rope_layers": [ + 1, + 1, + 1, + 0, + 1, + 1, + 1, + 0, + 1, + 1, + 1, + 0, + 1, + 1, + 1, + 0, + 1, + 1, + 1, + 0, + 1, + 1, + 1, + 0, + 1, + 1, + 1, + 0, + 1, + 1, + 1, + 0, + 1, + 1, + 1, + 0 + ], + "num_attention_heads": 16, + "num_hidden_layers": 36, + "num_key_value_heads": 4, + "pretraining_tp": 2, + "rms_norm_eps": 1e-06, + "rope_scaling": null, + "rope_theta": 5000000.0, + "sliding_window": null, + "use_cache": false, + "use_sliding_window": false, + "vocab_size": 128256 +} \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/smollm3/HuggingFaceTB/SmolLM3-3B/f30f56d7ee477331eddd.json b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/smollm3/HuggingFaceTB/SmolLM3-3B/f30f56d7ee477331eddd.json new file mode 100644 index 0000000000000000000000000000000000000000..ffa8ddf9b17d01bb5ef4686891e5c9c710e6d3be --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev3/smollm3/HuggingFaceTB/SmolLM3-3B/f30f56d7ee477331eddd.json @@ -0,0 +1,134 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "HuggingFaceTB/SmolLM3-3B", + "_task": "text-generation", + "architectures": [ + "SmolLM3ForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "dtype": "bfloat16", + "hidden_act": "silu", + "hidden_size": 2048, + "initializer_range": 0.02, + "intermediate_size": 11008, + "layer_types": [ + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention" + ], + "max_position_embeddings": 65536, + "max_window_layers": 28, + "mlp_bias": false, + "model_type": "smollm3", + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "batch_size": 4, + "capacity_factor": null, + "checkpoint_id": "HuggingFaceTB/SmolLM3-3B", + "checkpoint_revision": "a07cc9a04f16550a088caea529712d1d335b0ac1", + "continuous_batching": true, + "ep_degree": 1, + "fused_qkv": true, + "glu_mlp": true, + "local_ranks_size": 2, + "max_batch_size": 4, + "max_context_length": 4096, + "max_topk": 256, + "n_active_tokens": 4096, + "neuronxcc_version": "2.21.33363.0+82129205", + "on_device_sampling": true, + "optimum_neuron_version": "0.4.3.dev3", + "output_logits": false, + "pp_degree": 1, + "sequence_length": 4096, + "speculation_length": 0, + "start_rank_id": 0, + "target": "trn1", + "torch_dtype": "bfloat16", + "tp_degree": 2 + }, + "no_rope_layer_interval": 4, + "no_rope_layers": [ + 1, + 1, + 1, + 0, + 1, + 1, + 1, + 0, + 1, + 1, + 1, + 0, + 1, + 1, + 1, + 0, + 1, + 1, + 1, + 0, + 1, + 1, + 1, + 0, + 1, + 1, + 1, + 0, + 1, + 1, + 1, + 0, + 1, + 1, + 1, + 0 + ], + "num_attention_heads": 16, + "num_hidden_layers": 36, + "num_key_value_heads": 4, + "pretraining_tp": 2, + "rms_norm_eps": 1e-06, + "rope_scaling": null, + "rope_theta": 5000000.0, + "sliding_window": null, + "use_cache": false, + "use_sliding_window": false, + "vocab_size": 128256 +} \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.5.dev1/3338d63843deff76593f3d84514682d027ea1b76f25961369968d0a698b30250/8672676a3375e884cc27.json b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.5.dev1/3338d63843deff76593f3d84514682d027ea1b76f25961369968d0a698b30250/8672676a3375e884cc27.json new file mode 100644 index 0000000000000000000000000000000000000000..27b1121dc39f76aa34e745ddd19be099dd6f3676 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.5.dev1/3338d63843deff76593f3d84514682d027ea1b76f25961369968d0a698b30250/8672676a3375e884cc27.json @@ -0,0 +1,62 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "meta-llama/Llama-3.3-70B-Instruct", + "_task": "text-generation", + "architectures": [ + "LlamaForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "dtype": "bfloat16", + "head_dim": 128, + "hidden_act": "silu", + "hidden_size": 8192, + "initializer_range": 0.02, + "intermediate_size": 28672, + "max_position_embeddings": 131072, + "mlp_bias": false, + "model_type": "llama", + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "batch_size": 1, + "capacity_factor": null, + "checkpoint_id": "meta-llama/Llama-3.3-70B-Instruct", + "checkpoint_revision": "6f6073b423013f6a7d4d9f39144961bfbfbc386b", + "continuous_batching": false, + "ep_degree": 1, + "fused_qkv": true, + "glu_mlp": true, + "local_ranks_size": 24, + "max_batch_size": 1, + "max_context_length": 16384, + "max_topk": 256, + "n_active_tokens": 16384, + "neuronxcc_version": "2.21.33363.0+82129205", + "on_device_sampling": true, + "optimum_neuron_version": "0.4.5.dev1", + "output_logits": false, + "pp_degree": 1, + "sequence_length": 16384, + "speculation_length": 0, + "start_rank_id": 0, + "target": "trn1", + "torch_dtype": "bfloat16", + "tp_degree": 24 + }, + "num_attention_heads": 64, + "num_hidden_layers": 80, + "num_key_value_heads": 8, + "pretraining_tp": 1, + "rms_norm_eps": 1e-05, + "rope_scaling": { + "factor": 8.0, + "high_freq_factor": 4.0, + "low_freq_factor": 1.0, + "original_max_position_embeddings": 8192, + "rope_type": "llama3" + }, + "rope_theta": 500000.0, + "tie_word_embeddings": false, + "use_cache": true, + "vocab_size": 128256 +} \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.5.dev1/llama/meta-llama/Llama-3.3-70B-Instruct/8672676a3375e884cc27.json b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.5.dev1/llama/meta-llama/Llama-3.3-70B-Instruct/8672676a3375e884cc27.json new file mode 100644 index 0000000000000000000000000000000000000000..27b1121dc39f76aa34e745ddd19be099dd6f3676 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.5.dev1/llama/meta-llama/Llama-3.3-70B-Instruct/8672676a3375e884cc27.json @@ -0,0 +1,62 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "meta-llama/Llama-3.3-70B-Instruct", + "_task": "text-generation", + "architectures": [ + "LlamaForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "dtype": "bfloat16", + "head_dim": 128, + "hidden_act": "silu", + "hidden_size": 8192, + "initializer_range": 0.02, + "intermediate_size": 28672, + "max_position_embeddings": 131072, + "mlp_bias": false, + "model_type": "llama", + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "batch_size": 1, + "capacity_factor": null, + "checkpoint_id": "meta-llama/Llama-3.3-70B-Instruct", + "checkpoint_revision": "6f6073b423013f6a7d4d9f39144961bfbfbc386b", + "continuous_batching": false, + "ep_degree": 1, + "fused_qkv": true, + "glu_mlp": true, + "local_ranks_size": 24, + "max_batch_size": 1, + "max_context_length": 16384, + "max_topk": 256, + "n_active_tokens": 16384, + "neuronxcc_version": "2.21.33363.0+82129205", + "on_device_sampling": true, + "optimum_neuron_version": "0.4.5.dev1", + "output_logits": false, + "pp_degree": 1, + "sequence_length": 16384, + "speculation_length": 0, + "start_rank_id": 0, + "target": "trn1", + "torch_dtype": "bfloat16", + "tp_degree": 24 + }, + "num_attention_heads": 64, + "num_hidden_layers": 80, + "num_key_value_heads": 8, + "pretraining_tp": 1, + "rms_norm_eps": 1e-05, + "rope_scaling": { + "factor": 8.0, + "high_freq_factor": 4.0, + "low_freq_factor": 1.0, + "original_max_position_embeddings": 8192, + "rope_type": "llama3" + }, + "rope_theta": 500000.0, + "tie_word_embeddings": false, + "use_cache": true, + "vocab_size": 128256 +} \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_01328268a19023ed0f24+f8e6d902/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_01328268a19023ed0f24+f8e6d902/model.hlo_module.pb index e1c7a90ca8e1b18d6f623143b55987c66f3a0976..910fb21ca78c9b5103637fe5ba28e6ecd2162ea9 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_01328268a19023ed0f24+f8e6d902/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_01328268a19023ed0f24+f8e6d902/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:8ef50e479badb0312e208336533316393fc797857eb5a2cde744753c266d7f3f +oid sha256:5a7be97d2012aa41b5f56bf5bf86357a0dae77fd27821fa3e0737aba2fe5521e size 97794 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_01328268a19023ed0f24+f8e6d902/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_01328268a19023ed0f24+f8e6d902/model.neff index e4bfe59d6155f39fb2dc7b02432b14d2efc62266..887c66d40f263958cddbd9115ba918fa59003dbf 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_01328268a19023ed0f24+f8e6d902/model.neff +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_01328268a19023ed0f24+f8e6d902/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:671f2968ee09229cb96bb22be152df8bd197829d6ce7ad77ef854a3963b716b9 +oid sha256:7ff6c1f2a8f76328f3ffd5cd9cbb7ad62552ac54af96be0b68b754f3e79f2c6e size 410624 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_03563a07b466ff1a7583+24129607/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_03563a07b466ff1a7583+24129607/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..836724f44545ce0dedda1521fd4c623a6ea8ec72 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_03563a07b466ff1a7583+24129607/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_03563a07b466ff1a7583+24129607/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_03563a07b466ff1a7583+24129607/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_03563a07b466ff1a7583+24129607/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_03563a07b466ff1a7583+24129607/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..1c0c5bd4738b8c097795c218feb6443ef6ed63bc --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_03563a07b466ff1a7583+24129607/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e445156b47032a190d83fc2c046434ceebaf6955ca33f5225b018b68f9d2c21 +size 464761 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_03563a07b466ff1a7583+24129607/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_03563a07b466ff1a7583+24129607/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..ec378fa6ca64ccf10e111d566464005796bcb14c --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_03563a07b466ff1a7583+24129607/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c2123c893919ee13fb7762a2640a6ec76d00052c62ea198a63100094cf2a075 +size 42363904 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_0a11d2377319957aa7b1+87e73322/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_0a11d2377319957aa7b1+87e73322/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..d08b4685aaf65dbeb01a27f6d42a6d395cfd43ad --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_0a11d2377319957aa7b1+87e73322/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--enable-saturate-infinity", "--auto-cast=none", "--model-type=transformer", "-O1", "--logfile=/tmp/nxdi_test_dc3e1bee-6524-447d-9446-272b95c584c4/compiler_workdir/DecoderLayerWrapper/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_0a11d2377319957aa7b1+87e73322/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_0a11d2377319957aa7b1+87e73322/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_0a11d2377319957aa7b1+87e73322/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_0a11d2377319957aa7b1+87e73322/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..f1741924eff22d4ff01845ba4c4fcdf856e561ee --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_0a11d2377319957aa7b1+87e73322/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5aada783fa65d42822de46cbe32345d5a69308162fb8bac9b5878183bb6f0812 +size 16322 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_0a11d2377319957aa7b1+87e73322/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_0a11d2377319957aa7b1+87e73322/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..7aca30d1619a9d5eb6488c54a918d6a50d774054 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_0a11d2377319957aa7b1+87e73322/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dea5db1d9f224ae63a2ac65d3c8a0fa794429d3bb9efeef01f2e344e6aee3af6 +size 154624 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_0a11d2377319957aa7b1+87e73322/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_0a11d2377319957aa7b1+87e73322/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..58d7d395210b1d0b6fb193557e09e6bf886ee25e --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_0a11d2377319957aa7b1+87e73322/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8ff8c72815d5f3128a219b592ebd8f67a72024d843966722abf90c530120a91 +size 159439 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_0cc2b44bb9cd283b1eeb+5c07cd07/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_0cc2b44bb9cd283b1eeb+5c07cd07/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..941164a3d3430701ce849f46463f3f70d42ce160 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_0cc2b44bb9cd283b1eeb+5c07cd07/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--enable-saturate-infinity", "--auto-cast=none", "--model-type=transformer", "-O1", "--logfile=/tmp/nxdi_test_c73e95e0-6203-4ae1-93e0-d723062123b7/compiler_workdir/DecoderLayerWrapper/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_0cc2b44bb9cd283b1eeb+5c07cd07/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_0cc2b44bb9cd283b1eeb+5c07cd07/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_0cc2b44bb9cd283b1eeb+5c07cd07/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_0cc2b44bb9cd283b1eeb+5c07cd07/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..d681207f945990d4e21e50b0e6b8e90d019cd7f0 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_0cc2b44bb9cd283b1eeb+5c07cd07/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:acc559309a214b16f3917edf6efe2b0ab578f048a6524f41ac73e1d625078b3e +size 14480 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_0cc2b44bb9cd283b1eeb+5c07cd07/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_0cc2b44bb9cd283b1eeb+5c07cd07/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..6d393187a6291dbaa27184ce990ff9acbfde7d48 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_0cc2b44bb9cd283b1eeb+5c07cd07/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d15f9bd70809a747570ff3bf0e24da12be5cd3c44f60c127defa9bd7bb555bb5 +size 267264 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_0cc2b44bb9cd283b1eeb+5c07cd07/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_0cc2b44bb9cd283b1eeb+5c07cd07/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..59c8f42b5d04428211a2b7b494c1e8ae343a4562 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_0cc2b44bb9cd283b1eeb+5c07cd07/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad55d35419702983604416a0663c8fe217a59867078d09197bab95def35e5b8a +size 272962 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_0e63a0b6e1742e1fdb32+24129607/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_0e63a0b6e1742e1fdb32+24129607/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..836724f44545ce0dedda1521fd4c623a6ea8ec72 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_0e63a0b6e1742e1fdb32+24129607/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_0e63a0b6e1742e1fdb32+24129607/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_0e63a0b6e1742e1fdb32+24129607/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_0e63a0b6e1742e1fdb32+24129607/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_0e63a0b6e1742e1fdb32+24129607/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..a175e30a8c2bcf6522f7c9f99b623ae52e6bc450 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_0e63a0b6e1742e1fdb32+24129607/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c59a9beb3152a126b4174162d5fa06e986ecc9ee9ce9634883d872b5a2157d2 +size 90122 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_0e63a0b6e1742e1fdb32+24129607/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_0e63a0b6e1742e1fdb32+24129607/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..78912220e60c83267b0bd66dc6394477054a264d --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_0e63a0b6e1742e1fdb32+24129607/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5e4bf77d4ab016388cc0f6f9729aad864a641f76101eb3cb74a17b6b25b9a5c +size 30977024 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_10907752543637211265+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_10907752543637211265+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_10907752543637211265+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_10907752543637211265+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_10907752543637211265+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_10907752543637211265+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_10907752543637211265+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..b90a86dc9847aa4694b1ae072a3a2d5a6c06a295 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_10907752543637211265+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b36a2c38093715f8f1064e95c504963c4eefb108483ea5177b7a9b67c594c14c +size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_10907752543637211265+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_10907752543637211265+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..05857a281a16252edfc671336951cf3143cea874 Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_10907752543637211265+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_11400907432531398953+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_11400907432531398953+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_11400907432531398953+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_11400907432531398953+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_11400907432531398953+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_11400907432531398953+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_11400907432531398953+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..ad2498cb3ccc8151ea047c432b2b66e2e625d32e --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_11400907432531398953+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1dcdc83733e2a421bdc65e593bd84b693b25114c7d871cc5383cf3ac18dbfdfb +size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_11400907432531398953+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_11400907432531398953+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..91d66f16cab01417f03cb68141cb534e3c471d76 Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_11400907432531398953+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_12324009378304635855+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_12324009378304635855+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_12324009378304635855+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_12324009378304635855+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_12324009378304635855+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_12324009378304635855+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_12324009378304635855+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..ef9826bc0f3be4cee030dba2d27589e70ab9646c --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_12324009378304635855+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c03b599abe1f3c2c4641cf7e8ff997574d293007a2321ba5af97b65b188e6b99 +size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_12324009378304635855+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_12324009378304635855+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..d98c76d93a56a5e20c58fcd99590b22d18f47a81 Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_12324009378304635855+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_12666804432653521811+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_12666804432653521811+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_12666804432653521811+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_12666804432653521811+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_12666804432653521811+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_12666804432653521811+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_12666804432653521811+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..600468f9199a6c583c50512a0beb464459827ee0 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_12666804432653521811+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7aec6718d215967d85935fe984b05d9b16246efecfec2137a2e30759d81c555 +size 1585 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_12666804432653521811+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_12666804432653521811+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..3d3cb71282f1878c8bc1cf58c47d706d8177b831 Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_12666804432653521811+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_13092192882592555392+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_13092192882592555392+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_13092192882592555392+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_13092192882592555392+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_13092192882592555392+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_13092192882592555392+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_13092192882592555392+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..f215ff53bd093fc485dd3a3e0493ecd1677d0e3d --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_13092192882592555392+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7e5e8627e554f6106efe00a9e5443edd528624611d8c29ec34ebbb98fc7d8d2 +size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_13092192882592555392+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_13092192882592555392+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..9ffe14c8c9aa9e52320b13760eb1c3f438fd0cfc Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_13092192882592555392+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_13129006844218143067+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_13129006844218143067+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_13129006844218143067+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_13129006844218143067+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_13129006844218143067+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_13129006844218143067+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_13129006844218143067+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..16a43cc54293e607a6255ad9da104a22d7521d04 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_13129006844218143067+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ac835add8ef9104a34341aa0f2a6c485e5ea7fb5e04bb187959e310c6ec0e14 +size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_13129006844218143067+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_13129006844218143067+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..48284eb792c98aa67cbc26bd9644d5b75a0ee03f Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_13129006844218143067+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_13163168066471565112+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_13163168066471565112+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_13163168066471565112+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_13163168066471565112+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_13163168066471565112+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_13163168066471565112+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_13163168066471565112+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..30a44c112a1e85be62e94865d7e39ea36faa66eb --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_13163168066471565112+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79ca38629b9bb8e54332a80e8e36748d843d502acfc7244cc95a320ec55b90c5 +size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_13163168066471565112+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_13163168066471565112+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..fc101a0aaec86df6f780f6d7ea7ce0e226d9e526 Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_13163168066471565112+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_13385766575326555678+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_13385766575326555678+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_13385766575326555678+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_13385766575326555678+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_13385766575326555678+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_13385766575326555678+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_13385766575326555678+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..d5170eb98150404cddea97e8dc3b154e7948f12c --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_13385766575326555678+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:175d7534042da2b21e67c22c6527992c0c5734601d3f8def1dccf42da367ec68 +size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_13385766575326555678+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_13385766575326555678+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..70df91ddb00894d7386c28d0bea946e1edfcf4a6 Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_13385766575326555678+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_1351bde3344f209ba8a1+24129607/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_1351bde3344f209ba8a1+24129607/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..836724f44545ce0dedda1521fd4c623a6ea8ec72 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_1351bde3344f209ba8a1+24129607/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_1351bde3344f209ba8a1+24129607/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_1351bde3344f209ba8a1+24129607/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_1351bde3344f209ba8a1+24129607/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_1351bde3344f209ba8a1+24129607/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..71d8f28725a6fd36067e26814a4ebfe648ca205e --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_1351bde3344f209ba8a1+24129607/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f7e20ba12250d08b854a76456fa2e4e0d6ddf13691e025257a2e3778525e023 +size 867147 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_1351bde3344f209ba8a1+24129607/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_1351bde3344f209ba8a1+24129607/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..3e106e70fad71397498cdf003f227ab6a0a0176e --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_1351bde3344f209ba8a1+24129607/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57b2ee4243bd8fe7035f1301940240484b1b2a18187aa6368723739798ce86d1 +size 11684864 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_13521002922414225272+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_13521002922414225272+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_13521002922414225272+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_13521002922414225272+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_13521002922414225272+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_13521002922414225272+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_13521002922414225272+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..332a53812f106f5bdc39c5328bc3416d9da5009f --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_13521002922414225272+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:733d0fb0b8a00ad2f86ce0d3202e2731f51e7a752e198b9b302678f8317ea9c2 +size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_13521002922414225272+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_13521002922414225272+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..08334f268e5efc243a714ea6ca9812d5c2a571b9 Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_13521002922414225272+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_137f98143cdeb07dab7d+a02c3a36/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_137f98143cdeb07dab7d+a02c3a36/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..5726abc7d1d8c52fa95bc7919439a23a23fe3b9a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_137f98143cdeb07dab7d+a02c3a36/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_137f98143cdeb07dab7d+a02c3a36/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_137f98143cdeb07dab7d+a02c3a36/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_137f98143cdeb07dab7d+a02c3a36/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_137f98143cdeb07dab7d+a02c3a36/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..a1b84944bd41f36506ece4afd68096d3271335d8 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_137f98143cdeb07dab7d+a02c3a36/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c3af8ccf676bfc9035f2832be64f2c64d4fb71e544ed4a55e45823227860db7 +size 863008 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_137f98143cdeb07dab7d+a02c3a36/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_137f98143cdeb07dab7d+a02c3a36/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..97145496307759fbce4f0e9df7fb9b2fc8e29687 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_137f98143cdeb07dab7d+a02c3a36/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db55af8b240e22fd8c6947d7fcf77d9db9951d7a854022ea5e1bcdc69b2e9e8c +size 5039104 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_137f98143cdeb07dab7d+a02c3a36/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_137f98143cdeb07dab7d+a02c3a36/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..1fd2fea9c23be1fc4e3259abc8b7f7fc32c29fbc --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_137f98143cdeb07dab7d+a02c3a36/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d12b0bd6935e99c2317788a98c688f30bccd28bc264c3e8886100cb709dfc68 +size 5205771 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_14024125047097359821+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_14024125047097359821+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_14024125047097359821+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_14024125047097359821+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_14024125047097359821+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_14024125047097359821+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_14024125047097359821+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..88d4c357148f8723e10ac1cf8dc5426b680eef5a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_14024125047097359821+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7730eb5b8602fc6d2d25c92d8624de4ee95d56509ce0c2d8adbf41a9d7b99ceb +size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_14024125047097359821+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_14024125047097359821+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..e42d054f5127fa958eccddff5ca10126152124c3 Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_14024125047097359821+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_14488951057292576015+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_14488951057292576015+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_14488951057292576015+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_14488951057292576015+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_14488951057292576015+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_14488951057292576015+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_14488951057292576015+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..d532e468ecceba150088a81cf4b534f83127347d --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_14488951057292576015+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f794d9b46f347a2c9779006b54197d244ac42cd282903d46a9ac1effbff35900 +size 1585 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_14488951057292576015+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_14488951057292576015+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..5436593e8c60ff93d9e29c9d733c009d19c2cd7d Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_14488951057292576015+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_14607415948795306857+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_14607415948795306857+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_14607415948795306857+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_14607415948795306857+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_14607415948795306857+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_14607415948795306857+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_14607415948795306857+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..a040628b2dd49b30b03c553a530c0e2c76d57bb3 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_14607415948795306857+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96a2ca6d1c617f569228e4c09d146226ca8d607049cc5b813b8b9d0e42ebbe63 +size 1585 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_14607415948795306857+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_14607415948795306857+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..202c6b8521a788a3e20ee0e54c339aaa6dcf0ef6 Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_14607415948795306857+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_15024025e6662a62c755+3da4118c/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_15024025e6662a62c755+3da4118c/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..a6b6e86fcf3a9dcc66da77a1686996cf6c5f2485 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_15024025e6662a62c755+3da4118c/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--enable-saturate-infinity", "--auto-cast=none", "--model-type=transformer", "-O1", "--logfile=/tmp/nxdi_test_fcce9440-6cfe-44be-b29b-556e9b41f4b5/compiler_workdir/DecoderLayerWrapper/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_15024025e6662a62c755+3da4118c/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_15024025e6662a62c755+3da4118c/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_15024025e6662a62c755+3da4118c/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_15024025e6662a62c755+3da4118c/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..8ce8199bda2f1ed5aa931fb578dc70e03ecb0fd0 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_15024025e6662a62c755+3da4118c/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5aac07a6d8f77b95a7886b293abbce6620a0056f9f0d69a3cb31d022f82483e +size 15848 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_15024025e6662a62c755+3da4118c/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_15024025e6662a62c755+3da4118c/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..c94ccb37812cb9697aabd7e7b477ac802cb01c96 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_15024025e6662a62c755+3da4118c/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23929ea58e25dd0fa8083385e36ea77a1c22ead42823f5065fda46f09096cd34 +size 267264 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_15024025e6662a62c755+3da4118c/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_15024025e6662a62c755+3da4118c/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..58bc119da9673db22943722bbf122eaa8d2cbba2 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_15024025e6662a62c755+3da4118c/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a1297c7781e71bc4908185a65b3c0d9ab5724ef370c5dbd4fa042a7972fa920 +size 272962 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_15104978417860996248+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_15104978417860996248+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_15104978417860996248+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_15104978417860996248+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_15104978417860996248+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_15104978417860996248+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_15104978417860996248+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..cedcae31cd2e003e183f6c87d0d439039ef8b01e --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_15104978417860996248+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8d761528ce6886a8b55d0c5ea938e8bedc2b6e7a1632afaae7f26549f37e571 +size 1369 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_15104978417860996248+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_15104978417860996248+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..cb2da8c4eace83c30ce7aab0077751bab7a157c3 Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_15104978417860996248+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_15195479995167874327+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_15195479995167874327+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_15195479995167874327+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_15195479995167874327+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_15195479995167874327+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_15195479995167874327+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_15195479995167874327+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..a57f719e018130b080aaa379975c88b7fb4bc4f2 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_15195479995167874327+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cac76d2035fb9d2728d0052857f47b57fdfac0d0fb43734a4806a5a5a4deaed5 +size 1582 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_15195479995167874327+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_15195479995167874327+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..eb727dbb5510b457d2390247c28550137146946f Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_15195479995167874327+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_15226158922329678840+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_15226158922329678840+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_15226158922329678840+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_15226158922329678840+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_15226158922329678840+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_15226158922329678840+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_15226158922329678840+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..06263c496303dad9352931d0f93b594ba1e4b5e6 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_15226158922329678840+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6da43c48a28ebcc7b93e066fd156567bdd942450f41f926a0294a6275097cfa1 +size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_15226158922329678840+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_15226158922329678840+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..9ac254bb0a0cc701348fca4bd839ab597c6b2b7c Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_15226158922329678840+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_15549583432468528942+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_15549583432468528942+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_15549583432468528942+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_15549583432468528942+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_15549583432468528942+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_15549583432468528942+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_15549583432468528942+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..d604ba392cf0e35823e332233d7b81e4b72c37be --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_15549583432468528942+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf03da6cc8efe76396a94a9ec2ab1e947e3aae3b2004650f06be02c1cb664237 +size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_15549583432468528942+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_15549583432468528942+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..6679d8da0f29a9f2fcfe7084549f4e8e1d6ef312 Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_15549583432468528942+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_16063773584643651549+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_16063773584643651549+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_16063773584643651549+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_16063773584643651549+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_16063773584643651549+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_16063773584643651549+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_16063773584643651549+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..7fcef3c41c0d6edeb3832dd09ad315e34d1c3b05 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_16063773584643651549+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3772c9b53cf2c833d0d1c07c90e6b645617324394ad76cd3936137a547c93adf +size 1144 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_16063773584643651549+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_16063773584643651549+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..c21c7d2e5f5c638059050ec12657584a9419c400 Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_16063773584643651549+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_16540141349946602462+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_16540141349946602462+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_16540141349946602462+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_16540141349946602462+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_16540141349946602462+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_16540141349946602462+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_16540141349946602462+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..c442d79bba92ba90bb790ec80c021d4af39c8a75 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_16540141349946602462+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b8e1780595d270fdec28ffa5135fd9fc122d81455077a5333563bb01065f9eb +size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_16540141349946602462+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_16540141349946602462+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..bff4e87e51aeab73ff3e42712722e9cc4eae3fe6 Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_16540141349946602462+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_1659424179484095552+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_1659424179484095552+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_1659424179484095552+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_1659424179484095552+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_1659424179484095552+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..a7e25eeb37121b478d999b750fbcd88e0bf27d24 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_1659424179484095552+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:394ead2842be9fad710a8dd2987593d6340a0f6bf739f2bb6bf829d1a65712b6 +size 1146 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_17037369046574255528+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_17037369046574255528+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_17037369046574255528+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_17037369046574255528+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_17037369046574255528+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_17037369046574255528+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_17037369046574255528+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..ebfeed2f0336a7c1b2cc132d29e93f0f47e0271c --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_17037369046574255528+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea6f95f6359e63ec8ab80994433ce28b0635e7041da26b6fcede717acc049264 +size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_17037369046574255528+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_17037369046574255528+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..658b5eac55a8a4c6bdab7cf22e4798dc7c570b56 Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_17037369046574255528+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_17162153672426857671+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_17162153672426857671+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_17162153672426857671+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_17162153672426857671+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_17162153672426857671+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_17162153672426857671+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_17162153672426857671+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..ff8cfe6fb48f24862061ffd1e69bb93e259f494b --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_17162153672426857671+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a955ad497f25e8cfbd39bcb81ffd84a6762f8808cf9be1033d56672fdf6f8d9e +size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_17162153672426857671+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_17162153672426857671+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..b289d48571ec771e4bebf5f8dfdbcf5c7938af25 Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_17162153672426857671+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_17184761711863280677+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_17184761711863280677+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_17184761711863280677+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_17184761711863280677+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_17184761711863280677+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_17184761711863280677+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_17184761711863280677+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..e8be5b68c75b45794bc5de7c2deca020c8a382cb --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_17184761711863280677+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3a1cab3ecba7a6f07cc3ee1cd169a5cdacda09119c1f16840b98b4578735cc0 +size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_17184761711863280677+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_17184761711863280677+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..a4aca912d0f68cf75f5af021bbe2e0e6326c1cf5 Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_17184761711863280677+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_17713911408407405055+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_17713911408407405055+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_17713911408407405055+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_17713911408407405055+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_17713911408407405055+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_17713911408407405055+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_17713911408407405055+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..1b9649878f68ec37ea7456352663f5ec0da487cd --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_17713911408407405055+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35d56233ecce04fbfae7d9f14fe4701e9080011d5ce4b5654ed54e146a5131e7 +size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_17713911408407405055+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_17713911408407405055+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..62c364c70b382ca4c02dc8d1a9c3c50ba2c04846 Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_17713911408407405055+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_17890aeca56402771161+24129607/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_17890aeca56402771161+24129607/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..836724f44545ce0dedda1521fd4c623a6ea8ec72 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_17890aeca56402771161+24129607/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_17890aeca56402771161+24129607/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_17890aeca56402771161+24129607/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..5aca66687848cb4b7ef807b5310d0619e74e90d6 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_17890aeca56402771161+24129607/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7dd81a812c89896646ccef219f594888f40effdb4037f39880ea712f66c7e11 +size 539300 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_17890aeca56402771161+24129607/model.log b/neuronxcc-2.21.33363.0+82129205/MODULE_17890aeca56402771161+24129607/model.log new file mode 100644 index 0000000000000000000000000000000000000000..2a9d62afd561c693f6e3da367780057686d856b1 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_17890aeca56402771161+24129607/model.log @@ -0,0 +1 @@ +Failed compilation with ['neuronx-cc', 'compile', '--framework=XLA', '/tmp/nxd_model/context_encoding/_tp0_bk0/model.MODULE_17890aeca56402771161+24129607.hlo_module.pb', '--output', '/tmp/nxd_model/context_encoding/_tp0_bk0/model.MODULE_17890aeca56402771161+24129607.neff', '--target=trn1', '--auto-cast=none', '--model-type=transformer', '--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ', '-O2', '--lnc=1', '--logfile=/tmp/nxd_model/context_encoding/_tp0_bk0/log-neuron-cc.txt', '--verbose=35']: \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_1837940185986854500+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_1837940185986854500+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_1837940185986854500+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_1837940185986854500+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_1837940185986854500+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_1837940185986854500+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_1837940185986854500+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..c13b24be1b411fb95f11aca98e792ec3ea448a84 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_1837940185986854500+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e73bcffc136d2dc217b7e571cf1e8f5fa55276d132fce5e1fa93e287f5af7f11 +size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_1837940185986854500+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_1837940185986854500+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..9f7d2dfc38d640fef68e686f85554e160ea78c28 Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_1837940185986854500+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_1870165519051566644+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_1870165519051566644+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_1870165519051566644+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_1870165519051566644+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_1870165519051566644+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_1870165519051566644+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_1870165519051566644+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..64c363347089b8883c973378fd169156b3d5d37f --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_1870165519051566644+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27439c189bb0cd81fadd20b58b5906d3ba31eb47fb16e84c9c4884fd47c96c86 +size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_1870165519051566644+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_1870165519051566644+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..0a59f8998776dad95a26ac1ef7078adbf6aae177 Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_1870165519051566644+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_1934c2fc93e7793f0aef+a02c3a36/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_1934c2fc93e7793f0aef+a02c3a36/model.hlo_module.pb index 7bce5095c949934184123fb96719ea53a2057667..2b843c21a9eca44a50823d9d159c8f60a770c4e3 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_1934c2fc93e7793f0aef+a02c3a36/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_1934c2fc93e7793f0aef+a02c3a36/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c6361b23631f22b3534873d4bc3fde1c4197b34dc2d5d84b8097108cc7faed45 +oid sha256:3ca0a9c8719d71e823180edfc6eba4a8842e74134383b6713cb51cd6134d5fb7 size 596952 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_1934c2fc93e7793f0aef+a02c3a36/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_1934c2fc93e7793f0aef+a02c3a36/model.neff index d9d3bb858681b0723bda25f49abcb33571303d5d..0552ae495415e2fcb5a2d07605f66ac6f209b512 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_1934c2fc93e7793f0aef+a02c3a36/model.neff +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_1934c2fc93e7793f0aef+a02c3a36/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:0be47707e53a60759826fc077df760c768f27f3699574a1ca42a2c1721ac66bc +oid sha256:81f3a436a6014e92728a2af8e77d0d85eabeb5f40ccf61c11b4f0dcac0806751 size 1936384 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_1934c2fc93e7793f0aef+a02c3a36/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_1934c2fc93e7793f0aef+a02c3a36/wrapped_neff.hlo index b83454042532437969142d6d7309a8a4feca0510..38ac5374b75e241384b3ba0683ac74cddf771e5f 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_1934c2fc93e7793f0aef+a02c3a36/wrapped_neff.hlo +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_1934c2fc93e7793f0aef+a02c3a36/wrapped_neff.hlo @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9e23e21a3d39349b0a3b066fd29eb841c6bb9dba1fde90c7a0792c5717638a18 +oid sha256:c3ec97e51a42515c9ce13acbfba6965d41f7e0554d97ca9f9ab94caebd61aaa5 size 2092575 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_1944f672afeaa6480c61+24129607/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_1944f672afeaa6480c61+24129607/model.hlo_module.pb index 57b324cfac621f09e5b76754f3064d2bd3d88a50..2f9624c1eefa19fab1b31fc6f0b11744b23cfe6a 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_1944f672afeaa6480c61+24129607/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_1944f672afeaa6480c61+24129607/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b77f0fd54de2b3f0e4d80ee388867e6ab1f396c5fd6c14be411f63d198649118 +oid sha256:21b1204a4001c8a692290e9265478a1dbf162d41df0bba52b580fd22ab3a8735 size 865460 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_1944f672afeaa6480c61+24129607/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_1944f672afeaa6480c61+24129607/model.neff index 5bc62ccff49928f839b0e38f0104812d45543b92..0a56f967b5ef928fce83c9cedd5f39e67b48abf7 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_1944f672afeaa6480c61+24129607/model.neff +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_1944f672afeaa6480c61+24129607/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:bc4ee4b8b64d4dc6330fdd8fae2947adf4f88ba10b2505b8b51907e13863538d +oid sha256:8e245ced68ece76c2e986e8d3bd5daf8aa2cb73ddc6d8aa87dfdf32196593303 size 36148224 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_1b7d34902916e968eb1d+af8e51ae/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_1b7d34902916e968eb1d+af8e51ae/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..cc4abea2a1b942a97dfae129550d14e42dc122f9 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_1b7d34902916e968eb1d+af8e51ae/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--enable-saturate-infinity", "--auto-cast=none", "--model-type=transformer", "-O1", "--logfile=/tmp/nxdi_test_77bcc32d-0acb-45e8-a7cc-8c888e51b310/compiler_workdir/DecoderLayerWrapper/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_1b7d34902916e968eb1d+af8e51ae/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_1b7d34902916e968eb1d+af8e51ae/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_1b7d34902916e968eb1d+af8e51ae/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_1b7d34902916e968eb1d+af8e51ae/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..eb128384081972f3d54bbeb0879607f8625c73d5 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_1b7d34902916e968eb1d+af8e51ae/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a088876f20bbab318478dbed556fcbd544ccdfe018b0dd561cf82bbb59f4bd9 +size 15848 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_1b7d34902916e968eb1d+af8e51ae/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_1b7d34902916e968eb1d+af8e51ae/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..7a286864152493173ab7ffdbf309fdb78538805a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_1b7d34902916e968eb1d+af8e51ae/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3667ee3f5c2862bb3281975c4e6a9a9027810f1cc9b224d1e75d81464ff9acbe +size 830464 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_1b7d34902916e968eb1d+af8e51ae/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_1b7d34902916e968eb1d+af8e51ae/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..e3815bb113aa39acf5294c256bc6aa98a8c87f0d --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_1b7d34902916e968eb1d+af8e51ae/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad8116384c4689bc55341707a67991727a7e6a5ddc7242bae4b0d2f44b1cd515 +size 836176 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_1d4bedf0c37a53b47737+a02c3a36/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_1d4bedf0c37a53b47737+a02c3a36/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..5726abc7d1d8c52fa95bc7919439a23a23fe3b9a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_1d4bedf0c37a53b47737+a02c3a36/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_1d4bedf0c37a53b47737+a02c3a36/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_1d4bedf0c37a53b47737+a02c3a36/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_1d4bedf0c37a53b47737+a02c3a36/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_1d4bedf0c37a53b47737+a02c3a36/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..3b28dfdd4b213537b2dea5c6bcc967e9c9762156 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_1d4bedf0c37a53b47737+a02c3a36/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d61ac2165fde7772e8d3035b0f89b50beec5e0d305548cbacc624eefa9452d3 +size 82753 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_1d4bedf0c37a53b47737+a02c3a36/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_1d4bedf0c37a53b47737+a02c3a36/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..775f26b82b7b93dbbc4a2485d6d80f45279f1955 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_1d4bedf0c37a53b47737+a02c3a36/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46ba68c0aadd4763eb642e9c19a4cc1d146805bf9f246e0e641bb2e390e292dc +size 277504 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_1d4bedf0c37a53b47737+a02c3a36/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_1d4bedf0c37a53b47737+a02c3a36/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..89b50330d84cc96c864680444f956454d55a1fd9 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_1d4bedf0c37a53b47737+a02c3a36/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5bc467900543a33abd00bdb0231e3abf9d59ce0ee85e2dc7dda90fe7684a866d +size 285854 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_1de326760d7a62df783b+a02c3a36/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_1de326760d7a62df783b+a02c3a36/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..5726abc7d1d8c52fa95bc7919439a23a23fe3b9a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_1de326760d7a62df783b+a02c3a36/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_1de326760d7a62df783b+a02c3a36/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_1de326760d7a62df783b+a02c3a36/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_1de326760d7a62df783b+a02c3a36/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_1de326760d7a62df783b+a02c3a36/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..b06919896ca29f3debbf14d63bc79f82062b224e --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_1de326760d7a62df783b+a02c3a36/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea9bfb02971151b32a96661dd179e4988ddc1c5e8abc764f2b2b6de65dc6c558 +size 65413 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_1de326760d7a62df783b+a02c3a36/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_1de326760d7a62df783b+a02c3a36/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..1da6077106cbb71cc48c5803329620ee0d098c58 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_1de326760d7a62df783b+a02c3a36/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d91fbc0d530dddf34e6b4111be7a31d724944f20be2657f28e145ecc24ed0db3 +size 707584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_1de326760d7a62df783b+a02c3a36/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_1de326760d7a62df783b+a02c3a36/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..49f31e60a591ff07326baddbbd9458661798ecd4 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_1de326760d7a62df783b+a02c3a36/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc038fa331f25b43feca0259115f57fb745f2095bc66b161821869781b15d76c +size 713927 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_20ded251b25e18aad5b0+24129607/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_20ded251b25e18aad5b0+24129607/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..836724f44545ce0dedda1521fd4c623a6ea8ec72 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_20ded251b25e18aad5b0+24129607/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_20ded251b25e18aad5b0+24129607/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_20ded251b25e18aad5b0+24129607/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_20ded251b25e18aad5b0+24129607/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_20ded251b25e18aad5b0+24129607/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..0976a343019ccf01ea1d9c1c819850344b771e59 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_20ded251b25e18aad5b0+24129607/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c58abb644d9362c99fa166606676a8dc86a64eb8676a59269c70083ad0e2ebad +size 504323 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_20ded251b25e18aad5b0+24129607/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_20ded251b25e18aad5b0+24129607/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..dd1a644afcb2c296d9d634ad5d1edf8aa25f5642 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_20ded251b25e18aad5b0+24129607/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a3ba0eb6e1df08cbffca30403208d7bc01a9dbf90456333ab4e02f7ff41d3a7 +size 42148864 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_21ce3b68a9e0797a477c+24129607/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_21ce3b68a9e0797a477c+24129607/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..836724f44545ce0dedda1521fd4c623a6ea8ec72 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_21ce3b68a9e0797a477c+24129607/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_21ce3b68a9e0797a477c+24129607/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_21ce3b68a9e0797a477c+24129607/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_21ce3b68a9e0797a477c+24129607/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_21ce3b68a9e0797a477c+24129607/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..c1ae2358157aaab2b04c830234bf17254555a320 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_21ce3b68a9e0797a477c+24129607/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19ef9c0e229d0180ad66410bc6ac1f944992aeea7ca7b4c53b152b5673be3ca4 +size 66855 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_21ce3b68a9e0797a477c+24129607/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_21ce3b68a9e0797a477c+24129607/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..c98fc01cb9e9f1c08038109b4c7ed1ec683a3a2c --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_21ce3b68a9e0797a477c+24129607/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93a992e2d9933efc2937e7635a1d54b89f50b5ed6249429c0bc4d6f904ad1f28 +size 52132864 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_2240472231266337587+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_2240472231266337587+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_2240472231266337587+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_2240472231266337587+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_2240472231266337587+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_2240472231266337587+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_2240472231266337587+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..5d0db9e7ecf490acae5d2a08a556d5a3cc486071 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_2240472231266337587+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50c3e59a5961d2e35404f090b0648874d10a8a12721fc9dd980ac5820c26f740 +size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_2240472231266337587+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_2240472231266337587+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..a1c4aca4fd8e65bbb5442296997f14abb45d7c48 Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_2240472231266337587+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_2241641840113569106+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_2241641840113569106+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_2241641840113569106+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_2241641840113569106+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_2241641840113569106+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_2241641840113569106+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_2241641840113569106+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..cc1ce00e7cb09d68985412c4119709cc94b76c5d --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_2241641840113569106+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccf86c59544ce69a4001c6270629b4619f4d42e402dedfa2d9963f7d82455d3e +size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_2241641840113569106+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_2241641840113569106+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..644dc6570565f8dd403f0028480c4e668d09e347 Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_2241641840113569106+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_2447413629898598397+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_2447413629898598397+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_2447413629898598397+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_2447413629898598397+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_2447413629898598397+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_2447413629898598397+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_2447413629898598397+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..d4ca017054b56947e59148088abb2ea6b4219f68 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_2447413629898598397+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ced77d6c5df1c8b63db687bdee8b798902c7c2c383f1d0ae937d1eb2857ae5f +size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_2447413629898598397+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_2447413629898598397+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..6fba7d7caae4ace9cce45e1d55e1196d62bac497 Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_2447413629898598397+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_2477619772153140591+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_2477619772153140591+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_2477619772153140591+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_2477619772153140591+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_2477619772153140591+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_2477619772153140591+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_2477619772153140591+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..58b0ab2cf034398af2b01f8b3fa5220ae75a8817 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_2477619772153140591+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:912d560b87afecd94116a1c9905e4c2cc4d87bbbacef231ac77ccf50af3c6d57 +size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_2477619772153140591+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_2477619772153140591+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..016089fa8b101d8d371a41d6e3e4fe91a489ddba Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_2477619772153140591+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_2505e14f043060847cbf+a02c3a36/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_2505e14f043060847cbf+a02c3a36/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..5726abc7d1d8c52fa95bc7919439a23a23fe3b9a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_2505e14f043060847cbf+a02c3a36/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_2505e14f043060847cbf+a02c3a36/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_2505e14f043060847cbf+a02c3a36/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_2505e14f043060847cbf+a02c3a36/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_2505e14f043060847cbf+a02c3a36/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..a5732d6426d493a5db46a424d6bcb66da68236bd --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_2505e14f043060847cbf+a02c3a36/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:403bd670698dd551b1f54d7e1a1c2143d031a7be9909884fa14376fd54706394 +size 64866 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_2505e14f043060847cbf+a02c3a36/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_2505e14f043060847cbf+a02c3a36/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..a6c86070f60ca7a17b7a614ac833ced24c58e5fb --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_2505e14f043060847cbf+a02c3a36/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f49d86b8f770493b29d42b4847f9ec724aeef7f0bd49605f01ef3de641e850f1 +size 697344 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_2505e14f043060847cbf+a02c3a36/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_2505e14f043060847cbf+a02c3a36/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..054f95bea2df0d473590181938b3173a1612d3cd --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_2505e14f043060847cbf+a02c3a36/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b434ea3a7bbd686e206ea179e2de7a35b33a7f180c0d9472ae6bfd8c0209542a +size 703687 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_250ecf58b3a2e7ac5757+24129607/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_250ecf58b3a2e7ac5757+24129607/model.hlo_module.pb index 2454aac239b8ec369102b0184785d212d54d5a33..ca9bae0de2f377eb55116ac5ffac7016164602ea 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_250ecf58b3a2e7ac5757+24129607/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_250ecf58b3a2e7ac5757+24129607/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c1c161937d0eeeb2eca0dfcca2535ee497d38d1e83b3dbc45f21ccf5a0100888 +oid sha256:329e621507127750dc610f95907a7e901219e2f34aaef4c17d140feef4a6c579 size 1061093 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_250ecf58b3a2e7ac5757+24129607/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_250ecf58b3a2e7ac5757+24129607/model.neff index 20ddb57879805fbb4d393d858b69286efb35950a..3e1feb5f78b53c3696f5f0308c66aa2185433a9e 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_250ecf58b3a2e7ac5757+24129607/model.neff +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_250ecf58b3a2e7ac5757+24129607/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:af2c4a236a1f97d56e0840ca8099bf268c1fad8b15295cae8f906ae0c5534a0b +oid sha256:91ba54a6131873512c8412ed7a9972adca35b2f18f36e528de0b048bc3c788de size 9473024 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_2672b897bf6327bea9e4+24129607/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_2672b897bf6327bea9e4+24129607/model.hlo_module.pb index d396e291c54b3b1e1c83a9761d827ea5c2b5a5a3..a151e0db66c9936e4eb4c88ec4b2d7c748e10e2d 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_2672b897bf6327bea9e4+24129607/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_2672b897bf6327bea9e4+24129607/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:6b56b0d331077542e72e5da19741dfcd8d5d6bdd01d35c1cdbe74227327956a6 +oid sha256:b4b6486a12378501e2484cf81b9f6885eabca76a7d817e3e2041c1736bac16d7 size 82772 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_2672b897bf6327bea9e4+24129607/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_2672b897bf6327bea9e4+24129607/model.neff index 24f815ffa5bd57a7edac132c9d55d934ee370402..cb31650fc005c2de4ee977a846b33ff3a5fb7cb3 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_2672b897bf6327bea9e4+24129607/model.neff +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_2672b897bf6327bea9e4+24129607/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d1cd6ca36926fad065cd480b6e705f247170aeb533426465d808212c1b7a5123 +oid sha256:1c65b6b3a5f7c34ae231694981cf76347fb89393c25990695cd4f921f3d243e3 size 267264 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_26fe13069f0a9e99f32e+24129607/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_26fe13069f0a9e99f32e+24129607/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..836724f44545ce0dedda1521fd4c623a6ea8ec72 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_26fe13069f0a9e99f32e+24129607/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_26fe13069f0a9e99f32e+24129607/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_26fe13069f0a9e99f32e+24129607/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_26fe13069f0a9e99f32e+24129607/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_26fe13069f0a9e99f32e+24129607/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..6d7c001aea0ee8f01fe55ed670a32916914bf996 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_26fe13069f0a9e99f32e+24129607/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d4eaa3b3636adb612756e70dfef8afbc4ae0afbe8e04560c301a49ea2f074e9 +size 522818 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_26fe13069f0a9e99f32e+24129607/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_26fe13069f0a9e99f32e+24129607/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..6ef2037d9899a85e96698720f5fa547e3cfb1eef --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_26fe13069f0a9e99f32e+24129607/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d91e651714d7de678fd08630a5ce061d23e0e844226052a2d59c02b76945b06d +size 50187264 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_2a2a4bab1649c00a577f+a02c3a36/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_2a2a4bab1649c00a577f+a02c3a36/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..5726abc7d1d8c52fa95bc7919439a23a23fe3b9a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_2a2a4bab1649c00a577f+a02c3a36/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_2a2a4bab1649c00a577f+a02c3a36/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_2a2a4bab1649c00a577f+a02c3a36/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_2a2a4bab1649c00a577f+a02c3a36/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_2a2a4bab1649c00a577f+a02c3a36/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..d85a11d96a32147eadc611ac8bedd51c08839f42 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_2a2a4bab1649c00a577f+a02c3a36/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5150397c2f48112ac596401fd4cafae86f937eb96f16e06a9c38fec3bba7cc87 +size 450713 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_2a2a4bab1649c00a577f+a02c3a36/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_2a2a4bab1649c00a577f+a02c3a36/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..a4b09f8aab9af7df9e5aec257b62fef422e5f707 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_2a2a4bab1649c00a577f+a02c3a36/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49fa72e7d69d8698538f163e35389b37a659f7910121f9b7c075a1d9696edde0 +size 3083264 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_2a2a4bab1649c00a577f+a02c3a36/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_2a2a4bab1649c00a577f+a02c3a36/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..0801f8fd466a8c50579777fd65a77d5540b7e1c8 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_2a2a4bab1649c00a577f+a02c3a36/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9c542fe43d7702def7f7bc1111d3ad41d74aa2d4f37adf0582ed1f88dfd9622 +size 3157365 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_2a8eca8e0378831dfed0+f9f8d9f2/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_2a8eca8e0378831dfed0+f9f8d9f2/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..bec002fcd624dd50c22a4e2add187dd45708d5f9 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_2a8eca8e0378831dfed0+f9f8d9f2/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--enable-saturate-infinity", "--auto-cast=none", "--model-type=transformer", "-O1", "--logfile=/tmp/nxdi_test_812078a8-d4d8-4318-89fc-4adea56cef02/compiler_workdir/DecoderLayerWrapper/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_2a8eca8e0378831dfed0+f9f8d9f2/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_2a8eca8e0378831dfed0+f9f8d9f2/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_2a8eca8e0378831dfed0+f9f8d9f2/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_2a8eca8e0378831dfed0+f9f8d9f2/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..ff879eded7ec91ff4fc07b77e19994b215d22744 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_2a8eca8e0378831dfed0+f9f8d9f2/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e42bcbe7948f4d8cc240e37d6cb16249ae4adb96e4b00d85102f32851af7535f +size 21842 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_2a8eca8e0378831dfed0+f9f8d9f2/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_2a8eca8e0378831dfed0+f9f8d9f2/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..2a1ba8b7d7cb78d07b5c907ad54ae7a9ffbbce37 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_2a8eca8e0378831dfed0+f9f8d9f2/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f6f498ac8eb126d70c7bec3622859ac4c0ca5188f2d5e1d006c6f4e45c1ad45 +size 13507584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_2a8eca8e0378831dfed0+f9f8d9f2/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_2a8eca8e0378831dfed0+f9f8d9f2/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..42662ad1579d78cc9fc945b5aa351be523f71a0e --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_2a8eca8e0378831dfed0+f9f8d9f2/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af615d24a3366b0c55e609f2507b0b880e8bd5b8d50070cbabd170867c318255 +size 13513141 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_2be35f469d98437fb988+a02c3a36/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_2be35f469d98437fb988+a02c3a36/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..5726abc7d1d8c52fa95bc7919439a23a23fe3b9a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_2be35f469d98437fb988+a02c3a36/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_2be35f469d98437fb988+a02c3a36/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_2be35f469d98437fb988+a02c3a36/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_2be35f469d98437fb988+a02c3a36/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_2be35f469d98437fb988+a02c3a36/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..3787ab6f1dbf7ef691456dd915553c0dcfeea6ec --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_2be35f469d98437fb988+a02c3a36/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33c0d924980adacf53be00ecc8defacb9d9e79a2cdfdeab4ae1e821ce9807fa3 +size 431007 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_2be35f469d98437fb988+a02c3a36/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_2be35f469d98437fb988+a02c3a36/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..19a6aec47a0cb28a3adefdbf20d7631fc4a499cd --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_2be35f469d98437fb988+a02c3a36/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6733b1c6e5d7436be5e6d2e1dfc0989b1f168c5e8d584e3ea940a8f42a25b7e +size 3134464 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_2be35f469d98437fb988+a02c3a36/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_2be35f469d98437fb988+a02c3a36/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..2a73a358bcba83766fd64762c7004c14b88ac649 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_2be35f469d98437fb988+a02c3a36/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4e27ca52b81b4bf465a499ec0bfc28d44a4c2156661892476b4454342c6a4bf +size 3208708 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_2facf9e355669579de43+24129607/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_2facf9e355669579de43+24129607/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..836724f44545ce0dedda1521fd4c623a6ea8ec72 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_2facf9e355669579de43+24129607/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_2facf9e355669579de43+24129607/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_2facf9e355669579de43+24129607/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_2facf9e355669579de43+24129607/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_2facf9e355669579de43+24129607/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..d46d455b93a77bf5263860c04d178d2e526d263e --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_2facf9e355669579de43+24129607/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74c34d10a1c301c387d1a81f13e046ec5c328450b36a1433688985ba53cdafa9 +size 61748 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_2facf9e355669579de43+24129607/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_2facf9e355669579de43+24129607/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..6ce79e3a6442014bf19ef906758baa37d7077a42 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_2facf9e355669579de43+24129607/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fab16ac6ff7661d9ce5297889945988be8d1cf5b8350af8eafc3a1202c1adf00 +size 1383424 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_313c4e4e44b74c64a01a+a02c3a36/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_313c4e4e44b74c64a01a+a02c3a36/model.neff index 4f809cd67362761109ea5e7b0fd40f064284f87d..f180a3ac59042bcbaf0a9707591c35c3c9adc5cd 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_313c4e4e44b74c64a01a+a02c3a36/model.neff +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_313c4e4e44b74c64a01a+a02c3a36/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:e5477d813971bbd860779e46013216672c82d9307c9018cdd6df9a2cbdc45dbf +oid sha256:1c9ce6e5dbe86ee5e3ee3af585888bf707419b3429fbbe6715735f2e750e7186 size 3503104 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_313c4e4e44b74c64a01a+a02c3a36/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_313c4e4e44b74c64a01a+a02c3a36/wrapped_neff.hlo index 0703f5fb9fc7eedd8cb588bd5d8f693b8777e87c..4c48fe14bbfd7f045878e6b908c13c843acbdeb3 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_313c4e4e44b74c64a01a+a02c3a36/wrapped_neff.hlo +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_313c4e4e44b74c64a01a+a02c3a36/wrapped_neff.hlo @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:f4231b25c02fede81b37a9b22d913b0989eaf5281d447b2a9f30304db4c3527d +oid sha256:18bbd8164abb30f44a7b3893042bab4ff76c686ef675f41461bcc30dd730315b size 3640161 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_31e31b6f47afb89b553b+bafdbdde/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_31e31b6f47afb89b553b+bafdbdde/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..5a228a7a4cc7c7df9e8b4887d22dcd862c2f60f3 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_31e31b6f47afb89b553b+bafdbdde/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2", "-O1", "--lnc=1", "--enable-saturate-infinity", "--enable-mixed-precision-accumulation", "--internal-enable-dge-levels=vector_dynamic_offsets", "--internal-hlo2tensorizer-options=--verify-hlo=true", "--logfile=/tmp/nxd_model/token_generation/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_31e31b6f47afb89b553b+bafdbdde/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_31e31b6f47afb89b553b+bafdbdde/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_31e31b6f47afb89b553b+bafdbdde/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_31e31b6f47afb89b553b+bafdbdde/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..034b3692dbedbb2c3dc57e51f7235a13ff251cc9 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_31e31b6f47afb89b553b+bafdbdde/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:061213de218a73c7d090fd093562e9c08718438de6287e6a332372c8f7906930 +size 70276 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_31e31b6f47afb89b553b+bafdbdde/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_31e31b6f47afb89b553b+bafdbdde/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..0f74f5d3bf8893db7c6f48efe0d992d770b23b52 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_31e31b6f47afb89b553b+bafdbdde/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e64780612d32c890d4c7d297248e064089d8ef4f8a9f9d5a9a1c169c6421ec29 +size 277504 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_31e31b6f47afb89b553b+bafdbdde/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_31e31b6f47afb89b553b+bafdbdde/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..0d9c94e8f0f71749a41037666f977c6ef332a510 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_31e31b6f47afb89b553b+bafdbdde/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54d1ec39550a8bb2e6e192265b3fed7b4a12065b0c8d82456a918f7a5be1e4ae +size 289571 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_31e31b6f47afb89b553b+da15b874/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_31e31b6f47afb89b553b+da15b874/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..c3fb8c073852fb04e7ae88fd2592978716b60eeb --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_31e31b6f47afb89b553b+da15b874/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2", "-O1--lnc=1", "--enable-saturate-infinity", "--enable-mixed-precision-accumulation", "--internal-enable-dge-levels=vector_dynamic_offsets", "--internal-hlo2tensorizer-options=--verify-hlo=true", "--logfile=/tmp/nxd_model/token_generation/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_31e31b6f47afb89b553b+da15b874/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_31e31b6f47afb89b553b+da15b874/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..2117dab3e3ed8caad749b8256ab430c591d3b72a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_31e31b6f47afb89b553b+da15b874/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec57d9d2f9d9be197ad88a58ece6b14b0ccab97c121b8d20cc9512558ddf6562 +size 70276 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_31e31b6f47afb89b553b+da15b874/model.log b/neuronxcc-2.21.33363.0+82129205/MODULE_31e31b6f47afb89b553b+da15b874/model.log new file mode 100644 index 0000000000000000000000000000000000000000..f25bdb6bbd823e002119a606100d83dd796b7d08 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_31e31b6f47afb89b553b+da15b874/model.log @@ -0,0 +1,5 @@ +Failed compilation with ['neuronx-cc', 'compile', '--framework=XLA', '/tmp/nxd_model/token_generation/_tp0_bk0/model.MODULE_31e31b6f47afb89b553b+da15b874.hlo_module.pb', '--output', '/tmp/nxd_model/token_generation/_tp0_bk0/model.MODULE_31e31b6f47afb89b553b+da15b874.neff', '--target=trn1', '--auto-cast=none', '--model-type=transformer', '--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2', '-O1--lnc=1', '--enable-saturate-infinity', '--enable-mixed-precision-accumulation', '--internal-enable-dge-levels=vector_dynamic_offsets', '--internal-hlo2tensorizer-options=--verify-hlo=true', '--logfile=/tmp/nxd_model/token_generation/_tp0_bk0/log-neuron-cc.txt', '--enable-internal-neff-wrapper', '--verbose=35']: neuronx-cc compile: argument --optlevel/-O: invalid choice: 1--lnc=1 (choose from 1, 2, 3) +usage: neuronx-cc compile --framework {XLA} --target {trn1,inf2,trn1n,trn2,trn2n} [--logical-nc-config {1,2}] [--enable-fast-loading-neuron-binaries] [--enable-fast-context-switch] + [--auto-cast ] [--auto-cast-type {fp16,bf16,tf32,fp8_e4m3}] [--output ] [--optlevel {1,2,3}] [--help] + [--model-type {transformer,unet-inference,generic}] [--distribution-strategy {fsdp,nemo,llm-training,generic}] [--enable-dge] + [--verbose {debug|info|warning|user|off}] [--logfile ] [--logfile-verbose {debug|info|warning|user}] diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_32a1f486b38c93d2cf79+aefc65cb/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_32a1f486b38c93d2cf79+aefc65cb/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..c5952e088416a39a69306c916805c51af6791f67 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_32a1f486b38c93d2cf79+aefc65cb/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--enable-saturate-infinity", "--auto-cast=none", "--model-type=transformer", "-O1", "--logfile=/tmp/nxdi_test_5710ae5f-9607-4686-8ff0-ea79d5a044f9/compiler_workdir/DecoderLayerWrapper/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_32a1f486b38c93d2cf79+aefc65cb/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_32a1f486b38c93d2cf79+aefc65cb/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_32a1f486b38c93d2cf79+aefc65cb/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_32a1f486b38c93d2cf79+aefc65cb/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..a852e97890f4515eb815fe58fdd223424595647c --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_32a1f486b38c93d2cf79+aefc65cb/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d81d4f270c9fdb31b731b1d9ccd66a9862aaeb87b9a21cd08c180306f8ad8baa +size 22067 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_32a1f486b38c93d2cf79+aefc65cb/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_32a1f486b38c93d2cf79+aefc65cb/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..228f8711af4c6f5159955c26a2d36c0e42b638f0 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_32a1f486b38c93d2cf79+aefc65cb/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0356039895590074cabcb72fc03b812aba1dcab8ab36df8c9a1ae048108bc1a +size 45251584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_32a1f486b38c93d2cf79+aefc65cb/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_32a1f486b38c93d2cf79+aefc65cb/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..e25f1a62bc1eff158d78288ae24357114a244a4f --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_32a1f486b38c93d2cf79+aefc65cb/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9384dd4822184baaa34c79a9975c246aeef6c8ad6e78e6e08e930cf7020b5f86 +size 45257152 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_35a63695aeefa2d44798+24129607/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_35a63695aeefa2d44798+24129607/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..836724f44545ce0dedda1521fd4c623a6ea8ec72 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_35a63695aeefa2d44798+24129607/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_35a63695aeefa2d44798+24129607/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_35a63695aeefa2d44798+24129607/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_35a63695aeefa2d44798+24129607/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_35a63695aeefa2d44798+24129607/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..e4b079abea0f82423ab2605e3d2e8fdcaeec1d47 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_35a63695aeefa2d44798+24129607/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:996734e9b61410c29a1dec6e20faca089cdc9e6f6d1ed6361c1cdc1ebf79de20 +size 439084 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_35a63695aeefa2d44798+24129607/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_35a63695aeefa2d44798+24129607/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..4e7baaa4c5b1e285fb139a71985cf649d607a491 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_35a63695aeefa2d44798+24129607/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fdcb29853ebd5b5be6ccc9f14b429ed3911423c1b9ee98ee9e5e1491e989c8df +size 31325184 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_3742470769527135970+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_3742470769527135970+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_3742470769527135970+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_3742470769527135970+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_3742470769527135970+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_3742470769527135970+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_3742470769527135970+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..0144f7524b44832ee3b9b97df32c513be07b762a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_3742470769527135970+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9f2d2d1e1238756da7acab6abca4cdd1f5ea3123f8be4870d733f60b2b16117 +size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_3742470769527135970+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_3742470769527135970+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..e39f6e7f619aaf57312dbbf04574033786189700 Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_3742470769527135970+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_3c75648f1b6d85bd72d5+a02c3a36/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_3c75648f1b6d85bd72d5+a02c3a36/model.hlo_module.pb index 781ef29d24dabc23eb054215bc19b2abc3f419bb..eaa293b4f71a668dfd800b85378e442f16ff772e 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_3c75648f1b6d85bd72d5+a02c3a36/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_3c75648f1b6d85bd72d5+a02c3a36/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:6f113c10c77741cc08a19adc7d5e09e035a03a03d751dbefede3d51d70aa3a37 +oid sha256:43084b28c1eb1e4e35a8ce5107944cf673a708ff6fdcca63d8eb5db3610ddc9e size 426769 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_3c75648f1b6d85bd72d5+a02c3a36/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_3c75648f1b6d85bd72d5+a02c3a36/model.neff index 8b5e9b5929c041f51bc1955afc24d21acd9eecbb..3c1d4bb93e5fca421abf6d91fc90f3e8d828bef3 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_3c75648f1b6d85bd72d5+a02c3a36/model.neff +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_3c75648f1b6d85bd72d5+a02c3a36/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:6f6b941c15ed66c686b8acff2b452ead98bcf0a038a2569fb7a79463ea49703a +oid sha256:b8b2b09210453b06bb5291f939a26f54542cf10e5825b38365c7048649a22586 size 3073024 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_3c75648f1b6d85bd72d5+a02c3a36/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_3c75648f1b6d85bd72d5+a02c3a36/wrapped_neff.hlo index ddaba73d698a3c624e122b4d2fcbf3d56b483c5f..69a4ec3d18d5f7201c52266637ff1b0c20707812 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_3c75648f1b6d85bd72d5+a02c3a36/wrapped_neff.hlo +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_3c75648f1b6d85bd72d5+a02c3a36/wrapped_neff.hlo @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:3251669900d2348ad53608811a4ffc8d5adb276028f5b97a24b9dcb52014473d +oid sha256:0bf07a3c100d60a4846c9553cebcf878350a91cdc83b9e21f41497b5e29a9353 size 3147125 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_3d18caa8c6545b3526ee+24129607/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_3d18caa8c6545b3526ee+24129607/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..836724f44545ce0dedda1521fd4c623a6ea8ec72 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_3d18caa8c6545b3526ee+24129607/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_3d18caa8c6545b3526ee+24129607/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_3d18caa8c6545b3526ee+24129607/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..6f429d4f3167523c7e5b7dbe8a9ceb0bdb5ef393 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_3d18caa8c6545b3526ee+24129607/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c4696443fc792c790e4db6ef23dc6ce83740ba279e4a38fe67b7e9df14c7afc +size 61748 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_3d18caa8c6545b3526ee+24129607/model.log b/neuronxcc-2.21.33363.0+82129205/MODULE_3d18caa8c6545b3526ee+24129607/model.log new file mode 100644 index 0000000000000000000000000000000000000000..6e60c201aab0ec957bfd4919dc98fd2f81d7f0d4 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_3d18caa8c6545b3526ee+24129607/model.log @@ -0,0 +1 @@ +Failed compilation with ['neuronx-cc', 'compile', '--framework=XLA', '/tmp/nxd_model/context_encoding/_tp0_bk0/model.MODULE_3d18caa8c6545b3526ee+24129607.hlo_module.pb', '--output', '/tmp/nxd_model/context_encoding/_tp0_bk0/model.MODULE_3d18caa8c6545b3526ee+24129607.neff', '--target=trn1', '--auto-cast=none', '--model-type=transformer', '--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ', '-O2', '--lnc=1', '--logfile=/tmp/nxd_model/context_encoding/_tp0_bk0/log-neuron-cc.txt', '--verbose=35']: \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_415b25e4e1c1a1ab8cc6+a02c3a36/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_415b25e4e1c1a1ab8cc6+a02c3a36/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..5726abc7d1d8c52fa95bc7919439a23a23fe3b9a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_415b25e4e1c1a1ab8cc6+a02c3a36/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_415b25e4e1c1a1ab8cc6+a02c3a36/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_415b25e4e1c1a1ab8cc6+a02c3a36/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_415b25e4e1c1a1ab8cc6+a02c3a36/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_415b25e4e1c1a1ab8cc6+a02c3a36/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..d56c4afb41862f33e433c98cb072d925ee0e847a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_415b25e4e1c1a1ab8cc6+a02c3a36/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7071240a51ed314e5995b9f1702a28f7d6403edabea3f83ac63117b2b8575c94 +size 418008 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_415b25e4e1c1a1ab8cc6+a02c3a36/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_415b25e4e1c1a1ab8cc6+a02c3a36/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..5d5ce6101d8d69b980d3a0ef46b3f06df7034d6f --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_415b25e4e1c1a1ab8cc6+a02c3a36/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:712b59b369059677cc76a50ca3b5058cafe588d641a93fdf1cf06cd2a9161a7f +size 2315264 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_415b25e4e1c1a1ab8cc6+a02c3a36/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_415b25e4e1c1a1ab8cc6+a02c3a36/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..fdc2a7bf0de7a12e92fb2dd050e08fdcb378664a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_415b25e4e1c1a1ab8cc6+a02c3a36/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08461d638c78e562d0365be917d002ca16cdd440bade82cce4724ab1ef1690ea +size 2389365 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_4247663625e2eaeb4fab+a02c3a36/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_4247663625e2eaeb4fab+a02c3a36/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..5726abc7d1d8c52fa95bc7919439a23a23fe3b9a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_4247663625e2eaeb4fab+a02c3a36/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_4247663625e2eaeb4fab+a02c3a36/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_4247663625e2eaeb4fab+a02c3a36/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_4247663625e2eaeb4fab+a02c3a36/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_4247663625e2eaeb4fab+a02c3a36/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..fde266f24753492d595dbb2d9fbc88c2a3fa7f78 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_4247663625e2eaeb4fab+a02c3a36/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0c908a5ddbf03970315b73168cfd6d3b14f39328f2b700c5d1e9c4144323034 +size 91147 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_4247663625e2eaeb4fab+a02c3a36/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_4247663625e2eaeb4fab+a02c3a36/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..971ceabb2f757196d864f73d5bfed5da56e21f81 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_4247663625e2eaeb4fab+a02c3a36/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad22d482746dc393d9343d9b7855e8da2352e083b60b8627da2f1291a7ba960f +size 277504 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_4247663625e2eaeb4fab+a02c3a36/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_4247663625e2eaeb4fab+a02c3a36/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..a7c5e47b3cb90370430f202ccedb2dc411e99f54 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_4247663625e2eaeb4fab+a02c3a36/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d64528a98e0b9f958208d4b0fa5e55a5cd5026e6c04a9d2d5ee1e01bfcec393 +size 289031 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_42601fbe748660a77be0+24129607/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_42601fbe748660a77be0+24129607/model.hlo_module.pb index 8e197c567018eaadae5985e26111641ed208c2fb..d6ec8f50958e8d2e4ce15f18cddcde3d6e39eaba 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_42601fbe748660a77be0+24129607/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_42601fbe748660a77be0+24129607/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d007bb7f19dc61262140698229d888d0b068426fac10d9b9b91caf164ce03f62 +oid sha256:64694dab15395d5f9cbbf32f45ee8924868bc1c2e8052c947c86c68c533b0420 size 923430 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_42601fbe748660a77be0+24129607/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_42601fbe748660a77be0+24129607/model.neff index 02757a845d768b8e2a635157bcfbb1e8fcbbe156..f4a243064cdf6402784f67094405d26f78708214 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_42601fbe748660a77be0+24129607/model.neff +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_42601fbe748660a77be0+24129607/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:4afe796b0d005955e0e3c76c735b50c83ce7b5c0ca9c0cd5b76b031131b4f6e4 +oid sha256:1605afbb7b8dfa13b0d1ab9a10c86b98ac20a19d12cd861502b0974964a9627f size 5213184 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_437a9e154e0cc794398f+0da03933/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_437a9e154e0cc794398f+0da03933/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..9bc100211f66b009fd4618d869085e5eefcacdf9 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_437a9e154e0cc794398f+0da03933/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--enable-saturate-infinity", "--auto-cast=none", "--model-type=transformer", "-O1", "--logfile=/tmp/nxdi_test_f8046dd1-17f4-48f1-9db5-e72f948df6d4/compiler_workdir/DecoderLayerWrapper/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_437a9e154e0cc794398f+0da03933/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_437a9e154e0cc794398f+0da03933/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_437a9e154e0cc794398f+0da03933/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_437a9e154e0cc794398f+0da03933/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..93830a9e3c3ba8980fb309b3be9cf1a8cc9f0f8d --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_437a9e154e0cc794398f+0da03933/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7cb82e68653c0d69b83d4e680812efb7015c733fc863789b753dadd380599dcd +size 15848 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_437a9e154e0cc794398f+0da03933/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_437a9e154e0cc794398f+0da03933/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..45f13a3d37b03cc8d4b6bf504738f157c221b41a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_437a9e154e0cc794398f+0da03933/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34a8af1af3ec00a5602296f41b1a6c0be7e5e169b6b0ae3eb24759a29c761e36 +size 400384 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_437a9e154e0cc794398f+0da03933/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_437a9e154e0cc794398f+0da03933/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..cb543f4a6f1655c6b9a8ad5ac4847448e6ddd5bf --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_437a9e154e0cc794398f+0da03933/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dbfc55682e4cde6e69da161b545755925c78e56ce4dc16b55700795d1c3a5648 +size 406082 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_4413977037670895934+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_4413977037670895934+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_4413977037670895934+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_4413977037670895934+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_4413977037670895934+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..49f6bceffacbac6067fb57db5ca99fe4cde58a1f --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_4413977037670895934+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:142cf311bb36155e3b609e6f1aa843a87974422fab37ba4fd5166d092a028f5e +size 1338 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_4729947242617427400+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_4729947242617427400+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_4729947242617427400+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_4729947242617427400+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_4729947242617427400+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_4729947242617427400+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_4729947242617427400+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..ab5d2955c5aeb33c2b8423e7facddd2ddead1ea3 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_4729947242617427400+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0dc16184a9197b242ab9bb070a2262cfc60a11b4b84c12d4ea59fad356f64771 +size 1585 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_4729947242617427400+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_4729947242617427400+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..8263ea8b3de78893adf983571add9f78cf4a97f4 Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_4729947242617427400+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_4982309848892198153+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_4982309848892198153+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_4982309848892198153+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_4982309848892198153+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_4982309848892198153+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_4982309848892198153+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_4982309848892198153+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..409dc6a76c47febfd2e6764450b15c032e0d0419 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_4982309848892198153+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0dcdccfc9cb1289cceea693cfb9f27f91556fcbe3060a7aeffcbef90ef8946d +size 1585 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_4982309848892198153+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_4982309848892198153+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..7feeecde5013bd311d129e9b73e614feeacff2fd Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_4982309848892198153+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_49b427a31f505e15551a+ec51c92c/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_49b427a31f505e15551a+ec51c92c/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..4497c8e4272323ebdda5e2b1043ebdf59117430b --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_49b427a31f505e15551a+ec51c92c/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--enable-saturate-infinity", "--auto-cast=none", "--model-type=transformer", "-O1", "--logfile=/tmp/nxdi_test_559ff7cb-7a76-44b8-a16e-2de44cab2a60/compiler_workdir/DecoderLayerWrapper/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_49b427a31f505e15551a+ec51c92c/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_49b427a31f505e15551a+ec51c92c/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_49b427a31f505e15551a+ec51c92c/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_49b427a31f505e15551a+ec51c92c/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..24059d82bbcd149441306f8c07104e0d1a528b8d --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_49b427a31f505e15551a+ec51c92c/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ffcb69581a275910194c1f9da6e6f165815ff451ce0b8fc2a627210726a1426a +size 14480 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_49b427a31f505e15551a+ec51c92c/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_49b427a31f505e15551a+ec51c92c/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..c24efa6f547487c85acc26acf0bfeeb3bbd588c6 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_49b427a31f505e15551a+ec51c92c/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c7ce05af28e3de8c57215d18f13b1d163b60f87e1ca2c9fe21ae0d996be2d51 +size 267264 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_49b427a31f505e15551a+ec51c92c/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_49b427a31f505e15551a+ec51c92c/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..153da81bf8b396c3543fe6fe860fb1a54701f464 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_49b427a31f505e15551a+ec51c92c/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e00b5183ccdd988fa7f78fb681dca16e8c85117ab6822fedb153ddb5f8161e4 +size 272962 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_4ac5ed244908e0b23eb7+677eeb9d/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_4ac5ed244908e0b23eb7+677eeb9d/model.hlo_module.pb index b4c40605da7851ffe567c9778de9d2083d306e1a..58b844b6061c1f9a1ab0b3c6c889c594ba91dd4b 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_4ac5ed244908e0b23eb7+677eeb9d/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_4ac5ed244908e0b23eb7+677eeb9d/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:185054b8ba80e7f52847989d5a58e3fb4aade61a671dfa510960053999998743 +oid sha256:ca80d55257caff0cc88a182611da0df7d95d1903c9dfe7bf87cf178ffb39718d size 423848 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_4ac5ed244908e0b23eb7+677eeb9d/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_4ac5ed244908e0b23eb7+677eeb9d/model.neff index 6c6159f8d47db8fd8279f29a598f88cf5f4cba96..623cc7349e31b11ca390261219fa1e4057305709 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_4ac5ed244908e0b23eb7+677eeb9d/model.neff +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_4ac5ed244908e0b23eb7+677eeb9d/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c9edfbb33bf7c99e688e8c548d7dd44eb866e3c89386ccf98942ae4694ebfeba +oid sha256:d70ad414aa3573103cbfde1ce85a53ec1a0481420517552d1a3c956e83bb630b size 3687424 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_4ec35bb57fbe1fdb6c78+24129607/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_4ec35bb57fbe1fdb6c78+24129607/model.hlo_module.pb index 895edb3462afd732c644c9f7bdcba520ae1d2f4f..9704ecf1639b344805be684c2ded122cea54d55c 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_4ec35bb57fbe1fdb6c78+24129607/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_4ec35bb57fbe1fdb6c78+24129607/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9e6541330eaced8ef5bd62804c6e06991d2bcb38f68c71b2cabb4ce571665de2 +oid sha256:dffab56f351fd6047a44f5ebd5da77b5b9ff225cbccc10f1838035d418f90930 size 1050679 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_4ec35bb57fbe1fdb6c78+24129607/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_4ec35bb57fbe1fdb6c78+24129607/model.neff index 4706e6ef2fc9d02aea23b7d7dd1b7f62c0776276..99bdbdb85c437f2560d064e1104bb4c119c3726a 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_4ec35bb57fbe1fdb6c78+24129607/model.neff +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_4ec35bb57fbe1fdb6c78+24129607/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d387ff6d3dd9954294cec3810fadabd0718735a038aaebd74ab358c209fd2b88 +oid sha256:50bc7c0ea9062790faf1ff7831453d65c8d1d51cde620c8e380820e4486a5f9d size 5827584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_5056926643664195969+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_5056926643664195969+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_5056926643664195969+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_5056926643664195969+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_5056926643664195969+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_5056926643664195969+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_5056926643664195969+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..7da2d77d6f20dd2d43935bc46b7a42f00a1b53fd --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_5056926643664195969+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:058681d48647e0c9b3dbe7688a61919a6582484d2f0b81ba3c0155e378d39840 +size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_5056926643664195969+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_5056926643664195969+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..ad763435ca14fea6e494cc68dbcdab7383f59eea Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_5056926643664195969+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_5060945789978167091+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_5060945789978167091+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_5060945789978167091+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_5060945789978167091+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_5060945789978167091+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_5060945789978167091+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_5060945789978167091+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..9f7cfa734d8f530c72009eb32f5920d1b7011ac8 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_5060945789978167091+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5cc8fae4180e9c37d3edf0a9c33cb9a77cc20d3a208ab308dd26971d505a3f2 +size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_5060945789978167091+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_5060945789978167091+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..c3e1d9df7d56d2f2630b9356f00b7248d6ca82c1 Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_5060945789978167091+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_5068307057019708073+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_5068307057019708073+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_5068307057019708073+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_5068307057019708073+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_5068307057019708073+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_5068307057019708073+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_5068307057019708073+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..c134283ccd0f0cb78d3df709fd00745d387a3bf2 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_5068307057019708073+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1bfa4233bec9ae7d38413a0183ed12d18519fc8a52d4be29ae06d39da17d8cd +size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_5068307057019708073+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_5068307057019708073+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..db6bb0a5b3d4fda083e6e3bd99c94af9c0781cd7 Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_5068307057019708073+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_5221425564004302780+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_5221425564004302780+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_5221425564004302780+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_5221425564004302780+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_5221425564004302780+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_5221425564004302780+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_5221425564004302780+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..72df21a2578f24d625843a1a3247988a3fbd65c4 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_5221425564004302780+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41482b2311979515b0aeef0f82fffdc167ce3ed1cf6a003693418491cdb469fc +size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_5221425564004302780+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_5221425564004302780+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..0c746225bc978d88dd2fc327c375cd121535189f Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_5221425564004302780+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_5321c1b69979af5581ee+a02c3a36/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_5321c1b69979af5581ee+a02c3a36/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..5726abc7d1d8c52fa95bc7919439a23a23fe3b9a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_5321c1b69979af5581ee+a02c3a36/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_5321c1b69979af5581ee+a02c3a36/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_5321c1b69979af5581ee+a02c3a36/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_5321c1b69979af5581ee+a02c3a36/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_5321c1b69979af5581ee+a02c3a36/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..a24605669bdc13546da99ca5a437f66e68bd7b1a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_5321c1b69979af5581ee+a02c3a36/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f820ab2f729bdfd55a7ba9bf0003cafd9de67e76cd3a97884b33094e6344f53b +size 59654 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_5321c1b69979af5581ee+a02c3a36/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_5321c1b69979af5581ee+a02c3a36/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..15fd3c16b848d0eab5773fc0b8412a3b450bd2ad --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_5321c1b69979af5581ee+a02c3a36/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7860b98a64042069d6fc93f55e4fdd957cd63f1dc2833e60f8f0c2be421f943 +size 1065984 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_5321c1b69979af5581ee+a02c3a36/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_5321c1b69979af5581ee+a02c3a36/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..90d74fc16d8a727c38f67cbddb21600ec5343c8e --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_5321c1b69979af5581ee+a02c3a36/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a41e80db3ee12b789d64769d2aeef981cbc1b2fa8ff1f244202a57cd02b903bc +size 1072769 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_5346694134112720644+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_5346694134112720644+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_5346694134112720644+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_5346694134112720644+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_5346694134112720644+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_5346694134112720644+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_5346694134112720644+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..1a8b11f7ea3f8104bfc94568f6e6605b1044b61a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_5346694134112720644+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5163c6cbea635d50d6bcef42a476e0c486c1fe477ce65bddb01ef5d613f3ada7 +size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_5346694134112720644+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_5346694134112720644+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..49ebd07bab2483eb641ed27190176b7a0bde2a3c Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_5346694134112720644+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_54dce09f6a5327de2511+fe16c4be/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_54dce09f6a5327de2511+fe16c4be/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..7be89b3e590fbf1fefd1d22b3fa5955dd1257559 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_54dce09f6a5327de2511+fe16c4be/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--enable-saturate-infinity", "--auto-cast=none", "--model-type=transformer", "-O1", "--logfile=/tmp/nxdi_test_fcc54286-d5b7-4e55-9ea0-9d22abafcc6d/compiler_workdir/DecoderLayerWrapper/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_54dce09f6a5327de2511+fe16c4be/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_54dce09f6a5327de2511+fe16c4be/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_54dce09f6a5327de2511+fe16c4be/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_54dce09f6a5327de2511+fe16c4be/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..24059d82bbcd149441306f8c07104e0d1a528b8d --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_54dce09f6a5327de2511+fe16c4be/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ffcb69581a275910194c1f9da6e6f165815ff451ce0b8fc2a627210726a1426a +size 14480 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_54dce09f6a5327de2511+fe16c4be/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_54dce09f6a5327de2511+fe16c4be/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..70b156ca450d4a72d7ff99fd4290bf3866804e63 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_54dce09f6a5327de2511+fe16c4be/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb035ebc5ee4edb0eadf00aaa3c9ad4a7aa8598c63ea253488b28c1014e8b6ac +size 267264 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_54dce09f6a5327de2511+fe16c4be/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_54dce09f6a5327de2511+fe16c4be/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..a39f153b6829edf1fb318f42cd53710e15a56cd4 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_54dce09f6a5327de2511+fe16c4be/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b24ff417c4c79be9479a91455335c7d277f1145fe6d3725fa91ac58deb3d035 +size 272962 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_578110665359387607+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_578110665359387607+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_578110665359387607+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_578110665359387607+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_578110665359387607+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_578110665359387607+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_578110665359387607+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..08f880bfd2f6bc4dbf4ba0e030ae57400b3644d9 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_578110665359387607+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9416ee80e28588b7d58a56ed290c42e6942a1b3745ec238b91c7fafbc1f154e5 +size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_578110665359387607+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_578110665359387607+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..0a4b67437bca50e840e4750cd8418b65a6880796 Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_578110665359387607+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_5960bdedd7549bfacf7a+24129607/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_5960bdedd7549bfacf7a+24129607/model.hlo_module.pb index dbe1f9441e2a7b2c4185bbafced0748b740f4d63..96b0b9d0aac667bdfb4b89f452b77fd0695d787e 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_5960bdedd7549bfacf7a+24129607/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_5960bdedd7549bfacf7a+24129607/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:5231390fb7b7b3c9416cee6d063cf72f57c3e66de2333a27302fd7480aad917a +oid sha256:76c10df9f9fadac3ce5fee74c4470b2cdade440cf97718b4545a4e3de7fc54aa size 694128 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_5960bdedd7549bfacf7a+24129607/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_5960bdedd7549bfacf7a+24129607/model.neff index b4b9c29f0411998756002266e85b7d95ef151b1d..ea50519fb23dc2dea11f1fddc04774675adc6431 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_5960bdedd7549bfacf7a+24129607/model.neff +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_5960bdedd7549bfacf7a+24129607/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:1d609c20314399dc90d7d3efc2f573991a8799ceb9c8c13a0528387d15454663 +oid sha256:5f816d25661f62f7f838c0800cb426bb2a2a552c974bc9c93181f83780ef36d8 size 625664 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_5a1775d2dd85719fa52a+a02c3a36/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_5a1775d2dd85719fa52a+a02c3a36/model.hlo_module.pb index ca2139b0a1c89d82bfa0225cb7b5731633c2c9f3..3b4e1caf8515f00e3ac37c3a1dfdba8ecbc8165c 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_5a1775d2dd85719fa52a+a02c3a36/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_5a1775d2dd85719fa52a+a02c3a36/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:e684a3c433b3d1931b42c868bc1f8e187d8d344041c428cfd571ae78019cda22 +oid sha256:19511d8804f5867708960e2d2fe363464f9fab523e00714e2bb658fd0dcf7d66 size 872065 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_5a1775d2dd85719fa52a+a02c3a36/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_5a1775d2dd85719fa52a+a02c3a36/model.neff index 85e79360d6e09dcd11d7ee7195d717c34e7e6256..32d9b98722be808e147b384df7ffd9d0acfed0ef 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_5a1775d2dd85719fa52a+a02c3a36/model.neff +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_5a1775d2dd85719fa52a+a02c3a36/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:558d00184fa1bac07430de16a73ee90da6291d87bdca5c37a0861521f936e86f +oid sha256:a1f800118fbab2a3f0e76ea675155dee4ac7c7c81344422aaf3a1d9410fa8c8c size 6759424 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_5a1775d2dd85719fa52a+a02c3a36/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_5a1775d2dd85719fa52a+a02c3a36/wrapped_neff.hlo index ac67cf1b1f6b08f88b88277daf86dc0d968f2f51..ae0aac5addc49da5e5dc1eff828aca17a6d3900b 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_5a1775d2dd85719fa52a+a02c3a36/wrapped_neff.hlo +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_5a1775d2dd85719fa52a+a02c3a36/wrapped_neff.hlo @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:f3f72238ea26ef23b1555bbfebd0581b0e7192da33c47dabc912a8987fe7a106 +oid sha256:e19063f7564465530256f4c433085a999fd5c7f620fd46742c22e971a9c2a098 size 6925948 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_6208374896869439318+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_6208374896869439318+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_6208374896869439318+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_6208374896869439318+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_6208374896869439318+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_6208374896869439318+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_6208374896869439318+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..b2e45ac79e7cdd5ec4c177fbcf28a2783e9dfbea --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_6208374896869439318+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:286cd304747970894823fc06483ba76dfd74ce76d0989e5b2ba815f5c03c200e +size 1585 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_6208374896869439318+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_6208374896869439318+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..dd6932da06790795019b38ca937d8c747c2a4efc Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_6208374896869439318+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_628b6d34444473fad038+a02c3a36/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_628b6d34444473fad038+a02c3a36/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..5726abc7d1d8c52fa95bc7919439a23a23fe3b9a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_628b6d34444473fad038+a02c3a36/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_628b6d34444473fad038+a02c3a36/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_628b6d34444473fad038+a02c3a36/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_628b6d34444473fad038+a02c3a36/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_628b6d34444473fad038+a02c3a36/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..7e156f6710d8d03836be1f27c589dfa8b047798b --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_628b6d34444473fad038+a02c3a36/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3408a558a72716e37aa265b674934a28ade7f77e0ca28de65c0d414b4bfac775 +size 59309 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_628b6d34444473fad038+a02c3a36/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_628b6d34444473fad038+a02c3a36/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..587c858640fadee7ed17fd8c9b52a6c352746c96 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_628b6d34444473fad038+a02c3a36/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3a53e8264739e457be503d9a06659bfa2cb60386fe7d8c7a3d01ba03f0bbeab +size 1055744 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_628b6d34444473fad038+a02c3a36/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_628b6d34444473fad038+a02c3a36/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..5d0bf58459bfae4f359ffce1381394319952fcef --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_628b6d34444473fad038+a02c3a36/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b40e2821470ce2f32e9b58ce8c66bb2c8053e5cff8002eb664bb7a8726e1c3c8 +size 1062511 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_6305938804443382221+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_6305938804443382221+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_6305938804443382221+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_6305938804443382221+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_6305938804443382221+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_6305938804443382221+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_6305938804443382221+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..d0f77914ffe027e73ead390ad61bd8c0fc019f22 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_6305938804443382221+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69b9c9469d8eb89302c52a8b5ef28e5dcbefd0187702e88f5bfda4a4752be87d +size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_6305938804443382221+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_6305938804443382221+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..a9c6762bbb9f7cd5a0dcd160bf65e83ad0e93885 Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_6305938804443382221+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_6601989946514187606+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_6601989946514187606+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_6601989946514187606+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_6601989946514187606+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_6601989946514187606+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_6601989946514187606+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_6601989946514187606+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..ee1e423f2f3d8d36a62df3d8f7a6a4b196011bd1 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_6601989946514187606+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0b98325b529fcc4a4bee1adf72ca1e7d9f89c8de8b1dcdb957931e7816140f6 +size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_6601989946514187606+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_6601989946514187606+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..6ed9fa6133ad18b6dddcec8ccbd2e6254f5f4cca Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_6601989946514187606+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_68b856b391a016dcfb36+94f624bf/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_68b856b391a016dcfb36+94f624bf/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..83ee45b9ce41df0692cb91a162763cbd5d22842e --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_68b856b391a016dcfb36+94f624bf/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--enable-saturate-infinity", "--auto-cast=none", "--model-type=transformer", "-O1", "--logfile=/tmp/nxdi_test_06bfbb88-4dfc-437e-aa33-6cfeb3e22fa3/compiler_workdir/DecoderLayerWrapper/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_68b856b391a016dcfb36+94f624bf/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_68b856b391a016dcfb36+94f624bf/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_68b856b391a016dcfb36+94f624bf/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_68b856b391a016dcfb36+94f624bf/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..d681207f945990d4e21e50b0e6b8e90d019cd7f0 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_68b856b391a016dcfb36+94f624bf/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:acc559309a214b16f3917edf6efe2b0ab578f048a6524f41ac73e1d625078b3e +size 14480 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_68b856b391a016dcfb36+94f624bf/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_68b856b391a016dcfb36+94f624bf/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..a1c8fffb047b653f52989b7594becdb05ef2f029 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_68b856b391a016dcfb36+94f624bf/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ecf16f3fc1ecbaf91c19332adec13f58b9eab5526f5f8ebc930b3d03612d918 +size 267264 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_68b856b391a016dcfb36+94f624bf/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_68b856b391a016dcfb36+94f624bf/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..0fce3d09952f3e46e3306afcfe93214ed46d5f91 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_68b856b391a016dcfb36+94f624bf/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c0cebff355853de964162bcf5aaa797e3b9c3d4669128992120207a32240729 +size 272962 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_6954418380069475056+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_6954418380069475056+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_6954418380069475056+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_6954418380069475056+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_6954418380069475056+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_6954418380069475056+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_6954418380069475056+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..cc4867fcc446b41950eb76b3e23b948cabacfbcb --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_6954418380069475056+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de02a218d743956a2996aaa5bd62b9f1638ffba8fbbee1533b1cdea8c050ea29 +size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_6954418380069475056+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_6954418380069475056+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..7210dd9abe1bcda21794bd4bf7033265879c1d0c Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_6954418380069475056+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_69ce67073ba646143ed4+24129607/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_69ce67073ba646143ed4+24129607/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..836724f44545ce0dedda1521fd4c623a6ea8ec72 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_69ce67073ba646143ed4+24129607/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_69ce67073ba646143ed4+24129607/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_69ce67073ba646143ed4+24129607/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_69ce67073ba646143ed4+24129607/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_69ce67073ba646143ed4+24129607/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..14fdbbb33d6e5dc636e9b23afebc653c24205dcd --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_69ce67073ba646143ed4+24129607/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56098bbc4e1115bb073697e1c5a349c4e8bb83656efcf80c80ecc9d9cb4d5767 +size 965833 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_69ce67073ba646143ed4+24129607/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_69ce67073ba646143ed4+24129607/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..5ab7f115f126ee090e328a9b38fd742814a9cad7 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_69ce67073ba646143ed4+24129607/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70cc500c4a4184db6b0b40edc013e749fbf1c78edfc6f513aae54d3dd9349282 +size 6687744 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_6b045be69220451cd35c+a02c3a36/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_6b045be69220451cd35c+a02c3a36/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..5726abc7d1d8c52fa95bc7919439a23a23fe3b9a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_6b045be69220451cd35c+a02c3a36/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_6b045be69220451cd35c+a02c3a36/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_6b045be69220451cd35c+a02c3a36/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_6b045be69220451cd35c+a02c3a36/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_6b045be69220451cd35c+a02c3a36/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..8f5b7a6670302805eb63187fed4ac60442b90e52 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_6b045be69220451cd35c+a02c3a36/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:134c0917a81e0e14135b250cdc4a1b63a67d652bd5f5ef6aded7b27637e2cf32 +size 863510 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_6b045be69220451cd35c+a02c3a36/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_6b045be69220451cd35c+a02c3a36/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..312c1828c56fc48afcab6fc8149d9c5a22d618bd --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_6b045be69220451cd35c+a02c3a36/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68e743a72b13678866827e5b546eaabb5e88bcd1792ba84ca2fea8fa338e08e7 +size 6769664 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_6b045be69220451cd35c+a02c3a36/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_6b045be69220451cd35c+a02c3a36/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..42f1a400e028ae3673bf8f99b179d25c0713da5e --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_6b045be69220451cd35c+a02c3a36/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b56a1b3f1cb55d9c1de5d4c6ba6e63563387d8f90a0c6f90858b65408e5cfb8 +size 6936331 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_6cc68373d81858239a08+24129607/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_6cc68373d81858239a08+24129607/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..836724f44545ce0dedda1521fd4c623a6ea8ec72 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_6cc68373d81858239a08+24129607/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_6cc68373d81858239a08+24129607/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_6cc68373d81858239a08+24129607/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_6cc68373d81858239a08+24129607/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_6cc68373d81858239a08+24129607/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..e4cc839e7273e66ba15ee208dd7c79a38527c6d0 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_6cc68373d81858239a08+24129607/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30a510cf4846173f2371acf3fd47814e09b78380db54628e90e1b93b87357080 +size 442335 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_6cc68373d81858239a08+24129607/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_6cc68373d81858239a08+24129607/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..18ea2f617f7a697deece61a5cf56aa1358dcdea6 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_6cc68373d81858239a08+24129607/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea36def340f997d46e74cad79b468db35534763807a30cae8d49da53516b2bca +size 41114624 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_6dd858f775c0a9002ded+8f459db2/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_6dd858f775c0a9002ded+8f459db2/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..e6d68cacdbb58b2fed9cd72b40d5cc941579deb9 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_6dd858f775c0a9002ded+8f459db2/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--enable-saturate-infinity", "--auto-cast=none", "--model-type=transformer", "-O1", "--logfile=/tmp/nxdi_test_5d34103a-85dc-4015-9fa3-ab51760b4433/compiler_workdir/DecoderLayerWrapper/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_6dd858f775c0a9002ded+8f459db2/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_6dd858f775c0a9002ded+8f459db2/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_6dd858f775c0a9002ded+8f459db2/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_6dd858f775c0a9002ded+8f459db2/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..ed757b286534c7f122a88f2e017000b828da9643 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_6dd858f775c0a9002ded+8f459db2/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:643b366d2e368b3b3b6d9c836ded077dc6564cf85685f50a5492dadb9cd8c5da +size 21842 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_6dd858f775c0a9002ded+8f459db2/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_6dd858f775c0a9002ded+8f459db2/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..5a56934a10800da4c79ac1e7515cda02eb541e59 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_6dd858f775c0a9002ded+8f459db2/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d08223e8a2dc1b30437ecdda7f471a8bafee9522372349713bd5e5e69a54fe2 +size 5356544 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_6dd858f775c0a9002ded+8f459db2/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_6dd858f775c0a9002ded+8f459db2/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..ba754df170712b9f5b564ea89e78536e880cb0f7 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_6dd858f775c0a9002ded+8f459db2/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d7df662538e217a23fb97997288319d4249b46f1cbe5147339bd5ca1a88390d +size 5362101 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_7071522469786365265+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_7071522469786365265+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_7071522469786365265+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_7071522469786365265+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_7071522469786365265+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_7071522469786365265+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_7071522469786365265+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..65cd73c86e8a07ff02487d4536d1f111a13f904e --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_7071522469786365265+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb0a6b6b9c81d5c6c20c442718dccbf485f40c87a8217af91107a5ab3e0af055 +size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_7071522469786365265+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_7071522469786365265+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..f18a3a3f7cd6411fd170674e7c0a1428f8d2b954 Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_7071522469786365265+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_73021bd2bcd85d0ae281+bafdbdde/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_73021bd2bcd85d0ae281+bafdbdde/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..5a228a7a4cc7c7df9e8b4887d22dcd862c2f60f3 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_73021bd2bcd85d0ae281+bafdbdde/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2", "-O1", "--lnc=1", "--enable-saturate-infinity", "--enable-mixed-precision-accumulation", "--internal-enable-dge-levels=vector_dynamic_offsets", "--internal-hlo2tensorizer-options=--verify-hlo=true", "--logfile=/tmp/nxd_model/token_generation/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_73021bd2bcd85d0ae281+bafdbdde/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_73021bd2bcd85d0ae281+bafdbdde/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_73021bd2bcd85d0ae281+bafdbdde/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_73021bd2bcd85d0ae281+bafdbdde/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..727fe2caac58854e2f659732c11b6b5473ac4505 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_73021bd2bcd85d0ae281+bafdbdde/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6596d3769509c9146ae4a3975d1c70c2eb236f1527bf8cab5cf9306c4300289f +size 89555 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_73021bd2bcd85d0ae281+bafdbdde/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_73021bd2bcd85d0ae281+bafdbdde/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..32fa287e2e4418c7c9002af355c7461d85f9f4bb --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_73021bd2bcd85d0ae281+bafdbdde/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4e6305d96ffce7a09ffe9fbe739daef69c503eceaa33e7181c52bb69f8e669d +size 369664 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_73021bd2bcd85d0ae281+bafdbdde/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_73021bd2bcd85d0ae281+bafdbdde/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..cd4155aa997fa356903eb273926c2869086276d2 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_73021bd2bcd85d0ae281+bafdbdde/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0093375c250feaa10fa7e89832496ea173e63ca7c802ed01d0f81aca0be48912 +size 379362 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_73021bd2bcd85d0ae281+da15b874/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_73021bd2bcd85d0ae281+da15b874/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..c3fb8c073852fb04e7ae88fd2592978716b60eeb --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_73021bd2bcd85d0ae281+da15b874/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2", "-O1--lnc=1", "--enable-saturate-infinity", "--enable-mixed-precision-accumulation", "--internal-enable-dge-levels=vector_dynamic_offsets", "--internal-hlo2tensorizer-options=--verify-hlo=true", "--logfile=/tmp/nxd_model/token_generation/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_73021bd2bcd85d0ae281+da15b874/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_73021bd2bcd85d0ae281+da15b874/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..727fe2caac58854e2f659732c11b6b5473ac4505 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_73021bd2bcd85d0ae281+da15b874/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6596d3769509c9146ae4a3975d1c70c2eb236f1527bf8cab5cf9306c4300289f +size 89555 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_73021bd2bcd85d0ae281+da15b874/model.log b/neuronxcc-2.21.33363.0+82129205/MODULE_73021bd2bcd85d0ae281+da15b874/model.log new file mode 100644 index 0000000000000000000000000000000000000000..f5a382588428b9da47b14342f226d3a77768d5eb --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_73021bd2bcd85d0ae281+da15b874/model.log @@ -0,0 +1,5 @@ +Failed compilation with ['neuronx-cc', 'compile', '--framework=XLA', '/tmp/nxd_model/token_generation/_tp0_bk0/model.MODULE_73021bd2bcd85d0ae281+da15b874.hlo_module.pb', '--output', '/tmp/nxd_model/token_generation/_tp0_bk0/model.MODULE_73021bd2bcd85d0ae281+da15b874.neff', '--target=trn1', '--auto-cast=none', '--model-type=transformer', '--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2', '-O1--lnc=1', '--enable-saturate-infinity', '--enable-mixed-precision-accumulation', '--internal-enable-dge-levels=vector_dynamic_offsets', '--internal-hlo2tensorizer-options=--verify-hlo=true', '--logfile=/tmp/nxd_model/token_generation/_tp0_bk0/log-neuron-cc.txt', '--enable-internal-neff-wrapper', '--verbose=35']: neuronx-cc compile: argument --optlevel/-O: invalid choice: 1--lnc=1 (choose from 1, 2, 3) +usage: neuronx-cc compile --framework {XLA} --target {trn1,inf2,trn1n,trn2,trn2n} [--logical-nc-config {1,2}] [--enable-fast-loading-neuron-binaries] [--enable-fast-context-switch] + [--auto-cast ] [--auto-cast-type {fp16,bf16,tf32,fp8_e4m3}] [--output ] [--optlevel {1,2,3}] [--help] + [--model-type {transformer,unet-inference,generic}] [--distribution-strategy {fsdp,nemo,llm-training,generic}] [--enable-dge] + [--verbose {debug|info|warning|user|off}] [--logfile ] [--logfile-verbose {debug|info|warning|user}] diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_740c88e5b7c7bd2f9bae+a02c3a36/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_740c88e5b7c7bd2f9bae+a02c3a36/model.neff index 1d19ec58ea30fbc60460e92a65f667d9ff589ff4..c82043ade41edd2245f21b0612779e7cf36225d8 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_740c88e5b7c7bd2f9bae+a02c3a36/model.neff +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_740c88e5b7c7bd2f9bae+a02c3a36/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:8f7a47d761c50e5ce0c9150e15d0e9f32726afb1e95a6072553758b37a853663 +oid sha256:0d00a067a62b1f1860deb777f444b9cb08cb6f877ec885847d64ea73763b0efc size 3073024 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_740c88e5b7c7bd2f9bae+a02c3a36/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_740c88e5b7c7bd2f9bae+a02c3a36/wrapped_neff.hlo index 2ec9b817684a199180fefb951640f29396b46be0..7ea34a25aa5497e5bb5b6816f001ddd754ed0800 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_740c88e5b7c7bd2f9bae+a02c3a36/wrapped_neff.hlo +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_740c88e5b7c7bd2f9bae+a02c3a36/wrapped_neff.hlo @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c366c2aa9312137e4985670cf006f130a78f6f383ce45c8c327a270a772b4bf8 +oid sha256:26442807d050083846013c76054618f0984ad4569d6bc245666e9114a5c0a2cb size 3147125 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_748714541699003438+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_748714541699003438+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_748714541699003438+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_748714541699003438+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_748714541699003438+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_748714541699003438+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_748714541699003438+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..624a3c1b56463ca0ba1cbc694c1d9b90576442b7 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_748714541699003438+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5a94da50ba3ee7f04a09d0f188a7ad5540e359965b908e16572e1a5f6151498 +size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_748714541699003438+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_748714541699003438+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..4ba3cebab5f2a48b106da8f4a230731a97916fb8 Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_748714541699003438+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_77f1b8fbe51833738f1c+24129607/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_77f1b8fbe51833738f1c+24129607/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..836724f44545ce0dedda1521fd4c623a6ea8ec72 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_77f1b8fbe51833738f1c+24129607/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_77f1b8fbe51833738f1c+24129607/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_77f1b8fbe51833738f1c+24129607/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_77f1b8fbe51833738f1c+24129607/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_77f1b8fbe51833738f1c+24129607/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..c40126d5a207852bf5006e0a5ec468d377879109 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_77f1b8fbe51833738f1c+24129607/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d6a08324e300c96d010e805b8c8ac8641071bdefe7f2baee9523167de763b2e +size 539301 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_77f1b8fbe51833738f1c+24129607/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_77f1b8fbe51833738f1c+24129607/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..4e9c8e9ed6e164c1e8eb16c0066e75abe716b1f8 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_77f1b8fbe51833738f1c+24129607/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:caec6c3d395c308dd8bd2557f4c49ae79205506b29b6e4e088b0b7cb54942b1d +size 41247744 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_780259796876411187+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_780259796876411187+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_780259796876411187+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_780259796876411187+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_780259796876411187+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_780259796876411187+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_780259796876411187+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..147c1586aac46ddfe7b367fb4f90a52b1589362e --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_780259796876411187+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e3874129d23ad1c69d19cc9636edc6f6b0bec7684aaa4058429feb1e7acfc2c +size 1585 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_780259796876411187+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_780259796876411187+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..39542d53bb3961c021aec3d7944bf64223663336 Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_780259796876411187+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_788940165194100575+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_788940165194100575+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_788940165194100575+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_788940165194100575+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_788940165194100575+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_788940165194100575+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_788940165194100575+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..a3d9ab4f7c96a51129b485c987af0c3965fbd2e3 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_788940165194100575+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12a4a82788fd9c10e258bc78cfac56903ed9e41e56c1b39918ac7a98aa50f857 +size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_788940165194100575+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_788940165194100575+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..711b0e81fd87e197987f7da6b59e52c2f83a80c1 Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_788940165194100575+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_78a467fd5a1d9f7adeef+24129607/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_78a467fd5a1d9f7adeef+24129607/model.hlo_module.pb index b5354b7b5a65a43ef1260aa0e8de13980762d080..8efac31d5864de2a0cbd583784f247093eaa7a94 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_78a467fd5a1d9f7adeef+24129607/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_78a467fd5a1d9f7adeef+24129607/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:649ff83e0cbee13abda84e02c1a114e8b60d780456161e42f68c99c57744691c +oid sha256:7d98bb4abcef46bc4dfcb539ece861af724c555279e78c4ba6ef27c16f25cecc size 739558 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_78a467fd5a1d9f7adeef+24129607/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_78a467fd5a1d9f7adeef+24129607/model.neff index 7ecd1ce442179565edc8bb4d1660d21aff8162f3..b8556e1e2744f691770610f5d28bb67d270daeb5 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_78a467fd5a1d9f7adeef+24129607/model.neff +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_78a467fd5a1d9f7adeef+24129607/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:40dfa607b020ef9e891d5a4dca71cd75f67a5ecc7a86e72b2146a17479837b20 +oid sha256:01d131442ec0615f97346844e44a2b093f093f77430729c4c6a75c4ec1267984 size 26133504 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_7ac33c003364730bb8e0+e4ea82eb/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_7ac33c003364730bb8e0+e4ea82eb/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..cb28f34e622020a54ea80c9e6f76fb60851c9273 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_7ac33c003364730bb8e0+e4ea82eb/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--enable-saturate-infinity", "--auto-cast=none", "--model-type=transformer", "-O1", "--logfile=/tmp/nxdi_test_facaae82-be8c-49ab-8b4d-d3ba892aacde/compiler_workdir/DecoderLayerWrapper/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_7ac33c003364730bb8e0+e4ea82eb/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_7ac33c003364730bb8e0+e4ea82eb/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_7ac33c003364730bb8e0+e4ea82eb/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_7ac33c003364730bb8e0+e4ea82eb/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..557f3c2606d8e3fea4e49480c9e678d4bb2e18b9 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_7ac33c003364730bb8e0+e4ea82eb/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16b8737187be25031c594bd9293d7718b3a08e1b8669fcc99e4ca3e1382951ca +size 21842 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_7ac33c003364730bb8e0+e4ea82eb/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_7ac33c003364730bb8e0+e4ea82eb/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..f4bbb301322d638c60dbd4b535bbe1631bba64a9 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_7ac33c003364730bb8e0+e4ea82eb/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd9ae33ac88fe308d95ffe126239f9948a3cbeb052821893ef70f9af6a74bb2a +size 13507584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_7ac33c003364730bb8e0+e4ea82eb/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_7ac33c003364730bb8e0+e4ea82eb/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..5d33ba7065c501d267e0c195cd43cb5adb9a4b7c --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_7ac33c003364730bb8e0+e4ea82eb/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2bb8f4ec46dbabb68f95b15b98ef70269fe662b590c3bddf5c14729091467796 +size 13513141 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_7b28cd1e3dc6bc844fa3+24129607/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_7b28cd1e3dc6bc844fa3+24129607/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..836724f44545ce0dedda1521fd4c623a6ea8ec72 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_7b28cd1e3dc6bc844fa3+24129607/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_7b28cd1e3dc6bc844fa3+24129607/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_7b28cd1e3dc6bc844fa3+24129607/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_7b28cd1e3dc6bc844fa3+24129607/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_7b28cd1e3dc6bc844fa3+24129607/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..608f7d5151e91c1e8fe38cd221e0f2cbcec4d9ec --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_7b28cd1e3dc6bc844fa3+24129607/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21f0f18ad74724d528a22ba281be0eaa0215d4c51c32cc9f6e53ee2a5e6b63eb +size 539293 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_7b28cd1e3dc6bc844fa3+24129607/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_7b28cd1e3dc6bc844fa3+24129607/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..8d870b08c8cd3986457316500fe0f5429c30b004 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_7b28cd1e3dc6bc844fa3+24129607/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0613d55be77786ee4cc25078027d36a4e958c507c677291ba94bdb9f3dd9489a +size 41247744 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_7c2638502a7538102290+a02c3a36/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_7c2638502a7538102290+a02c3a36/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..5726abc7d1d8c52fa95bc7919439a23a23fe3b9a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_7c2638502a7538102290+a02c3a36/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_7c2638502a7538102290+a02c3a36/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_7c2638502a7538102290+a02c3a36/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_7c2638502a7538102290+a02c3a36/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_7c2638502a7538102290+a02c3a36/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..f6f790355c18a49e170acb8dfdc326047ee5b1bc --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_7c2638502a7538102290+a02c3a36/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c677f4472d5cb6ee4fb280b2f7f0e9ec44ab34e3d2f22624181c1b9f68b9401 +size 749530 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_7c2638502a7538102290+a02c3a36/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_7c2638502a7538102290+a02c3a36/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..c9c4413fc51145e4cecde458badaed3765a3785e --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_7c2638502a7538102290+a02c3a36/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:838f56981e2283d5d2fc868f0288ab80d1b456db738cd422573fb27e75699297 +size 3124224 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_7c2638502a7538102290+a02c3a36/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_7c2638502a7538102290+a02c3a36/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..7ccf8a3794c0cd8be6bf5e5d96bf71e696de01f7 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_7c2638502a7538102290+a02c3a36/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58a2383839877ae97d7e19f0f8758b8ce9e6bde442c0ac88fa32ea398a0ed7c5 +size 3272392 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_7d7829b80b30c6a8366e+82a94d75/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_7d7829b80b30c6a8366e+82a94d75/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..5f2bb45239674242975b0fa15f6f9fe225814f98 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_7d7829b80b30c6a8366e+82a94d75/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--enable-saturate-infinity", "--auto-cast=none", "--model-type=transformer", "-O1", "--logfile=/tmp/nxdi_test_8bed7412-f23c-4e85-8ceb-cddc3027189c/compiler_workdir/DecoderLayerWrapper/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_7d7829b80b30c6a8366e+82a94d75/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_7d7829b80b30c6a8366e+82a94d75/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_7d7829b80b30c6a8366e+82a94d75/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_7d7829b80b30c6a8366e+82a94d75/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..d0c380598b43a12fe53a8bcde96daee3e769f996 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_7d7829b80b30c6a8366e+82a94d75/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95727e0f4f47bf86e8e5540c9bfba35739e9ca53d425c64b0935d402a878ac96 +size 15848 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_7d7829b80b30c6a8366e+82a94d75/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_7d7829b80b30c6a8366e+82a94d75/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..31cbc208c1940ddfa4cbce06acd9b7d6e136dbbc --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_7d7829b80b30c6a8366e+82a94d75/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89b9f1309d95c86f5a3911d90a7ca4fd45675a0872436149c9118c7d8b762d3c +size 267264 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_7d7829b80b30c6a8366e+82a94d75/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_7d7829b80b30c6a8366e+82a94d75/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..b098350a73f9e4ad99e5fbf2b8491f371ebf7174 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_7d7829b80b30c6a8366e+82a94d75/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0eca3aecd640e7bece133a800ff36d42d5e0ca6229855c0250064c87ff8e61c +size 272962 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_7f4b070326c197aa68db+a02c3a36/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_7f4b070326c197aa68db+a02c3a36/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..5726abc7d1d8c52fa95bc7919439a23a23fe3b9a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_7f4b070326c197aa68db+a02c3a36/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_7f4b070326c197aa68db+a02c3a36/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_7f4b070326c197aa68db+a02c3a36/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_7f4b070326c197aa68db+a02c3a36/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_7f4b070326c197aa68db+a02c3a36/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..c871f1164f825b857f1680082a5922e1d8cf255e --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_7f4b070326c197aa68db+a02c3a36/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4288f97159a1a045dfcb075cd63bfa2fe8d84a6eeeadc7e52c2de97d8307c6ab +size 702870 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_7f4b070326c197aa68db+a02c3a36/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_7f4b070326c197aa68db+a02c3a36/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..57b37f1e4cf2b985a6e062c1ffe45496e4ce1739 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_7f4b070326c197aa68db+a02c3a36/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87af877110b1b8f51cfcf8285f9bdfb9ae805fcb7c1bda60244bf340d5a0b068 +size 3503104 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_7f4b070326c197aa68db+a02c3a36/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_7f4b070326c197aa68db+a02c3a36/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..32759e37f4b5e6514b2c03e2e0bce19c4d824f7f --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_7f4b070326c197aa68db+a02c3a36/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4389ea419121df0d40f1d0ff6725efe7ecb9e9d32df8b454e258be4f0c1fc4e2 +size 3640300 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_8040971574bb1f40a771+eb6614ba/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_8040971574bb1f40a771+eb6614ba/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..ce990ca454779cc18880e6c265e1f5a083544631 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_8040971574bb1f40a771+eb6614ba/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--enable-saturate-infinity", "--auto-cast=none", "--model-type=transformer", "-O1", "--logfile=/tmp/nxdi_test_a988fd86-bc45-43eb-8bbd-94af9fe20c4a/compiler_workdir/DecoderLayerWrapper/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_8040971574bb1f40a771+eb6614ba/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_8040971574bb1f40a771+eb6614ba/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_8040971574bb1f40a771+eb6614ba/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_8040971574bb1f40a771+eb6614ba/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..d0c380598b43a12fe53a8bcde96daee3e769f996 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_8040971574bb1f40a771+eb6614ba/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95727e0f4f47bf86e8e5540c9bfba35739e9ca53d425c64b0935d402a878ac96 +size 15848 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_8040971574bb1f40a771+eb6614ba/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_8040971574bb1f40a771+eb6614ba/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..9d3d3d8e14a91bf235937ccdb070538cf9e74e2d --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_8040971574bb1f40a771+eb6614ba/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9d2bcc6f0b9899df44d258cb7e9dd5c064898e03a61421cc0496a2cc3a44807 +size 267264 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_8040971574bb1f40a771+eb6614ba/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_8040971574bb1f40a771+eb6614ba/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..0f0af1087bfddc8f22eb226e714a762f86342447 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_8040971574bb1f40a771+eb6614ba/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e194998c9167b8ae0d48cef773247b7276440f09bee8a2e84b6bda7fc8369e47 +size 272962 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_818bc30ba0942fe4c3d6+24129607/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_818bc30ba0942fe4c3d6+24129607/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..836724f44545ce0dedda1521fd4c623a6ea8ec72 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_818bc30ba0942fe4c3d6+24129607/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_818bc30ba0942fe4c3d6+24129607/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_818bc30ba0942fe4c3d6+24129607/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_818bc30ba0942fe4c3d6+24129607/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_818bc30ba0942fe4c3d6+24129607/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..20d3cbc1058d161a886aa47a1cc2625bf5060d27 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_818bc30ba0942fe4c3d6+24129607/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94e7f32be2a78824bbbe1288dddfbf9685dc9cae840ae36e1b0e23897548bdb4 +size 542592 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_818bc30ba0942fe4c3d6+24129607/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_818bc30ba0942fe4c3d6+24129607/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..3d774f0d94be94cf53efdab65e7d5bd315600035 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_818bc30ba0942fe4c3d6+24129607/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3bfc58019c455b9997a24abadcd533738c835473303cf7b2405cdf3d3eca56f6 +size 41319424 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_82cabaf7b1369e971e5c+5e080832/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_82cabaf7b1369e971e5c+5e080832/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..1212dbab684ccf0d8c4973516f0da2545e9646fa --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_82cabaf7b1369e971e5c+5e080832/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--enable-saturate-infinity", "--auto-cast=none", "--model-type=transformer", "-O1", "--logfile=/tmp/nxdi_test_0488345e-ec2a-4bf1-b6e4-dc7c5869662d/compiler_workdir/DecoderLayerWrapper/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_82cabaf7b1369e971e5c+5e080832/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_82cabaf7b1369e971e5c+5e080832/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_82cabaf7b1369e971e5c+5e080832/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_82cabaf7b1369e971e5c+5e080832/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..c0085b990f557c43d8e51445d9ee78974487c16d --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_82cabaf7b1369e971e5c+5e080832/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0bf2f097fbd06b979910d8b7304be86176d5776d2cd05fa2d3fa2617eb43ccc9 +size 15614 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_82cabaf7b1369e971e5c+5e080832/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_82cabaf7b1369e971e5c+5e080832/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..686b83a485c467b98b7ac4627fa4dd3cdf764860 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_82cabaf7b1369e971e5c+5e080832/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f99646f284e115efdcc2e1daed844333b81b7da217fdfbf5d776176bf993b67b +size 154624 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_82cabaf7b1369e971e5c+5e080832/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_82cabaf7b1369e971e5c+5e080832/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..92b5454b49d3435f00d64ae6f775ba773003cbe6 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_82cabaf7b1369e971e5c+5e080832/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ce533ac3993128b9f41824d853998d9007328dfb041adafb9f421070770eec8 +size 159439 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_8432304590411733968+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_8432304590411733968+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_8432304590411733968+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_8432304590411733968+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_8432304590411733968+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_8432304590411733968+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_8432304590411733968+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..ea75b72ceb1ffddf1735837bb050ce370fb813af --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_8432304590411733968+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81c88ba71326839d9c30573e697266a88ef7c7e6ca153aca44fcb611072884d8 +size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_8432304590411733968+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_8432304590411733968+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..78b3020a0f4b3514d2823af3281b88cb75c28775 Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_8432304590411733968+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_8468241434736974290+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_8468241434736974290+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_8468241434736974290+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_8468241434736974290+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_8468241434736974290+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_8468241434736974290+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_8468241434736974290+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..5ce4a24a3f4ad9ddae0cf6c4f101d0fb719b0485 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_8468241434736974290+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:924f25eeb83b1f2c854719d98be6e51db203789ac31568689f5bd4aef63dfb9a +size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_8468241434736974290+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_8468241434736974290+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..8cf63b519dd0fc253a5de1381f2e58a41ce898cc Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_8468241434736974290+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_8476840015321783067+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_8476840015321783067+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_8476840015321783067+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_8476840015321783067+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_8476840015321783067+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_8476840015321783067+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_8476840015321783067+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..1efd6b7dedc83c3704cd1b735e12395887f6da8a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_8476840015321783067+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9b5c4ccf12d542b037ab62137b8b394682b100f2c521675c7bf12890efda020 +size 1585 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_8476840015321783067+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_8476840015321783067+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..f1c785df9c6ff3a021269f572b498971435f8c75 Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_8476840015321783067+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_862f4269950d182a7b0b+bceffd01/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_862f4269950d182a7b0b+bceffd01/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..a3c1beceabba94d325340c341772b0e0195d01ed --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_862f4269950d182a7b0b+bceffd01/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--enable-saturate-infinity", "--auto-cast=none", "--model-type=transformer", "-O1", "--logfile=/tmp/nxdi_test_b4e7168f-d113-4369-8789-403a0e77e0f4/compiler_workdir/DecoderLayerWrapper/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_862f4269950d182a7b0b+bceffd01/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_862f4269950d182a7b0b+bceffd01/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_862f4269950d182a7b0b+bceffd01/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_862f4269950d182a7b0b+bceffd01/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..0178c3d56ce706eb29ef263fef96f2d4ec891d21 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_862f4269950d182a7b0b+bceffd01/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a549dd87d6b9d7ef0fd6b25a2d4cc3432ca1059e80b4862da74f5b881b28285 +size 15614 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_862f4269950d182a7b0b+bceffd01/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_862f4269950d182a7b0b+bceffd01/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..c35d96db1923a4e87f54a9faad5b97eab40ee28a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_862f4269950d182a7b0b+bceffd01/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a09bff8e6c21a114a70e5f8edaf8239b30677ab38b603c7e8caa55bbb1b31a00 +size 154624 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_862f4269950d182a7b0b+bceffd01/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_862f4269950d182a7b0b+bceffd01/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..9725cf29055a68b1c97f15116c7cc8f119b768cc --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_862f4269950d182a7b0b+bceffd01/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3de70eaa89353bb39d47dfee567914ecc72d5265ae426d63723b8f66333c878f +size 159439 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_879201820668420060+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_879201820668420060+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_879201820668420060+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_879201820668420060+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_879201820668420060+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_879201820668420060+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_879201820668420060+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..a2b43988cc81aa73f757af772d542c413e653e2e --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_879201820668420060+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cef670d6b80a7e4253b327fd39e1d079ac588f85021dabc03613787fe9e15793 +size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_879201820668420060+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_879201820668420060+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..ba58a8ac545478c73d732c1d8901d02aa7bc55fa Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_879201820668420060+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_8976186fc1a14a570398+24129607/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_8976186fc1a14a570398+24129607/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..836724f44545ce0dedda1521fd4c623a6ea8ec72 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_8976186fc1a14a570398+24129607/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_8976186fc1a14a570398+24129607/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_8976186fc1a14a570398+24129607/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_8976186fc1a14a570398+24129607/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_8976186fc1a14a570398+24129607/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..1061888e375ff6c653817e77647513d0f85f4a51 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_8976186fc1a14a570398+24129607/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9618983cb3b58f43eba8b4defb4ef66b3f8bdd11d441c021d90d3507ba304ef5 +size 923499 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_8976186fc1a14a570398+24129607/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_8976186fc1a14a570398+24129607/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..182c2dd0f0c9c8b7ccb61f5cd10e94a7a517430e --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_8976186fc1a14a570398+24129607/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9cf6f3e794ce64e8618eafbe02bfa901b4ca21963ddd8542ee648dd6755613a5 +size 11408384 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_8e3aecb3518895a4ebd0+a02c3a36/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_8e3aecb3518895a4ebd0+a02c3a36/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..5726abc7d1d8c52fa95bc7919439a23a23fe3b9a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_8e3aecb3518895a4ebd0+a02c3a36/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_8e3aecb3518895a4ebd0+a02c3a36/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_8e3aecb3518895a4ebd0+a02c3a36/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_8e3aecb3518895a4ebd0+a02c3a36/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_8e3aecb3518895a4ebd0+a02c3a36/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..9eeeb0a712f25cbf47e575e1cefc3b3fa7b56734 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_8e3aecb3518895a4ebd0+a02c3a36/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da75b95f934328ef0c490142c5e1f9d2ef53a2baf0294f4d74c82b4f69331768 +size 59654 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_8e3aecb3518895a4ebd0+a02c3a36/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_8e3aecb3518895a4ebd0+a02c3a36/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..7cf3bff6f4e7f424639d182f5a801d75d63acb57 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_8e3aecb3518895a4ebd0+a02c3a36/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd648936f1cd588f7e4667462d37b3430a4f9d914edbb090f6b80752943e8dc2 +size 1086464 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_8e3aecb3518895a4ebd0+a02c3a36/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_8e3aecb3518895a4ebd0+a02c3a36/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..092863b1637386d806723a4a0b8b6425a7fce996 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_8e3aecb3518895a4ebd0+a02c3a36/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1129f0880cccd3ceb0e801ed2d4a938aee9d031dfc1e2619dbe948d3100f55c0 +size 1093249 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_8f63e2da128b2efd447e+a02c3a36/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_8f63e2da128b2efd447e+a02c3a36/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..5726abc7d1d8c52fa95bc7919439a23a23fe3b9a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_8f63e2da128b2efd447e+a02c3a36/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_8f63e2da128b2efd447e+a02c3a36/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_8f63e2da128b2efd447e+a02c3a36/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_8f63e2da128b2efd447e+a02c3a36/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_8f63e2da128b2efd447e+a02c3a36/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..be8215e4db02a98e7c7d9a9b026367f5b42a91ea --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_8f63e2da128b2efd447e+a02c3a36/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20ed0858162f8fc2c58bc4c23d0925dbeda5897dae0889f87758206676394f4e +size 81843 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_8f63e2da128b2efd447e+a02c3a36/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_8f63e2da128b2efd447e+a02c3a36/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..99c7d655cddbc1912973cc04fe157dafa9859f50 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_8f63e2da128b2efd447e+a02c3a36/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9cd8bc061981baceefabdaa5ca287e1e48f591b569eaeb4ce05b5fa636e1d8c +size 246784 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_8f63e2da128b2efd447e+a02c3a36/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_8f63e2da128b2efd447e+a02c3a36/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..21acafea44333656b4673e656ada71c9c58748d8 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_8f63e2da128b2efd447e+a02c3a36/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cee6b0533aa9da5b3c8273ba009014b88e974e7ede3f77b3afd82c665bb13389 +size 255104 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_9312fb1868a91c85e16a+24129607/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_9312fb1868a91c85e16a+24129607/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..836724f44545ce0dedda1521fd4c623a6ea8ec72 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_9312fb1868a91c85e16a+24129607/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_9312fb1868a91c85e16a+24129607/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_9312fb1868a91c85e16a+24129607/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_9312fb1868a91c85e16a+24129607/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_9312fb1868a91c85e16a+24129607/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..4e9aa2561beb27efdbfa9b821173c511de5fa520 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_9312fb1868a91c85e16a+24129607/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8871b29715ad7fd6db79f35c066c13a5596d8363311d383c1493179918d9a641 +size 71982 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_9312fb1868a91c85e16a+24129607/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_9312fb1868a91c85e16a+24129607/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..4c3929950855db434e6f40cf14d09ae96c5dce80 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_9312fb1868a91c85e16a+24129607/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a71fe4be79904c99e25282d6ac6f2b3bc63dba94287a3cc5487eb97d3746ab49 +size 24730624 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_9359742670556022940+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_9359742670556022940+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_9359742670556022940+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_9359742670556022940+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_9359742670556022940+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_9359742670556022940+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_9359742670556022940+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..d8aea4a29916e9ee6c3d3cb01dd7040f9449b6e7 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_9359742670556022940+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e281a28fd4383e251e58b20244d279c47e2a97ff0e8d2ce7c4cdb5d6ebff3689 +size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_9359742670556022940+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_9359742670556022940+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..87eb28e4596daed06413ac0b47e33673f0db962b Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_9359742670556022940+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_9551663534243818596+e30acd3a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_9551663534243818596+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_9551663534243818596+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_9551663534243818596+e30acd3a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_9551663534243818596+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_9551663534243818596+e30acd3a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_9551663534243818596+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..9918fd3fa8009a6648d5eb93e90edc50804acd4c --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_9551663534243818596+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3bb8a07961986496e8562aaa6b8e2c95f1a16486d01671b496004968c006d1a +size 1584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_9551663534243818596+e30acd3a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_9551663534243818596+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..95d02cfd4094e2a2c5d23ca91d65ff927ab9151e Binary files /dev/null and b/neuronxcc-2.21.33363.0+82129205/MODULE_9551663534243818596+e30acd3a/model.neff differ diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_96198b429c7161961ae8+a02c3a36/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_96198b429c7161961ae8+a02c3a36/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..5726abc7d1d8c52fa95bc7919439a23a23fe3b9a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_96198b429c7161961ae8+a02c3a36/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_96198b429c7161961ae8+a02c3a36/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_96198b429c7161961ae8+a02c3a36/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_96198b429c7161961ae8+a02c3a36/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_96198b429c7161961ae8+a02c3a36/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..a3187b3243e2f51d9ec4180d71f829368c83292b --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_96198b429c7161961ae8+a02c3a36/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a7fe45265a07c517367eeb14a9e872a13b28bd852a3c700cd95f3aaca45e606 +size 1072107 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_96198b429c7161961ae8+a02c3a36/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_96198b429c7161961ae8+a02c3a36/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..083476660664ad069c752f92a1df9275350ddf93 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_96198b429c7161961ae8+a02c3a36/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be00683456c8e53ac1d8b636bc43948334439945df69e21d13bb024fb0c8f74b +size 6974464 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_96198b429c7161961ae8+a02c3a36/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_96198b429c7161961ae8+a02c3a36/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..aced4acc115b3cf69db0aa9ed26620565197e7e5 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_96198b429c7161961ae8+a02c3a36/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a02a01e12342eca2024052e03e32319101c7dfa74747cebd14b8ee01efd7341 +size 7158800 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_97d05358399518e4efee+a02c3a36/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_97d05358399518e4efee+a02c3a36/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..5726abc7d1d8c52fa95bc7919439a23a23fe3b9a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_97d05358399518e4efee+a02c3a36/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_97d05358399518e4efee+a02c3a36/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_97d05358399518e4efee+a02c3a36/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_97d05358399518e4efee+a02c3a36/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_97d05358399518e4efee+a02c3a36/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..96fe3f3e5c945607376827a4431c3bca17fb08d9 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_97d05358399518e4efee+a02c3a36/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97f7d0fd62b57e405033e6732e923bfef8aca85b712557cee2b0b792bdb4c0c8 +size 691657 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_97d05358399518e4efee+a02c3a36/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_97d05358399518e4efee+a02c3a36/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..84a848047b706b29a202cffd6885fe799456aaf5 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_97d05358399518e4efee+a02c3a36/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89974f7eed4d0bab949c0feb58ae405cf6c126cbd20818140de2e62266ee699f +size 12411904 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_97d05358399518e4efee+a02c3a36/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_97d05358399518e4efee+a02c3a36/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..0bf06efa9573c9afd0c66ad08a9f88dc3405edc1 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_97d05358399518e4efee+a02c3a36/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:064fa5dfc0c2256ae81bf23273a14f13e795cdc5086d85f6038578c00ceeb7d7 +size 12559063 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_9a0754abf83f7bc78b7d+098c44e3/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_9a0754abf83f7bc78b7d+098c44e3/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..c271fa2cc2817515d095ebac013642a160609a93 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_9a0754abf83f7bc78b7d+098c44e3/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--enable-saturate-infinity", "--auto-cast=none", "--model-type=transformer", "-O1", "--logfile=/tmp/nxdi_test_191ea227-e475-47e3-8582-0090d3a205fa/compiler_workdir/DecoderLayerWrapper/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_9a0754abf83f7bc78b7d+098c44e3/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_9a0754abf83f7bc78b7d+098c44e3/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_9a0754abf83f7bc78b7d+098c44e3/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_9a0754abf83f7bc78b7d+098c44e3/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..c0085b990f557c43d8e51445d9ee78974487c16d --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_9a0754abf83f7bc78b7d+098c44e3/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0bf2f097fbd06b979910d8b7304be86176d5776d2cd05fa2d3fa2617eb43ccc9 +size 15614 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_9a0754abf83f7bc78b7d+098c44e3/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_9a0754abf83f7bc78b7d+098c44e3/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..d4ec7b30f4a9a02d9cebed8b7c5b684f0dead565 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_9a0754abf83f7bc78b7d+098c44e3/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a283f7efd3f1dc65fd9f971033c9e87b0e39eaaca960e4a3294aef9008980c63 +size 154624 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_9a0754abf83f7bc78b7d+098c44e3/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_9a0754abf83f7bc78b7d+098c44e3/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..515838cf62cc91e98a6a69759d44d2462c1864ec --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_9a0754abf83f7bc78b7d+098c44e3/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e906fa4bdb753e27d763c16fdd67fd094ceb82708005aea142bc5d86d569935 +size 159439 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_9abf1a24d09eee8a089b+a02c3a36/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_9abf1a24d09eee8a089b+a02c3a36/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..5726abc7d1d8c52fa95bc7919439a23a23fe3b9a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_9abf1a24d09eee8a089b+a02c3a36/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_9abf1a24d09eee8a089b+a02c3a36/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_9abf1a24d09eee8a089b+a02c3a36/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..369384d427240466c4c7f473667e3aa6734cc089 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_9abf1a24d09eee8a089b+a02c3a36/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84a477f8b50b9be22f54776ff24af864b78e6ee9c58ecf43790250f183eaba4b +size 1881525 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_9abf1a24d09eee8a089b+a02c3a36/model.log b/neuronxcc-2.21.33363.0+82129205/MODULE_9abf1a24d09eee8a089b+a02c3a36/model.log new file mode 100644 index 0000000000000000000000000000000000000000..8de04a42f25a869d18620da058893d56c484372a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_9abf1a24d09eee8a089b+a02c3a36/model.log @@ -0,0 +1,2 @@ +Failed compilation with ['neuronx-cc', 'compile', '--framework=XLA', '/tmp/nxd_model/token_generation/_tp0_bk0/model.MODULE_9abf1a24d09eee8a089b+a02c3a36.hlo_module.pb', '--output', '/tmp/nxd_model/token_generation/_tp0_bk0/model.MODULE_9abf1a24d09eee8a089b+a02c3a36.neff', '--target=trn1', '--auto-cast=none', '--model-type=transformer', '--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ', '-O2', '--lnc=1', '--logfile=/tmp/nxd_model/token_generation/_tp0_bk0/log-neuron-cc.txt', '--enable-internal-neff-wrapper', '--verbose=35']: 2026-01-26T08:21:13Z 2026-01-26 08:21:13.680235: F hilo/hlo_passes/NeuronHloVerifier.cc:504] [ERROR] [NCC_VRF009] Memory requirement exceeds target architecture's HBM limit. Needed 146476122136 bytes (136 GB) vs. available 17179869184 bytes (16 GB). TIP: Consider using smaller batches or applying model parallelism + diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_9b81a779cf3ae3a12644+149cbfff/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_9b81a779cf3ae3a12644+149cbfff/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..5ed218758630ff325a9e7a1ab9934d6b338ac971 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_9b81a779cf3ae3a12644+149cbfff/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--enable-saturate-infinity", "--auto-cast=none", "--model-type=transformer", "-O1", "--logfile=/tmp/nxdi_test_66b71490-01f8-452c-9422-3a2872d25f2f/compiler_workdir/DecoderLayerWrapper/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_9b81a779cf3ae3a12644+149cbfff/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_9b81a779cf3ae3a12644+149cbfff/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_9b81a779cf3ae3a12644+149cbfff/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_9b81a779cf3ae3a12644+149cbfff/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..8e20bd811466212d95884a7f4fabaa750266df60 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_9b81a779cf3ae3a12644+149cbfff/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a658223854590b04ecc83a4b4f7c71c554737aff1f655391d4dff954e553213b +size 15848 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_9b81a779cf3ae3a12644+149cbfff/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_9b81a779cf3ae3a12644+149cbfff/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..b2c5e164a2375aa1553f596172d723afa103a5c5 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_9b81a779cf3ae3a12644+149cbfff/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f4e8970db7d868e6a9d2a031f44f4a53fbee931f3db11f7d4092243b28f4b43 +size 400384 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_9b81a779cf3ae3a12644+149cbfff/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_9b81a779cf3ae3a12644+149cbfff/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..719fc7f880e39f75e239ca1d2b27f96187fd29c7 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_9b81a779cf3ae3a12644+149cbfff/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1eb975d2c5b365e6fc9656ee39af4fb6dc314938c001baaf58d5e79a9324bf56 +size 406082 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_9bc06d024b9ce47e5f56+24129607/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_9bc06d024b9ce47e5f56+24129607/model.hlo_module.pb index 2dfe28bd941cdcb1aa0cd8e62b7727c1b2ce8f58..78b5cc8665d05cb8f7c7db976481945ecb1bb354 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_9bc06d024b9ce47e5f56+24129607/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_9bc06d024b9ce47e5f56+24129607/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:dfa7ee587c6dd7eb719c810d0b3390042fe6e1ba6c8c33b36d4f10a723820f13 +oid sha256:18debfa97c09c988925a1aaaa8b9c0f8f4cd2b025cbeb08d7ef3bfc4ec9a865f size 509380 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_9bc06d024b9ce47e5f56+24129607/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_9bc06d024b9ce47e5f56+24129607/model.neff index 9120cd17e6add4b59847b4c481e64723b78e789d..c410473e6bd09ffec233ea46ca33324c0cddd158 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_9bc06d024b9ce47e5f56+24129607/model.neff +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_9bc06d024b9ce47e5f56+24129607/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:6fcc51a8a2631ef64a3fc55d99615f28707984ec5d38a3df36fa25006a98fe9a +oid sha256:693b83d4f6771c87b8387a60f6b448121dd1c389524ed32f8e1e427f5e1aaacd size 41585664 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_9c53a5ac284b649e893b+a02c3a36/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_9c53a5ac284b649e893b+a02c3a36/model.neff index 97ce758dae65295731f1803d803ded3f316ad263..6dfc3b39a64ae6384a22e8750bf1a363f6cca3e8 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_9c53a5ac284b649e893b+a02c3a36/model.neff +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_9c53a5ac284b649e893b+a02c3a36/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:4abcbcd9ed97fc54df10216f947fd987bb4a49d0d9dd32dcb0020f5700e0505a +oid sha256:6b700e53c7323708f3c63e59bb1860f7782dbeb3d0a487869aa5f4ab23989151 size 6933504 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_9c53a5ac284b649e893b+a02c3a36/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_9c53a5ac284b649e893b+a02c3a36/wrapped_neff.hlo index da9e6f6ac2c6cbf41e43d04854bdf148e6d137e4..8a3086feba376f428e59e75565e23ec53bf01736 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_9c53a5ac284b649e893b+a02c3a36/wrapped_neff.hlo +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_9c53a5ac284b649e893b+a02c3a36/wrapped_neff.hlo @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:6c552fcec7dd7ab6d4bc6aa95ba48435854f7a8c7ced6894a50ab596ef3526e5 +oid sha256:699ac7e338dc0f77e05957f9d7f60b222256aea2924dc61b2903f55dc592357f size 7117697 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_9d52760610a001af812a+f8e6d902/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_9d52760610a001af812a+f8e6d902/model.neff index 0ce3bfe677e37bbe8937405949e98969e95b3235..c64a91bd3edecb0e67429d35330d7e0c16e8b16f 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_9d52760610a001af812a+f8e6d902/model.neff +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_9d52760610a001af812a+f8e6d902/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:0b32b26173495629dd59108bcb4f98b21a4b73aff9e6736bdb979ddb2c118126 +oid sha256:e884a06795f3dbe019d77779bf01db493d426ba8ec0ef1f7465464fa9d361a12 size 646144 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_9f3d72fade252307a3fc+a02c3a36/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_9f3d72fade252307a3fc+a02c3a36/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..5726abc7d1d8c52fa95bc7919439a23a23fe3b9a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_9f3d72fade252307a3fc+a02c3a36/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_9f3d72fade252307a3fc+a02c3a36/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_9f3d72fade252307a3fc+a02c3a36/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_9f3d72fade252307a3fc+a02c3a36/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_9f3d72fade252307a3fc+a02c3a36/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..0174d999b5d3a7737c499a9002b9ca3661cfae6b --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_9f3d72fade252307a3fc+a02c3a36/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57707ea0510b8582bd32bc5b13de9eb9d483735f61fec6bb308f8ece555c4c81 +size 59731 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_9f3d72fade252307a3fc+a02c3a36/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_9f3d72fade252307a3fc+a02c3a36/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..c810d1ee34bbb8414aa1bc528489de8382505e8c --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_9f3d72fade252307a3fc+a02c3a36/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfaebe68764eba12ec938070782a5410f49c1109a4889bdc9eb07c3727d5278e +size 1229824 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_9f3d72fade252307a3fc+a02c3a36/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_9f3d72fade252307a3fc+a02c3a36/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..1cb496b583cfc2f7a19bc99a8fa349f3037912e1 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_9f3d72fade252307a3fc+a02c3a36/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70ca60fc923b033644b2f54e587d2bb67ea257d8eb0570ba69b67a6f98e555f7 +size 1236627 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_a0467b8b82934a24d142+a02c3a36/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_a0467b8b82934a24d142+a02c3a36/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..5726abc7d1d8c52fa95bc7919439a23a23fe3b9a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_a0467b8b82934a24d142+a02c3a36/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_a0467b8b82934a24d142+a02c3a36/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_a0467b8b82934a24d142+a02c3a36/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_a0467b8b82934a24d142+a02c3a36/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_a0467b8b82934a24d142+a02c3a36/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..4a170d38a283bc10333e440270f4979f207bfebd --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_a0467b8b82934a24d142+a02c3a36/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b570926ce0fcfd782ef61d818285f77f7df61321cfef5c4f1085b51b81d2a1a +size 588406 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_a0467b8b82934a24d142+a02c3a36/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_a0467b8b82934a24d142+a02c3a36/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..428aba0b0b297a55a092a9ba23188f5391380713 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_a0467b8b82934a24d142+a02c3a36/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0bdb7fe0707deec155b675d44f17cb110f8403fae5b7b04cac215a09d2eb7317 +size 1926144 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_a0467b8b82934a24d142+a02c3a36/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_a0467b8b82934a24d142+a02c3a36/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..c76ff560b0c347187495ee9aceae807d947cebe1 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_a0467b8b82934a24d142+a02c3a36/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5594ea63388e063d2549be4063f6717b9f3e66c58b9211cc28d7d9772cdc8ffd +size 2082478 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_aa3ef3e7a5cba473337f+1dee5e5e/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_aa3ef3e7a5cba473337f+1dee5e5e/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..380687684013c9625ec4d33ddcb58289816c6971 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_aa3ef3e7a5cba473337f+1dee5e5e/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--enable-saturate-infinity", "--auto-cast=none", "--model-type=transformer", "-O1", "--logfile=/tmp/nxdi_test_5eff1cd4-0774-49e6-b0fe-0cbca7f78a40/compiler_workdir/DecoderLayerWrapper/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_aa3ef3e7a5cba473337f+1dee5e5e/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_aa3ef3e7a5cba473337f+1dee5e5e/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_aa3ef3e7a5cba473337f+1dee5e5e/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_aa3ef3e7a5cba473337f+1dee5e5e/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..24059d82bbcd149441306f8c07104e0d1a528b8d --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_aa3ef3e7a5cba473337f+1dee5e5e/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ffcb69581a275910194c1f9da6e6f165815ff451ce0b8fc2a627210726a1426a +size 14480 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_aa3ef3e7a5cba473337f+1dee5e5e/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_aa3ef3e7a5cba473337f+1dee5e5e/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..8c21921aeb60871ffaec1e009e5d3867b3ce93e4 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_aa3ef3e7a5cba473337f+1dee5e5e/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f1757f5a33326acc510330c786d60f5f8564b1720636e0017c4c2f35c581e64 +size 267264 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_aa3ef3e7a5cba473337f+1dee5e5e/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_aa3ef3e7a5cba473337f+1dee5e5e/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..248fc2e73b9c46ad9b921dd48930374be4230a79 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_aa3ef3e7a5cba473337f+1dee5e5e/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e2d366cbcf518efce079ef9b1ef4a89217819dafbbde0fa2f435082e5ba591d +size 272962 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_ab1b160b3d8fa09ed76e+a02c3a36/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_ab1b160b3d8fa09ed76e+a02c3a36/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..5726abc7d1d8c52fa95bc7919439a23a23fe3b9a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_ab1b160b3d8fa09ed76e+a02c3a36/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_ab1b160b3d8fa09ed76e+a02c3a36/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_ab1b160b3d8fa09ed76e+a02c3a36/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_ab1b160b3d8fa09ed76e+a02c3a36/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_ab1b160b3d8fa09ed76e+a02c3a36/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..4aad113904f040ffd01d80cd1b899e3cfb94c3e0 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_ab1b160b3d8fa09ed76e+a02c3a36/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ae2066b3bb7b9d1cc6e9185d24d7392d458203fe036cc1c8c1f35dea98d9737 +size 59654 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_ab1b160b3d8fa09ed76e+a02c3a36/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_ab1b160b3d8fa09ed76e+a02c3a36/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..dd0bfee7e001a6699f9becd75060396331dd14c5 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_ab1b160b3d8fa09ed76e+a02c3a36/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cdb3c91a397a44a1b967849a224e0cfff34a0cd166d211d24bf0e8b509845063 +size 1158144 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_ab1b160b3d8fa09ed76e+a02c3a36/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_ab1b160b3d8fa09ed76e+a02c3a36/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..6f4f9a89e02b6a5c299298d112f3656a0ca349cc --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_ab1b160b3d8fa09ed76e+a02c3a36/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7cc6858d30d31f2d0d86b83d99a1b81d2454280081f8cd3cdec45d9628d9de33 +size 1164929 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_ad7c8ac474ec4bdeae52+24129607/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_ad7c8ac474ec4bdeae52+24129607/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_ad7c8ac474ec4bdeae52+24129607/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_ad7c8ac474ec4bdeae52+24129607/model.hlo_module.pb index 748c409b8729fc9463051767dad159bc8d1c7cdb..b928c9a2f728815784f9ace1a24d0c5aa729fc33 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_ad7c8ac474ec4bdeae52+24129607/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_ad7c8ac474ec4bdeae52+24129607/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:fdb4342d18a3192874a17bcc4ddeadc592624a4db04b0444c931b0f2dc4e6d9b +oid sha256:3f1d26ab78f5dcdc49abcc6e752412007c6cc8d21445bfa1a0078c7ec9c8d610 size 761066 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_ad7c8ac474ec4bdeae52+24129607/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_ad7c8ac474ec4bdeae52+24129607/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..10acb8f92e98f282b39955520db7d6e3a2c0ba7d --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_ad7c8ac474ec4bdeae52+24129607/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45d76b90151b45d3386d3374c30a864e389e6223be192d8cc711f967ba42673f +size 12504064 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_adf2c812522e586cea39+24129607/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_adf2c812522e586cea39+24129607/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..836724f44545ce0dedda1521fd4c623a6ea8ec72 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_adf2c812522e586cea39+24129607/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_adf2c812522e586cea39+24129607/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_adf2c812522e586cea39+24129607/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_adf2c812522e586cea39+24129607/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_adf2c812522e586cea39+24129607/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..069f3f85eb5a96f2866ae1e359efc25a8428a78f --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_adf2c812522e586cea39+24129607/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:579f0a15276a65db703800e734c1dab4fb8f58f59b8118b3fcf606d8e4cf1a9a +size 911029 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_adf2c812522e586cea39+24129607/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_adf2c812522e586cea39+24129607/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..a6315cddd37c7981cb32418f306a6817f9b545d4 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_adf2c812522e586cea39+24129607/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98b5b19e79f8c1f78243eaec7164e5c23124c9f3227d191bfccae54fafa76baf +size 11705344 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_b0d91b1607c7df83fc7f+a02c3a36/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_b0d91b1607c7df83fc7f+a02c3a36/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..5726abc7d1d8c52fa95bc7919439a23a23fe3b9a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_b0d91b1607c7df83fc7f+a02c3a36/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_b0d91b1607c7df83fc7f+a02c3a36/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_b0d91b1607c7df83fc7f+a02c3a36/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_b0d91b1607c7df83fc7f+a02c3a36/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_b0d91b1607c7df83fc7f+a02c3a36/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..7e9d26beec0f977cbffadaa07e072b813d5c384c --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_b0d91b1607c7df83fc7f+a02c3a36/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3d672c3848f8e54a8c124e63aef9b6c46e8501de480a8030d8cf09134de5c5b +size 418223 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_b0d91b1607c7df83fc7f+a02c3a36/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_b0d91b1607c7df83fc7f+a02c3a36/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..25ea89c3f2b0853afe69b2448b7885064f574ce7 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_b0d91b1607c7df83fc7f+a02c3a36/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f47aecd094b3b8cb82df7c967651758b567bcccf097b29eba650557745c3e60e +size 3093504 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_b0d91b1607c7df83fc7f+a02c3a36/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_b0d91b1607c7df83fc7f+a02c3a36/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..22e5f487b5c845a3f3f69935816d6a80430a4d35 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_b0d91b1607c7df83fc7f+a02c3a36/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:265f665976eca094764e237dff906e3564a680b7bd52746a2d9e2c0bdcb992b7 +size 3167748 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_b1cd3aa0106a6921386d+a02c3a36/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_b1cd3aa0106a6921386d+a02c3a36/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..5726abc7d1d8c52fa95bc7919439a23a23fe3b9a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_b1cd3aa0106a6921386d+a02c3a36/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_b1cd3aa0106a6921386d+a02c3a36/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_b1cd3aa0106a6921386d+a02c3a36/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_b1cd3aa0106a6921386d+a02c3a36/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_b1cd3aa0106a6921386d+a02c3a36/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..dfcb34dedfbd344ffcdb8170137c2132b684f2d0 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_b1cd3aa0106a6921386d+a02c3a36/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c5bdaf7ab1c592348c87b32d7abd5f29334e7ba4607e47b500beded5fa611d2 +size 760831 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_b1cd3aa0106a6921386d+a02c3a36/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_b1cd3aa0106a6921386d+a02c3a36/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..de6aa0a026054cb3bc1a3832903adad67a422864 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_b1cd3aa0106a6921386d+a02c3a36/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:312ef0522c097b8a8ea70483f3ba91f2faaaa1cb53fd0579b80af8ba3520ac59 +size 9165824 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_b1cd3aa0106a6921386d+a02c3a36/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_b1cd3aa0106a6921386d+a02c3a36/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..4f078d8d757930e2c29bbe021816285dccd977fe --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_b1cd3aa0106a6921386d+a02c3a36/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca7519b76e0ce31948d91cc3a9cd78e334016664da913a256f822cc179fe0d71 +size 9313782 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_bb3cafc9659e6ad373c7+24129607/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_bb3cafc9659e6ad373c7+24129607/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..836724f44545ce0dedda1521fd4c623a6ea8ec72 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_bb3cafc9659e6ad373c7+24129607/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_bb3cafc9659e6ad373c7+24129607/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_bb3cafc9659e6ad373c7+24129607/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_bb3cafc9659e6ad373c7+24129607/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_bb3cafc9659e6ad373c7+24129607/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..c954f65885fbf67996673a116e3777ee791b82dc --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_bb3cafc9659e6ad373c7+24129607/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d167b7fc9794adb3af4bedd335c8d928c11cd023681a9cc51494d42f7eba8fbe +size 392910 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_bb3cafc9659e6ad373c7+24129607/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_bb3cafc9659e6ad373c7+24129607/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..9287b45323238faafca6467dfa67dbcee21710cf --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_bb3cafc9659e6ad373c7+24129607/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06c6ca430e3bc3418f1bc987b6baf586e5e27fc5fefa0cfa5b6f22fa338dbb5f +size 41626624 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_bc57576bbc26e14097b8+24129607/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_bc57576bbc26e14097b8+24129607/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..836724f44545ce0dedda1521fd4c623a6ea8ec72 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_bc57576bbc26e14097b8+24129607/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_bc57576bbc26e14097b8+24129607/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_bc57576bbc26e14097b8+24129607/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_bc57576bbc26e14097b8+24129607/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_bc57576bbc26e14097b8+24129607/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..c77f5df526ba05fb188bb445988daed2eac3f55f --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_bc57576bbc26e14097b8+24129607/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b72501a2436298494e06c9346dcf952b606e8bb1d9659729c4e446acdef0c10 +size 61748 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_bc57576bbc26e14097b8+24129607/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_bc57576bbc26e14097b8+24129607/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..5bb6c10dd73fea0ec916cc9d0d0c8279ba95d765 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_bc57576bbc26e14097b8+24129607/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63216654893520c4b09815b4cd28dd514a75912210c304115daf0619c13add00 +size 1874944 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_bdefd4948bd161bfec05+24129607/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_bdefd4948bd161bfec05+24129607/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..836724f44545ce0dedda1521fd4c623a6ea8ec72 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_bdefd4948bd161bfec05+24129607/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_bdefd4948bd161bfec05+24129607/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_bdefd4948bd161bfec05+24129607/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_bdefd4948bd161bfec05+24129607/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_bdefd4948bd161bfec05+24129607/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..fdde262c7dcc3ac858dc4243924332b441864aa9 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_bdefd4948bd161bfec05+24129607/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7ead07711618b2216d43d45a7485d58adac3a9fb9d0d2c142df842d47aa8a8f +size 72714 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_bdefd4948bd161bfec05+24129607/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_bdefd4948bd161bfec05+24129607/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..1dde68bbd6197009c13079bbfe1c41b7b0e00ab2 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_bdefd4948bd161bfec05+24129607/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f460154eaf75e5dcc590ead1a47f47f1b163721d37f8a8a7a176cd9927f1310 +size 27771904 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_c26856b929d58ebddc23+24129607/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_c26856b929d58ebddc23+24129607/model.hlo_module.pb index 32942c066618e9d65cb12b4e62d9a5097ba42e3a..2490c1fe7fef9d747c24ae4daa81eb948a183fc1 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_c26856b929d58ebddc23+24129607/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_c26856b929d58ebddc23+24129607/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:eb45ccdda05a2a2ee1cf89ec265cdb0766071dc0512a114d5a7a007c1d523b9a +oid sha256:ba30bac1303e4d846c40c65f8e4d8a644794b6964038372ff73e155714762bdc size 83504 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_c26856b929d58ebddc23+24129607/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_c26856b929d58ebddc23+24129607/model.neff index 0bc673303d2f6a85cb41332e26052b5a2a238a8e..3612ae764be895e726e58f5ca7f02b1d988c5d24 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_c26856b929d58ebddc23+24129607/model.neff +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_c26856b929d58ebddc23+24129607/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:36c9055608092f4be44de678aa77e873c858f75429d901c3851babbebe581dc4 +oid sha256:9ba77eb824772e994518cb8cae28e31fdb69af6393a0fac70a28fb9d3d5f6d51 size 328704 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_c47d987826f446f9955b+a02c3a36/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_c47d987826f446f9955b+a02c3a36/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..5726abc7d1d8c52fa95bc7919439a23a23fe3b9a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_c47d987826f446f9955b+a02c3a36/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_c47d987826f446f9955b+a02c3a36/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_c47d987826f446f9955b+a02c3a36/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_c47d987826f446f9955b+a02c3a36/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_c47d987826f446f9955b+a02c3a36/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..23f8ecb1751ba3f38c722fb4bd8ecb2ae91bfc72 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_c47d987826f446f9955b+a02c3a36/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d09bed673b620f2bc20e66f30cf1f25a33e824c1d0af763597a7aaa1c1a8195 +size 1994386 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_c47d987826f446f9955b+a02c3a36/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_c47d987826f446f9955b+a02c3a36/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..ba03e7a16b808e9645f0925271e612adc0eae1b5 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_c47d987826f446f9955b+a02c3a36/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:edf8d58670a095b6b0f15d26459c6c25d18def69ed46c14e80be33bf830698e9 +size 10732544 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_c47d987826f446f9955b+a02c3a36/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_c47d987826f446f9955b+a02c3a36/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..25b878daa7c1e39ec43651fbd38cb4df0d8a2071 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_c47d987826f446f9955b+a02c3a36/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6db53075f5ae7da7719da645e18e7318888b4d16083af2d90dbd1ceff94dc28 +size 11101510 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_c9952f69ef9cfc495903+a02c3a36/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_c9952f69ef9cfc495903+a02c3a36/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..5726abc7d1d8c52fa95bc7919439a23a23fe3b9a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_c9952f69ef9cfc495903+a02c3a36/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_c9952f69ef9cfc495903+a02c3a36/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_c9952f69ef9cfc495903+a02c3a36/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_c9952f69ef9cfc495903+a02c3a36/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_c9952f69ef9cfc495903+a02c3a36/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..61972ab77477b19dee312608af414e380c48b7e9 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_c9952f69ef9cfc495903+a02c3a36/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:613e342a683da59642c46d2dc2e949301ad5e16ba24ad1cf98df935a5a3b8b2a +size 380010 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_c9952f69ef9cfc495903+a02c3a36/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_c9952f69ef9cfc495903+a02c3a36/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..54571f1a62ab2ebf6901aac0c1c6a332e7d41837 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_c9952f69ef9cfc495903+a02c3a36/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2637194e76cbb4b312631400300d49273ed6a87940f9f2c4dd3d3ab7526ef24 +size 1926144 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_c9952f69ef9cfc495903+a02c3a36/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_c9952f69ef9cfc495903+a02c3a36/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..c5621a25f9695bedf6e65a3fa70ee50bc4d1a723 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_c9952f69ef9cfc495903+a02c3a36/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e16b82265d54b66fd5d81b88e5f78f95b11398a097ded0670fd5b698b9482ac +size 2019200 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_cb6b880fc977b7ae4bda+24129607/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_cb6b880fc977b7ae4bda+24129607/model.hlo_module.pb index 28ee1398fee500d4fd4ce4bd55db6a4f4eb78dba..bc9cfc879012a007d2e0baa000a3b24812f240e8 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_cb6b880fc977b7ae4bda+24129607/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_cb6b880fc977b7ae4bda+24129607/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:5d12d23545ccb2c03c3978d33636c9589b7b6da434697f7b5507f28fd0062075 +oid sha256:488ac1572ce8e1b1ff2d6254afaf39e40218d5b117f226473da52d9ac7929c91 size 81516 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_cb6b880fc977b7ae4bda+24129607/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_cb6b880fc977b7ae4bda+24129607/model.neff index 0ebe76da33da7f535289f868ecf2170765c2801f..340e7cce3851d2abdb5ee14285f6645d1dbe5088 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_cb6b880fc977b7ae4bda+24129607/model.neff +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_cb6b880fc977b7ae4bda+24129607/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:1bede074a656737d1b8bb3a4c99933c04b3172880e2528fa29965fad3b087226 +oid sha256:50269c93a4f89b9cfe1a88721a71f9262fee57c37777da36ef0127d536e4c0ee size 267264 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_cbda8a59038c9c5ffc17+a02c3a36/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_cbda8a59038c9c5ffc17+a02c3a36/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..5726abc7d1d8c52fa95bc7919439a23a23fe3b9a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_cbda8a59038c9c5ffc17+a02c3a36/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_cbda8a59038c9c5ffc17+a02c3a36/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_cbda8a59038c9c5ffc17+a02c3a36/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_cbda8a59038c9c5ffc17+a02c3a36/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_cbda8a59038c9c5ffc17+a02c3a36/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..64028cc78541c1833466a343e251d2e19d025203 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_cbda8a59038c9c5ffc17+a02c3a36/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e70386c0d4c7acaf312dfe4908f119fe46d817ab3d82394d549c5ed84707d551 +size 80382 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_cbda8a59038c9c5ffc17+a02c3a36/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_cbda8a59038c9c5ffc17+a02c3a36/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..9f774c385f737da46e6a63322211a66d9bb89832 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_cbda8a59038c9c5ffc17+a02c3a36/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a582473554f7c0b0ebb4a0e019ca598c2fa03deecb64203e0d069bbbe3f4ec90 +size 216064 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_cbda8a59038c9c5ffc17+a02c3a36/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_cbda8a59038c9c5ffc17+a02c3a36/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..08f24903a066f359551b07369d33b83b641effb7 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_cbda8a59038c9c5ffc17+a02c3a36/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98b553f35aae2cec12206bcc2a8f472dfbef4f963b3c195462d31f6246f0eaed +size 224412 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_ccc2d4abbb67d5b7286f+a02c3a36/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_ccc2d4abbb67d5b7286f+a02c3a36/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..5726abc7d1d8c52fa95bc7919439a23a23fe3b9a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_ccc2d4abbb67d5b7286f+a02c3a36/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_ccc2d4abbb67d5b7286f+a02c3a36/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_ccc2d4abbb67d5b7286f+a02c3a36/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_ccc2d4abbb67d5b7286f+a02c3a36/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_ccc2d4abbb67d5b7286f+a02c3a36/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..df42b573cf644a6ce1513ac52c69b8e91fdcb2c1 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_ccc2d4abbb67d5b7286f+a02c3a36/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9e6d2246d093ac5f9592eddf34f50ac231965a42a87f664d94749d61a0f5c7a +size 792713 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_ccc2d4abbb67d5b7286f+a02c3a36/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_ccc2d4abbb67d5b7286f+a02c3a36/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..0b425443c8ae76f06341228f60cc5a128922788a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_ccc2d4abbb67d5b7286f+a02c3a36/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:485fcab1a5e44600370abc68d9e79dd52e9434d1d4501f9b7207e9d232e5322c +size 3154944 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_ccc2d4abbb67d5b7286f+a02c3a36/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_ccc2d4abbb67d5b7286f+a02c3a36/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..e3e1fd6dfc4e2cef6fb09072f7f7331f0d216d39 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_ccc2d4abbb67d5b7286f+a02c3a36/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6d8b050b8d90396adcf804483c19946564cbb26fabebb488ed32aaa964280c3 +size 3303227 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_ce1ed82235621875fbad+eef3363a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_ce1ed82235621875fbad+eef3363a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..e3df2e28f84ee07f1d05aca9d95201878bba07ad --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_ce1ed82235621875fbad+eef3363a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--enable-saturate-infinity", "--auto-cast=none", "--model-type=transformer", "-O1", "--logfile=/tmp/nxdi_test_bf789014-cacd-4464-891b-f97854c023f4/compiler_workdir/DecoderLayerWrapper/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_ce1ed82235621875fbad+eef3363a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_ce1ed82235621875fbad+eef3363a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_ce1ed82235621875fbad+eef3363a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_ce1ed82235621875fbad+eef3363a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..90dd1f7c4841c9bf4e1b3b5cd26795ff877acf47 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_ce1ed82235621875fbad+eef3363a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4e6fcff8e146cbec5d2744e61c914a8b79121a10961ed1a82b5edbcf55083cb +size 21842 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_ce1ed82235621875fbad+eef3363a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_ce1ed82235621875fbad+eef3363a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..3a6b888b1d43f7bf289b61c7d0fa2ec06153b855 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_ce1ed82235621875fbad+eef3363a/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6896a6b5cab3b471d621790289a4b3b41d13d797433ed9d07af53c3eb91fbd84 +size 5356544 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_ce1ed82235621875fbad+eef3363a/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_ce1ed82235621875fbad+eef3363a/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..11bdbf498c796a146ff0ccdd122f7ea0a98f3bc8 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_ce1ed82235621875fbad+eef3363a/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a1d317d953a5e8c30ad9b42984eed844df51c7d93d530e02f2c822662d9bcc5 +size 5362101 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_ce8e893faf0f99f6c70b+f0422fe3/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_ce8e893faf0f99f6c70b+f0422fe3/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..af568624bc02bd975658341e36d6c815db86a60d --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_ce8e893faf0f99f6c70b+f0422fe3/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--enable-saturate-infinity", "--auto-cast=none", "--model-type=transformer", "-O1", "--logfile=/tmp/nxdi_test_5dcb89cf-270d-4667-9432-984d55b8c3f5/compiler_workdir/DecoderLayerWrapper/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_ce8e893faf0f99f6c70b+f0422fe3/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_ce8e893faf0f99f6c70b+f0422fe3/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_ce8e893faf0f99f6c70b+f0422fe3/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_ce8e893faf0f99f6c70b+f0422fe3/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..1c28a9b47eb52c8980bc7eca3d110647e87316ad --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_ce8e893faf0f99f6c70b+f0422fe3/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ddba865d08645ac2ad17638eae6847fe07b8239f95c55b373d3baacc85e1bb67 +size 15848 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_ce8e893faf0f99f6c70b+f0422fe3/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_ce8e893faf0f99f6c70b+f0422fe3/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..86ff56d17b4da47b7fb323bd1121017bc3df534e --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_ce8e893faf0f99f6c70b+f0422fe3/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ae9b6da11c38717d80c090b6d9fd4be81c5e795acf971ce4a0da1697db5f1de +size 2192384 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_ce8e893faf0f99f6c70b+f0422fe3/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_ce8e893faf0f99f6c70b+f0422fe3/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..0e7604a9a5d376236f0050f44935c12d15a6f1fb --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_ce8e893faf0f99f6c70b+f0422fe3/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57f0a1cf456010e1caab21cba995b542c04c154b3f8845962d8a4ee3fc75646a +size 2198099 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_d053e5a2bdf45f8b64ef+a02c3a36/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_d053e5a2bdf45f8b64ef+a02c3a36/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..5726abc7d1d8c52fa95bc7919439a23a23fe3b9a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_d053e5a2bdf45f8b64ef+a02c3a36/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_d053e5a2bdf45f8b64ef+a02c3a36/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_d053e5a2bdf45f8b64ef+a02c3a36/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_d053e5a2bdf45f8b64ef+a02c3a36/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_d053e5a2bdf45f8b64ef+a02c3a36/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..eed523bea6eeaa784de41539eea2f866aeb3271f --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_d053e5a2bdf45f8b64ef+a02c3a36/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ac2983af5e71f668da961091ac3df341f2faebdcc5decdbf94e2a015b272ad8 +size 378995 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_d053e5a2bdf45f8b64ef+a02c3a36/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_d053e5a2bdf45f8b64ef+a02c3a36/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..874485ac17f12cdf2fecf1a47e7a0a6630e501c4 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_d053e5a2bdf45f8b64ef+a02c3a36/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2f7b39fec1e16b5f026adada7723d0bb6add3f42dec771d0a4f85ed419ee716 +size 1936384 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_d053e5a2bdf45f8b64ef+a02c3a36/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_d053e5a2bdf45f8b64ef+a02c3a36/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..3894d7eb038a41564885f5529badc4c6d7360bfc --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_d053e5a2bdf45f8b64ef+a02c3a36/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:741c44dc2f1de52d46c5aa9dadfb01cd7bb8b8cfd898a8c7604c596fb1149f93 +size 2010496 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_d1b92df9d7d3f05023d5+6df9a02b/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_d1b92df9d7d3f05023d5+6df9a02b/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..49097c815276b563e3e7373dda1638e0a7f90ae2 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_d1b92df9d7d3f05023d5+6df9a02b/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--enable-saturate-infinity", "--auto-cast=none", "--model-type=transformer", "-O1", "--logfile=/tmp/nxdi_test_a240c504-8069-4000-a8e8-5c5818cb9681/compiler_workdir/DecoderLayerWrapper/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_d1b92df9d7d3f05023d5+6df9a02b/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_d1b92df9d7d3f05023d5+6df9a02b/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_d1b92df9d7d3f05023d5+6df9a02b/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_d1b92df9d7d3f05023d5+6df9a02b/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..39c703ed34d8f3f3b6e33c142a18ed4c91041384 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_d1b92df9d7d3f05023d5+6df9a02b/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db79c5bb71c6b8dc88d476504febd997f95f956e0a1678b46d3d832716251a63 +size 15848 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_d1b92df9d7d3f05023d5+6df9a02b/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_d1b92df9d7d3f05023d5+6df9a02b/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..1001790706334c9bc70a31499fe906fcc657fdff --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_d1b92df9d7d3f05023d5+6df9a02b/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c185d431016cc4a86a6982b1ab4a60a042770b09ddc41532667b0504a678832 +size 830464 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_d1b92df9d7d3f05023d5+6df9a02b/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_d1b92df9d7d3f05023d5+6df9a02b/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..f0ac33d6148585fc4403627b0b4c1f113f77b1a7 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_d1b92df9d7d3f05023d5+6df9a02b/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6bf54ab7aae70ec9125d209918efb7292ac78e5d595bb5fbb381011f479e566f +size 836176 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_d557da6777202c62f6c1+a02c3a36/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_d557da6777202c62f6c1+a02c3a36/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..5726abc7d1d8c52fa95bc7919439a23a23fe3b9a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_d557da6777202c62f6c1+a02c3a36/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_d557da6777202c62f6c1+a02c3a36/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_d557da6777202c62f6c1+a02c3a36/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_d557da6777202c62f6c1+a02c3a36/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_d557da6777202c62f6c1+a02c3a36/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..d4fb10dbc6d3e0d1a32651ea1f061079efec21ab --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_d557da6777202c62f6c1+a02c3a36/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4af49e736f7ed19546d336775faa29cc9a06e62099771c342ebe8a4d13d18ed +size 59654 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_d557da6777202c62f6c1+a02c3a36/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_d557da6777202c62f6c1+a02c3a36/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..d47cde2022167a6c8b18486304b6b9f538017225 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_d557da6777202c62f6c1+a02c3a36/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50330310fedd411eace7dfb0a6e835556ce261ab1fbba6ef9200d325a687af2c +size 1065984 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_d557da6777202c62f6c1+a02c3a36/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_d557da6777202c62f6c1+a02c3a36/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..cd652536b30f992b06656d9331fae9e94c7b4741 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_d557da6777202c62f6c1+a02c3a36/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:466eee1c505ec21269602bd913fd54696e096bb799760995b7a0838a74fff908 +size 1072769 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_d5ee7d5ab32cdaaa0ee0+677eeb9d/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_d5ee7d5ab32cdaaa0ee0+677eeb9d/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..ae7e0c6790082c43cd145aae8cc7e3cc89e15ca8 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_d5ee7d5ab32cdaaa0ee0+677eeb9d/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/speculation_model/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_d5ee7d5ab32cdaaa0ee0+677eeb9d/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_d5ee7d5ab32cdaaa0ee0+677eeb9d/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_d5ee7d5ab32cdaaa0ee0+677eeb9d/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_d5ee7d5ab32cdaaa0ee0+677eeb9d/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..e1d47503a6147d6660f78d4a89f05f4657bfe8b7 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_d5ee7d5ab32cdaaa0ee0+677eeb9d/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7707ed593b1cd987d6610a983e0d581ebae6f51eba46aec434d58c14dd2eec6 +size 415213 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_d5ee7d5ab32cdaaa0ee0+677eeb9d/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_d5ee7d5ab32cdaaa0ee0+677eeb9d/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..b838707475a68e013910d58a69222014ec213cde --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_d5ee7d5ab32cdaaa0ee0+677eeb9d/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e4bb8ba872a4dc122627fe81dedb8993987f8f4aa336be999d966dc1e45787c +size 3666944 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_d97f2a797158f5574518+24129607/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_d97f2a797158f5574518+24129607/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..836724f44545ce0dedda1521fd4c623a6ea8ec72 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_d97f2a797158f5574518+24129607/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_d97f2a797158f5574518+24129607/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_d97f2a797158f5574518+24129607/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_d97f2a797158f5574518+24129607/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_d97f2a797158f5574518+24129607/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..95b1c06b45aff7492a41d6822dd0c0229348e3d8 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_d97f2a797158f5574518+24129607/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a44de1c87fa9bb9536d02720a2897c0c73a82c47f32943898cc7d1148dbf791 +size 2234266 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_d97f2a797158f5574518+24129607/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_d97f2a797158f5574518+24129607/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..86062c36fc6767c46761702164527a2fa0b6e008 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_d97f2a797158f5574518+24129607/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33dff883c03b38028cb31aa2305950e76fa3302e5339298dfd57b989bdfa32da +size 14593024 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_dc7fcef2e19ad392688a+24129607/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_dc7fcef2e19ad392688a+24129607/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..836724f44545ce0dedda1521fd4c623a6ea8ec72 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_dc7fcef2e19ad392688a+24129607/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_dc7fcef2e19ad392688a+24129607/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_dc7fcef2e19ad392688a+24129607/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_dc7fcef2e19ad392688a+24129607/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_dc7fcef2e19ad392688a+24129607/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..b26925848f25079f899f904423b5514397351583 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_dc7fcef2e19ad392688a+24129607/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d79197135d214495e13bdbe0883fd3e9dde45a54149ba177c7d32773488375d0 +size 434848 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_dc7fcef2e19ad392688a+24129607/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_dc7fcef2e19ad392688a+24129607/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..1cc99a40553298ef0dab7e056ec916b1671e0b7a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_dc7fcef2e19ad392688a+24129607/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b25dd3c84d4240f07300673a2919f10729a6e6ece2c1444ec397e737ce1d73ac +size 42179584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_de64a5eb66d5e73e20ff+ee6b6593/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_de64a5eb66d5e73e20ff+ee6b6593/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..95b9d68f51722c435d3c81c7f4c1d83f93a09060 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_de64a5eb66d5e73e20ff+ee6b6593/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--enable-saturate-infinity", "--auto-cast=none", "--model-type=transformer", "-O1", "--logfile=/tmp/nxdi_test_8771a305-6545-4b1f-9aa2-9b616c5ba375/compiler_workdir/DecoderLayerWrapper/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_de64a5eb66d5e73e20ff+ee6b6593/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_de64a5eb66d5e73e20ff+ee6b6593/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_de64a5eb66d5e73e20ff+ee6b6593/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_de64a5eb66d5e73e20ff+ee6b6593/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..0178c3d56ce706eb29ef263fef96f2d4ec891d21 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_de64a5eb66d5e73e20ff+ee6b6593/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a549dd87d6b9d7ef0fd6b25a2d4cc3432ca1059e80b4862da74f5b881b28285 +size 15614 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_de64a5eb66d5e73e20ff+ee6b6593/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_de64a5eb66d5e73e20ff+ee6b6593/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..cfef4eadba2aa48970589ebcd7638e3f3c022b6a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_de64a5eb66d5e73e20ff+ee6b6593/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26ad90824854c905a28ead29a4d1c60ef3cd18f2ebf02130b35a02df4ed9c08f +size 154624 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_de64a5eb66d5e73e20ff+ee6b6593/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_de64a5eb66d5e73e20ff+ee6b6593/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..f234d6ee2ae3ab929c648f4a68e701df573e1d9e --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_de64a5eb66d5e73e20ff+ee6b6593/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27574b8976983e16ea3701002ddf850856b68c0ffd39c60e0d6e3dbef2e51fd9 +size 159439 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_e5486eb6f3f1a553b5f8+ecd1b333/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_e5486eb6f3f1a553b5f8+ecd1b333/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..86042237b9e868290494dac5359d8cc97e8d66d8 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_e5486eb6f3f1a553b5f8+ecd1b333/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--enable-saturate-infinity", "--auto-cast=none", "--model-type=transformer", "-O1", "--logfile=/tmp/nxdi_test_0a7bb8f3-642f-4902-93b5-55b3f79a6d49/compiler_workdir/DecoderLayerWrapper/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_e5486eb6f3f1a553b5f8+ecd1b333/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_e5486eb6f3f1a553b5f8+ecd1b333/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_e5486eb6f3f1a553b5f8+ecd1b333/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_e5486eb6f3f1a553b5f8+ecd1b333/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..c138c5cc140b22fd8230bdcf6ba90d0f0c7d2e8c --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_e5486eb6f3f1a553b5f8+ecd1b333/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5e1fd5981be696e697f349ed0a98b679b7e09aed816f966f8b42b5defc7488c +size 15848 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_e5486eb6f3f1a553b5f8+ecd1b333/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_e5486eb6f3f1a553b5f8+ecd1b333/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..5aba9f14a6e1a6156f6b66585e3be16b56e9ad37 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_e5486eb6f3f1a553b5f8+ecd1b333/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2903e8af6a2b0f680176b2c38e99471c7dc33bb093ab8f1dfb5c6a5e8c65f1f +size 2192384 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_e5486eb6f3f1a553b5f8+ecd1b333/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_e5486eb6f3f1a553b5f8+ecd1b333/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..197e0f812b01831c56ccb34b3421f3104d1612b9 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_e5486eb6f3f1a553b5f8+ecd1b333/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d3a0f79d2e96d7bab5028a83208c5cf93da51dfd99cc7e98a1f4a24469fb5fc +size 2198099 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_e54f2eec2036cfaa2527+a02c3a36/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_e54f2eec2036cfaa2527+a02c3a36/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..5726abc7d1d8c52fa95bc7919439a23a23fe3b9a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_e54f2eec2036cfaa2527+a02c3a36/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_e54f2eec2036cfaa2527+a02c3a36/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_e54f2eec2036cfaa2527+a02c3a36/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_e54f2eec2036cfaa2527+a02c3a36/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_e54f2eec2036cfaa2527+a02c3a36/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..ab6e232e9ee3b133ae3d4a0bd368ac35f0d0320a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_e54f2eec2036cfaa2527+a02c3a36/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2276273abc61e34200c7e5a7de5816a7b24632f44411a30fb9fbe0cd8a2c6025 +size 79532 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_e54f2eec2036cfaa2527+a02c3a36/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_e54f2eec2036cfaa2527+a02c3a36/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..bcb5ecb725258520dd20f292eeeb512e7a5bcb1f --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_e54f2eec2036cfaa2527+a02c3a36/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d1195a8042301d6d00dde4797038105abf5e7b8a8e57b91f5ca4e7018133574 +size 1403904 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_e54f2eec2036cfaa2527+a02c3a36/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_e54f2eec2036cfaa2527+a02c3a36/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..c357a7332b7b2abeab22aa0a138faee89cdeb0e9 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_e54f2eec2036cfaa2527+a02c3a36/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f4882327d38006313e821ec651f69d76aedc7796d87a761b48bd9552c4bd9b0 +size 1415127 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_e899b698a237c528bb16+24129607/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_e899b698a237c528bb16+24129607/model.hlo_module.pb index cf7107baae9339edc2d8373b74081ff19581db39..c8e158507cef0abd568e18481672a47be580132b 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_e899b698a237c528bb16+24129607/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_e899b698a237c528bb16+24129607/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:1250088885cd64fc4a0be3a10d2f8222c991a426632b4d7a86c18a890d6232ff +oid sha256:dbee7375c8021657bbb337b137190e79d46ae75cf40db4df9597daa481da9e5c size 90382 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_e899b698a237c528bb16+24129607/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_e899b698a237c528bb16+24129607/model.neff index 868cb15bc41071fe8d10f01f207a994c89b1e9f5..638d8a898464a976db0604cd8306a7f0af1c1262 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_e899b698a237c528bb16+24129607/model.neff +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_e899b698a237c528bb16+24129607/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:de7fc6b6461262a518d9b4e6d67c1c6fe943b04806e1f726deaf29d599cb1911 +oid sha256:30550222149aae50b173e32adaeec5e384280fdc8f3e65aa0d0a6c4ee049106d size 359424 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_eadbca4e425481d07426+24129607/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_eadbca4e425481d07426+24129607/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..836724f44545ce0dedda1521fd4c623a6ea8ec72 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_eadbca4e425481d07426+24129607/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_eadbca4e425481d07426+24129607/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_eadbca4e425481d07426+24129607/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_eadbca4e425481d07426+24129607/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_eadbca4e425481d07426+24129607/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..5520594aaa25ff8cc0e450c4d88f80a9136f2bec --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_eadbca4e425481d07426+24129607/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ed141f95bc65aaa516c591933deb8e5be01c79c4a6efa2e311512186099619c +size 468573 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_eadbca4e425481d07426+24129607/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_eadbca4e425481d07426+24129607/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..4b104238bb81ed6139ed2789d5af757e2682a05e --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_eadbca4e425481d07426+24129607/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a34840aa752b8ac73e36fcadeddaded78e26f109cbc4b9f7125f902c7d3da820 +size 31048704 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_ebda959e0a7e1b1b3d41+24129607/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_ebda959e0a7e1b1b3d41+24129607/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..836724f44545ce0dedda1521fd4c623a6ea8ec72 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_ebda959e0a7e1b1b3d41+24129607/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_ebda959e0a7e1b1b3d41+24129607/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_ebda959e0a7e1b1b3d41+24129607/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_ebda959e0a7e1b1b3d41+24129607/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_ebda959e0a7e1b1b3d41+24129607/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..3f83206a6e2c54211055572a7acac6c014775542 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_ebda959e0a7e1b1b3d41+24129607/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4872a69eb3a3edd4dfde05804f634e594dd9ac58017d508faa161b8be069e0b2 +size 63363 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_ebda959e0a7e1b1b3d41+24129607/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_ebda959e0a7e1b1b3d41+24129607/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..62ce506aee331c0d9165cbdd886eafc8f7840c4b --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_ebda959e0a7e1b1b3d41+24129607/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:683ab0a15335bdff2fb59a0427242d606838cec00b7709d27b3a91924146ea37 +size 1055744 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_ecafd5c328f53085c3ac+a02c3a36/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_ecafd5c328f53085c3ac+a02c3a36/model.hlo_module.pb index e984f1bfcc67f74c845bbd03e125247152b9b6bc..c871f1164f825b857f1680082a5922e1d8cf255e 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_ecafd5c328f53085c3ac+a02c3a36/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_ecafd5c328f53085c3ac+a02c3a36/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:828b718ac0d544f14a9a683c76b442c49520573027ba2e8347fdd5e79531704b +oid sha256:4288f97159a1a045dfcb075cd63bfa2fe8d84a6eeeadc7e52c2de97d8307c6ab size 702870 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_ecafd5c328f53085c3ac+a02c3a36/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_ecafd5c328f53085c3ac+a02c3a36/model.neff index 52c86daa6454c0a6fc14e3a48c4388125728f9aa..56b89da0bd5ce7a6401c532d3f8961a7911fef83 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_ecafd5c328f53085c3ac+a02c3a36/model.neff +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_ecafd5c328f53085c3ac+a02c3a36/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:531b32643c31f3c4d905200b603578986c7aeea10d903bdc114e433b413ca7b5 +oid sha256:f0602f177b03698dfceb419eddcfa62291769924c4b7b8449abe1406cda3960b size 3503104 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_ecafd5c328f53085c3ac+a02c3a36/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_ecafd5c328f53085c3ac+a02c3a36/wrapped_neff.hlo index 62270876f7386ace9937e0c4f25937387345303c..3859be88d61395072bfd7f6b980f671cef85a1d1 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_ecafd5c328f53085c3ac+a02c3a36/wrapped_neff.hlo +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_ecafd5c328f53085c3ac+a02c3a36/wrapped_neff.hlo @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:3c0d6afa4411a36001c78d6ec60f60edf22477fc4fdaa73791c78e13d70c5b9f +oid sha256:c0f525a4deb9b89ea0e1a9dcea66d3a1ba404e2f0ad5a116d8e0aee492fedd2a size 3640300 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_ed0ddf13430a2a717168+24129607/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_ed0ddf13430a2a717168+24129607/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..836724f44545ce0dedda1521fd4c623a6ea8ec72 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_ed0ddf13430a2a717168+24129607/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_ed0ddf13430a2a717168+24129607/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_ed0ddf13430a2a717168+24129607/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_ed0ddf13430a2a717168+24129607/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_ed0ddf13430a2a717168+24129607/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..1dfd0b5bb9e04dfddd4038e38bea1d5e1ba9ff15 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_ed0ddf13430a2a717168+24129607/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4dc5733491df336fd3985f8d434d3e669f9e56be47cb3825dbf3a899f837de23 +size 66585 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_ed0ddf13430a2a717168+24129607/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_ed0ddf13430a2a717168+24129607/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..9f9465e16024a77bfd75213dca177fdb8975c0b8 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_ed0ddf13430a2a717168+24129607/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc556959b8b6ca168b0afbc4436724bfdff3471406930b26e3cfc0df55122495 +size 16897024 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_ee8ab158a9c272b70f44+a02c3a36/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_ee8ab158a9c272b70f44+a02c3a36/model.hlo_module.pb index e273fd0722ce8ffe0e967376ff2afbdcca6fda04..d40b921f650e4ca344d330f95f6380893d402d2c 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_ee8ab158a9c272b70f44+a02c3a36/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_ee8ab158a9c272b70f44+a02c3a36/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:2913e1dfc67fb201967593ca210cad72244a745757d1e7bc3aea7db3ea05712a +oid sha256:2d9150bc5aa42ad4c1035fe623592bcc639869b51cf86746a0c48faaebc5f464 size 388429 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_ee8ab158a9c272b70f44+a02c3a36/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_ee8ab158a9c272b70f44+a02c3a36/model.neff index 7eff559275e2672962b48b51eedb6a04889fab7b..03e794c3f8b60cfdec2a621d757acaacdce0ff23 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_ee8ab158a9c272b70f44+a02c3a36/model.neff +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_ee8ab158a9c272b70f44+a02c3a36/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:17d7716beb9c13eb7c1c78f894b95a728e7e5328786bca494183ffe9bac29087 +oid sha256:e82c64993b7dad469832d89ca02c23124828e74901a02e0b125550a097819e24 size 1936384 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_ee8ab158a9c272b70f44+a02c3a36/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_ee8ab158a9c272b70f44+a02c3a36/wrapped_neff.hlo index e384e93b0290a003cdc2c110e1a74f327ea3126d..18cd72b07567e1657d1d4dba3f58621774ac4443 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_ee8ab158a9c272b70f44+a02c3a36/wrapped_neff.hlo +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_ee8ab158a9c272b70f44+a02c3a36/wrapped_neff.hlo @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:e52f89184f2cfaf87162c3bfcb7b0f554b0030ad0c173ef1bb100950728fdb54 +oid sha256:ad121dd45a5e872e2414bedf511fdd50223631112354b949c9c4709cacb17645 size 2029297 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_f03f06a24a40a8dbe7e1+24129607/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_f03f06a24a40a8dbe7e1+24129607/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..836724f44545ce0dedda1521fd4c623a6ea8ec72 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_f03f06a24a40a8dbe7e1+24129607/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_f03f06a24a40a8dbe7e1+24129607/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_f03f06a24a40a8dbe7e1+24129607/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_f03f06a24a40a8dbe7e1+24129607/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_f03f06a24a40a8dbe7e1+24129607/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..779d6adad1e216cb8b1f10e339136e26a5a696a8 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_f03f06a24a40a8dbe7e1+24129607/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a5f7e7fb48516f7bede6624ee0b00b2dde29dc93d69a43c49418738ed77f7a2 +size 926239 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_f03f06a24a40a8dbe7e1+24129607/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_f03f06a24a40a8dbe7e1+24129607/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..9c33a06391256ad23e7bb5534b1742e9175d3399 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_f03f06a24a40a8dbe7e1+24129607/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d96120e3848fe6462a17a682fd74c0227d2b9a2a3e0769c25715d282b27e56d0 +size 6575104 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_f2ba194e95963ca457c2+a02c3a36/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_f2ba194e95963ca457c2+a02c3a36/model.hlo_module.pb index ecc3ca05e8ae0662f2cff8f22dbb020e8b85acef..0400d3c20a9e3a798cc48491d3a15bde52b38caa 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_f2ba194e95963ca457c2+a02c3a36/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_f2ba194e95963ca457c2+a02c3a36/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:66355f45b5a564dad737213b1575c3673e50af834b71a571c765842a1e0bf372 +oid sha256:05a4038a70da97389bf754168583601f7fd3c730fe4edc619ed6004e6c5b4c7c size 700208 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_f2ba194e95963ca457c2+a02c3a36/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_f2ba194e95963ca457c2+a02c3a36/model.neff index 3137c2911607162b3709df115c937401fdaeaaaa..13d42efe82d80a40308378e1015073e7bc3b90b4 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_f2ba194e95963ca457c2+a02c3a36/model.neff +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_f2ba194e95963ca457c2+a02c3a36/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:2dab91a2defcdf6da09de04cd1e7c2f29a26ff093603f3c8557bc90132d43616 +oid sha256:746fafd52eb90811cff39c5014a2c42a482e171dfbbefb934d746aea4b3e99d7 size 12411904 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_f2ba194e95963ca457c2+a02c3a36/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_f2ba194e95963ca457c2+a02c3a36/wrapped_neff.hlo index 6969511446904860e7649c42d766c4705a0c339c..1864b508bcc63f62492c972c3e150fa504cb80df 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_f2ba194e95963ca457c2+a02c3a36/wrapped_neff.hlo +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_f2ba194e95963ca457c2+a02c3a36/wrapped_neff.hlo @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:eb3127cde3d04cf5d9bc208ad0a3cc1b9e98493bbbdfd8ff1808bcd8a72e6858 +oid sha256:145ea9aeb136bfad8e0926a6aad9ede415dae6a4e80746db62c3c97a29eb1c1f size 12558920 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_f9c594cf85ceddc7f3ad+24129607/model.log b/neuronxcc-2.21.33363.0+82129205/MODULE_f9c594cf85ceddc7f3ad+24129607/model.log new file mode 100644 index 0000000000000000000000000000000000000000..b9d3a3d2494c9d43cbfdca14561828b3c33bcdf8 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_f9c594cf85ceddc7f3ad+24129607/model.log @@ -0,0 +1 @@ +Failed compilation with ['neuronx-cc', 'compile', '--framework=XLA', '/tmp/nxd_model/context_encoding/_tp0_bk0/model.MODULE_f9c594cf85ceddc7f3ad+24129607.hlo_module.pb', '--output', '/tmp/nxd_model/context_encoding/_tp0_bk0/model.MODULE_f9c594cf85ceddc7f3ad+24129607.neff', '--target=trn1', '--auto-cast=none', '--model-type=transformer', '--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ', '-O2', '--lnc=1', '--logfile=/tmp/nxd_model/context_encoding/_tp0_bk0/log-neuron-cc.txt', '--verbose=35']: \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_fcaa5220788f46dccc4f+a02c3a36/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_fcaa5220788f46dccc4f+a02c3a36/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..5726abc7d1d8c52fa95bc7919439a23a23fe3b9a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_fcaa5220788f46dccc4f+a02c3a36/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_fcaa5220788f46dccc4f+a02c3a36/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_fcaa5220788f46dccc4f+a02c3a36/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_fcaa5220788f46dccc4f+a02c3a36/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_fcaa5220788f46dccc4f+a02c3a36/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..f9aac85f572373187ed5932ede47f59a7a91323f --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_fcaa5220788f46dccc4f+a02c3a36/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0902b9467e36affd529236be99c466bb326eb59e56e6b6414b2bde17d7913ac8 +size 676474 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_fcaa5220788f46dccc4f+a02c3a36/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_fcaa5220788f46dccc4f+a02c3a36/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..ca2edeaff7a5a773737bb772667d191baf73e8b1 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_fcaa5220788f46dccc4f+a02c3a36/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a52f43c55d8c3cf96000b769db5b872074d525da0914de6733490c2db2b389d7 +size 543744 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_fcaa5220788f46dccc4f+a02c3a36/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_fcaa5220788f46dccc4f+a02c3a36/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..feb6b50c11b4c69e433bda628b73c5ad8fc4fab1 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_fcaa5220788f46dccc4f+a02c3a36/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a388ff10768fbb20c3c5dcc430ea96cc9974eeddebc8b8cd62a491f1328eab55 +size 563380 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_fd44e24d672157f0bc14+a02c3a36/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_fd44e24d672157f0bc14+a02c3a36/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..5726abc7d1d8c52fa95bc7919439a23a23fe3b9a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_fd44e24d672157f0bc14+a02c3a36/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_fd44e24d672157f0bc14+a02c3a36/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_fd44e24d672157f0bc14+a02c3a36/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_fd44e24d672157f0bc14+a02c3a36/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_fd44e24d672157f0bc14+a02c3a36/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..c81c30e219fd168ba5fdb3df5e4fede33a859ced --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_fd44e24d672157f0bc14+a02c3a36/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f4b1a20b9b5729a253582eeded6be8bd71404900097df80d61fa2eaca91aa9a +size 380126 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_fd44e24d672157f0bc14+a02c3a36/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_fd44e24d672157f0bc14+a02c3a36/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..91e6eb7390977bff5b84580f3e316b0a7f9e28ef --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_fd44e24d672157f0bc14+a02c3a36/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d181f557e36d91e6bcebdb4191a973b4a25c0f5b4ec1c9203c7d904bd567591 +size 2765824 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_fd44e24d672157f0bc14+a02c3a36/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_fd44e24d672157f0bc14+a02c3a36/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..3eb56d86ce9869f96d486099259afbc86cb21cbd --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_fd44e24d672157f0bc14+a02c3a36/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d519613c8b28426f8dbf8d72ce20a247514bab75a7f1106b5c77b385fbb173cb +size 2840167