program(1.0) [buildInfo = dict, tensor>({{"coremlc-component-MIL", "3510.2.1"}, {"coremlc-version", "3500.32.1"}})] { func main(tensor input_ids) { tensor wrapped_model_language_model_embed_tokens_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(64))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(335626368))), name = tensor("wrapped_model_language_model_embed_tokens_weight_palettized"), shape = tensor([262208, 2560])]; tensor wrapped_model_language_model_layers_0_self_attn_q_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(335626496))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(338248000))), name = tensor("wrapped_model_language_model_layers_0_self_attn_q_proj_weight_palettized"), shape = tensor([2048, 2560])]; tensor wrapped_model_language_model_layers_0_self_attn_k_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(338248128))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(339558912))), name = tensor("wrapped_model_language_model_layers_0_self_attn_k_proj_weight_palettized"), shape = tensor([1024, 2560])]; tensor wrapped_model_language_model_layers_0_self_attn_v_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(339559040))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(340869824))), name = tensor("wrapped_model_language_model_layers_0_self_attn_v_proj_weight_palettized"), shape = tensor([1024, 2560])]; tensor wrapped_model_language_model_layers_0_self_attn_o_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(340869952))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(343491456))), name = tensor("wrapped_model_language_model_layers_0_self_attn_o_proj_weight_palettized"), shape = tensor([2560, 2048])]; tensor wrapped_model_language_model_layers_0_mlp_gate_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(343491584))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(356598848))), name = tensor("wrapped_model_language_model_layers_0_mlp_gate_proj_weight_palettized"), shape = tensor([10240, 2560])]; tensor wrapped_model_language_model_layers_0_mlp_up_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(356598976))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(369706240))), name = tensor("wrapped_model_language_model_layers_0_mlp_up_proj_weight_palettized"), shape = tensor([10240, 2560])]; tensor wrapped_model_language_model_layers_0_mlp_down_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(369706368))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(382813632))), name = tensor("wrapped_model_language_model_layers_0_mlp_down_proj_weight_palettized"), shape = tensor([2560, 10240])]; tensor wrapped_model_language_model_layers_1_self_attn_q_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(382813760))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(385435264))), name = tensor("wrapped_model_language_model_layers_1_self_attn_q_proj_weight_palettized"), shape = tensor([2048, 2560])]; tensor wrapped_model_language_model_layers_1_self_attn_k_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(385435392))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(386746176))), name = tensor("wrapped_model_language_model_layers_1_self_attn_k_proj_weight_palettized"), shape = tensor([1024, 2560])]; tensor wrapped_model_language_model_layers_1_self_attn_v_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(386746304))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(388057088))), name = tensor("wrapped_model_language_model_layers_1_self_attn_v_proj_weight_palettized"), shape = tensor([1024, 2560])]; tensor wrapped_model_language_model_layers_1_self_attn_o_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(388057216))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(390678720))), name = tensor("wrapped_model_language_model_layers_1_self_attn_o_proj_weight_palettized"), shape = tensor([2560, 2048])]; tensor wrapped_model_language_model_layers_1_mlp_gate_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(390678848))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(403786112))), name = tensor("wrapped_model_language_model_layers_1_mlp_gate_proj_weight_palettized"), shape = tensor([10240, 2560])]; tensor wrapped_model_language_model_layers_1_mlp_up_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(403786240))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(416893504))), name = tensor("wrapped_model_language_model_layers_1_mlp_up_proj_weight_palettized"), shape = tensor([10240, 2560])]; tensor wrapped_model_language_model_layers_1_mlp_down_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(416893632))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(430000896))), name = tensor("wrapped_model_language_model_layers_1_mlp_down_proj_weight_palettized"), shape = tensor([2560, 10240])]; tensor wrapped_model_language_model_layers_2_self_attn_q_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(430001024))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(432622528))), name = tensor("wrapped_model_language_model_layers_2_self_attn_q_proj_weight_palettized"), shape = tensor([2048, 2560])]; tensor wrapped_model_language_model_layers_2_self_attn_k_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(432622656))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(433933440))), name = tensor("wrapped_model_language_model_layers_2_self_attn_k_proj_weight_palettized"), shape = tensor([1024, 2560])]; tensor wrapped_model_language_model_layers_2_self_attn_v_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(433933568))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(435244352))), name = tensor("wrapped_model_language_model_layers_2_self_attn_v_proj_weight_palettized"), shape = tensor([1024, 2560])]; tensor wrapped_model_language_model_layers_2_self_attn_o_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(435244480))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(437865984))), name = tensor("wrapped_model_language_model_layers_2_self_attn_o_proj_weight_palettized"), shape = tensor([2560, 2048])]; tensor wrapped_model_language_model_layers_2_mlp_gate_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(437866112))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(450973376))), name = tensor("wrapped_model_language_model_layers_2_mlp_gate_proj_weight_palettized"), shape = tensor([10240, 2560])]; tensor wrapped_model_language_model_layers_2_mlp_up_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(450973504))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(464080768))), name = tensor("wrapped_model_language_model_layers_2_mlp_up_proj_weight_palettized"), shape = tensor([10240, 2560])]; tensor wrapped_model_language_model_layers_2_mlp_down_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(464080896))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(477188160))), name = tensor("wrapped_model_language_model_layers_2_mlp_down_proj_weight_palettized"), shape = tensor([2560, 10240])]; tensor wrapped_model_language_model_layers_3_self_attn_q_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(477188288))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(479809792))), name = tensor("wrapped_model_language_model_layers_3_self_attn_q_proj_weight_palettized"), shape = tensor([2048, 2560])]; tensor wrapped_model_language_model_layers_3_self_attn_k_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(479809920))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(481120704))), name = tensor("wrapped_model_language_model_layers_3_self_attn_k_proj_weight_palettized"), shape = tensor([1024, 2560])]; tensor wrapped_model_language_model_layers_3_self_attn_v_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(481120832))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(482431616))), name = tensor("wrapped_model_language_model_layers_3_self_attn_v_proj_weight_palettized"), shape = tensor([1024, 2560])]; tensor wrapped_model_language_model_layers_3_self_attn_o_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(482431744))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(485053248))), name = tensor("wrapped_model_language_model_layers_3_self_attn_o_proj_weight_palettized"), shape = tensor([2560, 2048])]; tensor wrapped_model_language_model_layers_3_mlp_gate_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(485053376))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(498160640))), name = tensor("wrapped_model_language_model_layers_3_mlp_gate_proj_weight_palettized"), shape = tensor([10240, 2560])]; tensor wrapped_model_language_model_layers_3_mlp_up_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(498160768))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(511268032))), name = tensor("wrapped_model_language_model_layers_3_mlp_up_proj_weight_palettized"), shape = tensor([10240, 2560])]; tensor wrapped_model_language_model_layers_3_mlp_down_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(511268160))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(524375424))), name = tensor("wrapped_model_language_model_layers_3_mlp_down_proj_weight_palettized"), shape = tensor([2560, 10240])]; tensor wrapped_model_language_model_layers_4_self_attn_q_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(524375552))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(526997056))), name = tensor("wrapped_model_language_model_layers_4_self_attn_q_proj_weight_palettized"), shape = tensor([2048, 2560])]; tensor wrapped_model_language_model_layers_4_self_attn_k_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(526997184))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(528307968))), name = tensor("wrapped_model_language_model_layers_4_self_attn_k_proj_weight_palettized"), shape = tensor([1024, 2560])]; tensor wrapped_model_language_model_layers_4_self_attn_v_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(528308096))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(529618880))), name = tensor("wrapped_model_language_model_layers_4_self_attn_v_proj_weight_palettized"), shape = tensor([1024, 2560])]; tensor wrapped_model_language_model_layers_4_self_attn_o_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(529619008))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(532240512))), name = tensor("wrapped_model_language_model_layers_4_self_attn_o_proj_weight_palettized"), shape = tensor([2560, 2048])]; tensor wrapped_model_language_model_layers_4_mlp_gate_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(532240640))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(545347904))), name = tensor("wrapped_model_language_model_layers_4_mlp_gate_proj_weight_palettized"), shape = tensor([10240, 2560])]; tensor wrapped_model_language_model_layers_4_mlp_up_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(545348032))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(558455296))), name = tensor("wrapped_model_language_model_layers_4_mlp_up_proj_weight_palettized"), shape = tensor([10240, 2560])]; tensor wrapped_model_language_model_layers_4_mlp_down_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(558455424))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(571562688))), name = tensor("wrapped_model_language_model_layers_4_mlp_down_proj_weight_palettized"), shape = tensor([2560, 10240])]; tensor wrapped_model_language_model_layers_5_self_attn_q_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(571562816))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(574184320))), name = tensor("wrapped_model_language_model_layers_5_self_attn_q_proj_weight_palettized"), shape = tensor([2048, 2560])]; tensor wrapped_model_language_model_layers_5_self_attn_k_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(574184448))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(575495232))), name = tensor("wrapped_model_language_model_layers_5_self_attn_k_proj_weight_palettized"), shape = tensor([1024, 2560])]; tensor wrapped_model_language_model_layers_5_self_attn_v_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(575495360))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(576806144))), name = tensor("wrapped_model_language_model_layers_5_self_attn_v_proj_weight_palettized"), shape = tensor([1024, 2560])]; tensor wrapped_model_language_model_layers_5_self_attn_o_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(576806272))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(579427776))), name = tensor("wrapped_model_language_model_layers_5_self_attn_o_proj_weight_palettized"), shape = tensor([2560, 2048])]; tensor wrapped_model_language_model_layers_5_mlp_gate_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(579427904))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(592535168))), name = tensor("wrapped_model_language_model_layers_5_mlp_gate_proj_weight_palettized"), shape = tensor([10240, 2560])]; tensor wrapped_model_language_model_layers_5_mlp_up_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(592535296))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(605642560))), name = tensor("wrapped_model_language_model_layers_5_mlp_up_proj_weight_palettized"), shape = tensor([10240, 2560])]; tensor wrapped_model_language_model_layers_5_mlp_down_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(605642688))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(618749952))), name = tensor("wrapped_model_language_model_layers_5_mlp_down_proj_weight_palettized"), shape = tensor([2560, 10240])]; tensor wrapped_model_language_model_layers_6_self_attn_q_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(618750080))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(621371584))), name = tensor("wrapped_model_language_model_layers_6_self_attn_q_proj_weight_palettized"), shape = tensor([2048, 2560])]; tensor wrapped_model_language_model_layers_6_self_attn_k_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(621371712))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(622682496))), name = tensor("wrapped_model_language_model_layers_6_self_attn_k_proj_weight_palettized"), shape = tensor([1024, 2560])]; tensor wrapped_model_language_model_layers_6_self_attn_v_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(622682624))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(623993408))), name = tensor("wrapped_model_language_model_layers_6_self_attn_v_proj_weight_palettized"), shape = tensor([1024, 2560])]; tensor wrapped_model_language_model_layers_6_self_attn_o_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(623993536))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(626615040))), name = tensor("wrapped_model_language_model_layers_6_self_attn_o_proj_weight_palettized"), shape = tensor([2560, 2048])]; tensor wrapped_model_language_model_layers_6_mlp_gate_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(626615168))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(639722432))), name = tensor("wrapped_model_language_model_layers_6_mlp_gate_proj_weight_palettized"), shape = tensor([10240, 2560])]; tensor wrapped_model_language_model_layers_6_mlp_up_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(639722560))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(652829824))), name = tensor("wrapped_model_language_model_layers_6_mlp_up_proj_weight_palettized"), shape = tensor([10240, 2560])]; tensor wrapped_model_language_model_layers_6_mlp_down_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(652829952))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(665937216))), name = tensor("wrapped_model_language_model_layers_6_mlp_down_proj_weight_palettized"), shape = tensor([2560, 10240])]; tensor wrapped_model_language_model_layers_7_self_attn_q_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(665937344))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(668558848))), name = tensor("wrapped_model_language_model_layers_7_self_attn_q_proj_weight_palettized"), shape = tensor([2048, 2560])]; tensor wrapped_model_language_model_layers_7_self_attn_k_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(668558976))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(669869760))), name = tensor("wrapped_model_language_model_layers_7_self_attn_k_proj_weight_palettized"), shape = tensor([1024, 2560])]; tensor wrapped_model_language_model_layers_7_self_attn_v_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(669869888))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(671180672))), name = tensor("wrapped_model_language_model_layers_7_self_attn_v_proj_weight_palettized"), shape = tensor([1024, 2560])]; tensor wrapped_model_language_model_layers_7_self_attn_o_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(671180800))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(673802304))), name = tensor("wrapped_model_language_model_layers_7_self_attn_o_proj_weight_palettized"), shape = tensor([2560, 2048])]; tensor wrapped_model_language_model_layers_7_mlp_gate_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(673802432))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(686909696))), name = tensor("wrapped_model_language_model_layers_7_mlp_gate_proj_weight_palettized"), shape = tensor([10240, 2560])]; tensor wrapped_model_language_model_layers_7_mlp_up_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(686909824))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(700017088))), name = tensor("wrapped_model_language_model_layers_7_mlp_up_proj_weight_palettized"), shape = tensor([10240, 2560])]; tensor wrapped_model_language_model_layers_7_mlp_down_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(700017216))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(713124480))), name = tensor("wrapped_model_language_model_layers_7_mlp_down_proj_weight_palettized"), shape = tensor([2560, 10240])]; tensor wrapped_model_language_model_layers_8_self_attn_q_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(713124608))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(715746112))), name = tensor("wrapped_model_language_model_layers_8_self_attn_q_proj_weight_palettized"), shape = tensor([2048, 2560])]; tensor wrapped_model_language_model_layers_8_self_attn_k_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(715746240))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(717057024))), name = tensor("wrapped_model_language_model_layers_8_self_attn_k_proj_weight_palettized"), shape = tensor([1024, 2560])]; tensor wrapped_model_language_model_layers_8_self_attn_v_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(717057152))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(718367936))), name = tensor("wrapped_model_language_model_layers_8_self_attn_v_proj_weight_palettized"), shape = tensor([1024, 2560])]; tensor wrapped_model_language_model_layers_8_self_attn_o_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(718368064))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(720989568))), name = tensor("wrapped_model_language_model_layers_8_self_attn_o_proj_weight_palettized"), shape = tensor([2560, 2048])]; tensor wrapped_model_language_model_layers_8_mlp_gate_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(720989696))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(734096960))), name = tensor("wrapped_model_language_model_layers_8_mlp_gate_proj_weight_palettized"), shape = tensor([10240, 2560])]; tensor wrapped_model_language_model_layers_8_mlp_up_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(734097088))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(747204352))), name = tensor("wrapped_model_language_model_layers_8_mlp_up_proj_weight_palettized"), shape = tensor([10240, 2560])]; tensor wrapped_model_language_model_layers_8_mlp_down_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(747204480))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(760311744))), name = tensor("wrapped_model_language_model_layers_8_mlp_down_proj_weight_palettized"), shape = tensor([2560, 10240])]; tensor wrapped_model_language_model_layers_9_self_attn_q_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(760311872))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(762933376))), name = tensor("wrapped_model_language_model_layers_9_self_attn_q_proj_weight_palettized"), shape = tensor([2048, 2560])]; tensor wrapped_model_language_model_layers_9_self_attn_k_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(762933504))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(764244288))), name = tensor("wrapped_model_language_model_layers_9_self_attn_k_proj_weight_palettized"), shape = tensor([1024, 2560])]; tensor wrapped_model_language_model_layers_9_self_attn_v_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(764244416))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(765555200))), name = tensor("wrapped_model_language_model_layers_9_self_attn_v_proj_weight_palettized"), shape = tensor([1024, 2560])]; tensor wrapped_model_language_model_layers_9_self_attn_o_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(765555328))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(768176832))), name = tensor("wrapped_model_language_model_layers_9_self_attn_o_proj_weight_palettized"), shape = tensor([2560, 2048])]; tensor wrapped_model_language_model_layers_9_mlp_gate_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(768176960))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(781284224))), name = tensor("wrapped_model_language_model_layers_9_mlp_gate_proj_weight_palettized"), shape = tensor([10240, 2560])]; tensor wrapped_model_language_model_layers_9_mlp_up_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(781284352))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(794391616))), name = tensor("wrapped_model_language_model_layers_9_mlp_up_proj_weight_palettized"), shape = tensor([10240, 2560])]; tensor wrapped_model_language_model_layers_9_mlp_down_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(794391744))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(807499008))), name = tensor("wrapped_model_language_model_layers_9_mlp_down_proj_weight_palettized"), shape = tensor([2560, 10240])]; tensor wrapped_model_language_model_layers_10_self_attn_q_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(807499136))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(810120640))), name = tensor("wrapped_model_language_model_layers_10_self_attn_q_proj_weight_palettized"), shape = tensor([2048, 2560])]; tensor wrapped_model_language_model_layers_10_self_attn_k_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(810120768))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(811431552))), name = tensor("wrapped_model_language_model_layers_10_self_attn_k_proj_weight_palettized"), shape = tensor([1024, 2560])]; tensor wrapped_model_language_model_layers_10_self_attn_v_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(811431680))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(812742464))), name = tensor("wrapped_model_language_model_layers_10_self_attn_v_proj_weight_palettized"), shape = tensor([1024, 2560])]; tensor wrapped_model_language_model_layers_10_self_attn_o_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(812742592))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(815364096))), name = tensor("wrapped_model_language_model_layers_10_self_attn_o_proj_weight_palettized"), shape = tensor([2560, 2048])]; tensor wrapped_model_language_model_layers_10_mlp_gate_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(815364224))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(828471488))), name = tensor("wrapped_model_language_model_layers_10_mlp_gate_proj_weight_palettized"), shape = tensor([10240, 2560])]; tensor wrapped_model_language_model_layers_10_mlp_up_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(828471616))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(841578880))), name = tensor("wrapped_model_language_model_layers_10_mlp_up_proj_weight_palettized"), shape = tensor([10240, 2560])]; tensor wrapped_model_language_model_layers_10_mlp_down_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(841579008))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(854686272))), name = tensor("wrapped_model_language_model_layers_10_mlp_down_proj_weight_palettized"), shape = tensor([2560, 10240])]; tensor wrapped_model_language_model_layers_11_self_attn_q_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(854686400))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(857307904))), name = tensor("wrapped_model_language_model_layers_11_self_attn_q_proj_weight_palettized"), shape = tensor([2048, 2560])]; tensor wrapped_model_language_model_layers_11_self_attn_k_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(857308032))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(858618816))), name = tensor("wrapped_model_language_model_layers_11_self_attn_k_proj_weight_palettized"), shape = tensor([1024, 2560])]; tensor wrapped_model_language_model_layers_11_self_attn_v_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(858618944))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(859929728))), name = tensor("wrapped_model_language_model_layers_11_self_attn_v_proj_weight_palettized"), shape = tensor([1024, 2560])]; tensor wrapped_model_language_model_layers_11_self_attn_o_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(859929856))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(862551360))), name = tensor("wrapped_model_language_model_layers_11_self_attn_o_proj_weight_palettized"), shape = tensor([2560, 2048])]; tensor wrapped_model_language_model_layers_11_mlp_gate_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(862551488))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(875658752))), name = tensor("wrapped_model_language_model_layers_11_mlp_gate_proj_weight_palettized"), shape = tensor([10240, 2560])]; tensor wrapped_model_language_model_layers_11_mlp_up_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(875658880))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(888766144))), name = tensor("wrapped_model_language_model_layers_11_mlp_up_proj_weight_palettized"), shape = tensor([10240, 2560])]; tensor wrapped_model_language_model_layers_11_mlp_down_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(888766272))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(901873536))), name = tensor("wrapped_model_language_model_layers_11_mlp_down_proj_weight_palettized"), shape = tensor([2560, 10240])]; tensor wrapped_model_language_model_layers_12_self_attn_q_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(901873664))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(904495168))), name = tensor("wrapped_model_language_model_layers_12_self_attn_q_proj_weight_palettized"), shape = tensor([2048, 2560])]; tensor wrapped_model_language_model_layers_12_self_attn_k_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(904495296))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(905806080))), name = tensor("wrapped_model_language_model_layers_12_self_attn_k_proj_weight_palettized"), shape = tensor([1024, 2560])]; tensor wrapped_model_language_model_layers_12_self_attn_v_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(905806208))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(907116992))), name = tensor("wrapped_model_language_model_layers_12_self_attn_v_proj_weight_palettized"), shape = tensor([1024, 2560])]; tensor wrapped_model_language_model_layers_12_self_attn_o_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(907117120))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(909738624))), name = tensor("wrapped_model_language_model_layers_12_self_attn_o_proj_weight_palettized"), shape = tensor([2560, 2048])]; tensor wrapped_model_language_model_layers_12_mlp_gate_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(909738752))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(922846016))), name = tensor("wrapped_model_language_model_layers_12_mlp_gate_proj_weight_palettized"), shape = tensor([10240, 2560])]; tensor wrapped_model_language_model_layers_12_mlp_up_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(922846144))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(935953408))), name = tensor("wrapped_model_language_model_layers_12_mlp_up_proj_weight_palettized"), shape = tensor([10240, 2560])]; tensor wrapped_model_language_model_layers_12_mlp_down_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(935953536))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(949060800))), name = tensor("wrapped_model_language_model_layers_12_mlp_down_proj_weight_palettized"), shape = tensor([2560, 10240])]; tensor wrapped_model_language_model_layers_13_self_attn_q_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(949060928))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(951682432))), name = tensor("wrapped_model_language_model_layers_13_self_attn_q_proj_weight_palettized"), shape = tensor([2048, 2560])]; tensor wrapped_model_language_model_layers_13_self_attn_k_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(951682560))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(952993344))), name = tensor("wrapped_model_language_model_layers_13_self_attn_k_proj_weight_palettized"), shape = tensor([1024, 2560])]; tensor wrapped_model_language_model_layers_13_self_attn_v_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(952993472))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(954304256))), name = tensor("wrapped_model_language_model_layers_13_self_attn_v_proj_weight_palettized"), shape = tensor([1024, 2560])]; tensor wrapped_model_language_model_layers_13_self_attn_o_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(954304384))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(956925888))), name = tensor("wrapped_model_language_model_layers_13_self_attn_o_proj_weight_palettized"), shape = tensor([2560, 2048])]; tensor wrapped_model_language_model_layers_13_mlp_gate_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(956926016))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(970033280))), name = tensor("wrapped_model_language_model_layers_13_mlp_gate_proj_weight_palettized"), shape = tensor([10240, 2560])]; tensor wrapped_model_language_model_layers_13_mlp_up_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(970033408))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(983140672))), name = tensor("wrapped_model_language_model_layers_13_mlp_up_proj_weight_palettized"), shape = tensor([10240, 2560])]; tensor wrapped_model_language_model_layers_13_mlp_down_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(983140800))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(996248064))), name = tensor("wrapped_model_language_model_layers_13_mlp_down_proj_weight_palettized"), shape = tensor([2560, 10240])]; tensor wrapped_model_language_model_layers_14_self_attn_q_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(996248192))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(998869696))), name = tensor("wrapped_model_language_model_layers_14_self_attn_q_proj_weight_palettized"), shape = tensor([2048, 2560])]; tensor wrapped_model_language_model_layers_14_self_attn_k_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(998869824))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1000180608))), name = tensor("wrapped_model_language_model_layers_14_self_attn_k_proj_weight_palettized"), shape = tensor([1024, 2560])]; tensor wrapped_model_language_model_layers_14_self_attn_v_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1000180736))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1001491520))), name = tensor("wrapped_model_language_model_layers_14_self_attn_v_proj_weight_palettized"), shape = tensor([1024, 2560])]; tensor wrapped_model_language_model_layers_14_self_attn_o_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1001491648))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1004113152))), name = tensor("wrapped_model_language_model_layers_14_self_attn_o_proj_weight_palettized"), shape = tensor([2560, 2048])]; tensor wrapped_model_language_model_layers_14_mlp_gate_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1004113280))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1017220544))), name = tensor("wrapped_model_language_model_layers_14_mlp_gate_proj_weight_palettized"), shape = tensor([10240, 2560])]; tensor wrapped_model_language_model_layers_14_mlp_up_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1017220672))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1030327936))), name = tensor("wrapped_model_language_model_layers_14_mlp_up_proj_weight_palettized"), shape = tensor([10240, 2560])]; tensor wrapped_model_language_model_layers_14_mlp_down_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1030328064))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1043435328))), name = tensor("wrapped_model_language_model_layers_14_mlp_down_proj_weight_palettized"), shape = tensor([2560, 10240])]; tensor wrapped_model_language_model_layers_15_self_attn_q_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1043435456))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1046056960))), name = tensor("wrapped_model_language_model_layers_15_self_attn_q_proj_weight_palettized"), shape = tensor([2048, 2560])]; tensor wrapped_model_language_model_layers_15_self_attn_k_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1046057088))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1047367872))), name = tensor("wrapped_model_language_model_layers_15_self_attn_k_proj_weight_palettized"), shape = tensor([1024, 2560])]; tensor wrapped_model_language_model_layers_15_self_attn_v_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1047368000))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1048678784))), name = tensor("wrapped_model_language_model_layers_15_self_attn_v_proj_weight_palettized"), shape = tensor([1024, 2560])]; tensor wrapped_model_language_model_layers_15_self_attn_o_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1048678912))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1051300416))), name = tensor("wrapped_model_language_model_layers_15_self_attn_o_proj_weight_palettized"), shape = tensor([2560, 2048])]; tensor wrapped_model_language_model_layers_15_mlp_gate_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1051300544))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1064407808))), name = tensor("wrapped_model_language_model_layers_15_mlp_gate_proj_weight_palettized"), shape = tensor([10240, 2560])]; tensor wrapped_model_language_model_layers_15_mlp_up_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1064407936))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1077515200))), name = tensor("wrapped_model_language_model_layers_15_mlp_up_proj_weight_palettized"), shape = tensor([10240, 2560])]; tensor wrapped_model_language_model_layers_15_mlp_down_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1077515328))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1090622592))), name = tensor("wrapped_model_language_model_layers_15_mlp_down_proj_weight_palettized"), shape = tensor([2560, 10240])]; tensor wrapped_model_language_model_layers_16_self_attn_q_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1090622720))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1093244224))), name = tensor("wrapped_model_language_model_layers_16_self_attn_q_proj_weight_palettized"), shape = tensor([2048, 2560])]; tensor wrapped_model_language_model_layers_16_self_attn_k_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1093244352))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1094555136))), name = tensor("wrapped_model_language_model_layers_16_self_attn_k_proj_weight_palettized"), shape = tensor([1024, 2560])]; tensor wrapped_model_language_model_layers_16_self_attn_v_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1094555264))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1095866048))), name = tensor("wrapped_model_language_model_layers_16_self_attn_v_proj_weight_palettized"), shape = tensor([1024, 2560])]; tensor wrapped_model_language_model_layers_16_self_attn_o_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1095866176))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1098487680))), name = tensor("wrapped_model_language_model_layers_16_self_attn_o_proj_weight_palettized"), shape = tensor([2560, 2048])]; tensor wrapped_model_language_model_layers_16_mlp_gate_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1098487808))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1111595072))), name = tensor("wrapped_model_language_model_layers_16_mlp_gate_proj_weight_palettized"), shape = tensor([10240, 2560])]; tensor wrapped_model_language_model_layers_16_mlp_up_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1111595200))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1124702464))), name = tensor("wrapped_model_language_model_layers_16_mlp_up_proj_weight_palettized"), shape = tensor([10240, 2560])]; tensor wrapped_model_language_model_layers_16_mlp_down_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1124702592))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1137809856))), name = tensor("wrapped_model_language_model_layers_16_mlp_down_proj_weight_palettized"), shape = tensor([2560, 10240])]; tensor wrapped_model_language_model_layers_17_self_attn_q_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1137809984))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1140431488))), name = tensor("wrapped_model_language_model_layers_17_self_attn_q_proj_weight_palettized"), shape = tensor([2048, 2560])]; tensor wrapped_model_language_model_layers_17_self_attn_k_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1140431616))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1141742400))), name = tensor("wrapped_model_language_model_layers_17_self_attn_k_proj_weight_palettized"), shape = tensor([1024, 2560])]; tensor wrapped_model_language_model_layers_17_self_attn_v_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1141742528))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1143053312))), name = tensor("wrapped_model_language_model_layers_17_self_attn_v_proj_weight_palettized"), shape = tensor([1024, 2560])]; tensor wrapped_model_language_model_layers_17_self_attn_o_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1143053440))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1145674944))), name = tensor("wrapped_model_language_model_layers_17_self_attn_o_proj_weight_palettized"), shape = tensor([2560, 2048])]; tensor wrapped_model_language_model_layers_17_mlp_gate_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1145675072))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1158782336))), name = tensor("wrapped_model_language_model_layers_17_mlp_gate_proj_weight_palettized"), shape = tensor([10240, 2560])]; tensor wrapped_model_language_model_layers_17_mlp_up_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1158782464))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1171889728))), name = tensor("wrapped_model_language_model_layers_17_mlp_up_proj_weight_palettized"), shape = tensor([10240, 2560])]; tensor wrapped_model_language_model_layers_17_mlp_down_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1171889856))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1184997120))), name = tensor("wrapped_model_language_model_layers_17_mlp_down_proj_weight_palettized"), shape = tensor([2560, 10240])]; tensor wrapped_model_language_model_layers_18_self_attn_q_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1184997248))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1187618752))), name = tensor("wrapped_model_language_model_layers_18_self_attn_q_proj_weight_palettized"), shape = tensor([2048, 2560])]; tensor wrapped_model_language_model_layers_18_self_attn_k_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1187618880))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1188929664))), name = tensor("wrapped_model_language_model_layers_18_self_attn_k_proj_weight_palettized"), shape = tensor([1024, 2560])]; tensor wrapped_model_language_model_layers_18_self_attn_v_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1188929792))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1190240576))), name = tensor("wrapped_model_language_model_layers_18_self_attn_v_proj_weight_palettized"), shape = tensor([1024, 2560])]; tensor wrapped_model_language_model_layers_18_self_attn_o_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1190240704))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1192862208))), name = tensor("wrapped_model_language_model_layers_18_self_attn_o_proj_weight_palettized"), shape = tensor([2560, 2048])]; tensor wrapped_model_language_model_layers_18_mlp_gate_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1192862336))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1205969600))), name = tensor("wrapped_model_language_model_layers_18_mlp_gate_proj_weight_palettized"), shape = tensor([10240, 2560])]; tensor wrapped_model_language_model_layers_18_mlp_up_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1205969728))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1219076992))), name = tensor("wrapped_model_language_model_layers_18_mlp_up_proj_weight_palettized"), shape = tensor([10240, 2560])]; tensor wrapped_model_language_model_layers_18_mlp_down_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1219077120))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1232184384))), name = tensor("wrapped_model_language_model_layers_18_mlp_down_proj_weight_palettized"), shape = tensor([2560, 10240])]; tensor wrapped_model_language_model_layers_19_self_attn_q_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1232184512))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1234806016))), name = tensor("wrapped_model_language_model_layers_19_self_attn_q_proj_weight_palettized"), shape = tensor([2048, 2560])]; tensor wrapped_model_language_model_layers_19_self_attn_k_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1234806144))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1236116928))), name = tensor("wrapped_model_language_model_layers_19_self_attn_k_proj_weight_palettized"), shape = tensor([1024, 2560])]; tensor wrapped_model_language_model_layers_19_self_attn_v_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1236117056))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1237427840))), name = tensor("wrapped_model_language_model_layers_19_self_attn_v_proj_weight_palettized"), shape = tensor([1024, 2560])]; tensor wrapped_model_language_model_layers_19_self_attn_o_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1237427968))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1240049472))), name = tensor("wrapped_model_language_model_layers_19_self_attn_o_proj_weight_palettized"), shape = tensor([2560, 2048])]; tensor wrapped_model_language_model_layers_19_mlp_gate_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1240049600))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1253156864))), name = tensor("wrapped_model_language_model_layers_19_mlp_gate_proj_weight_palettized"), shape = tensor([10240, 2560])]; tensor wrapped_model_language_model_layers_19_mlp_up_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1253156992))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1266264256))), name = tensor("wrapped_model_language_model_layers_19_mlp_up_proj_weight_palettized"), shape = tensor([10240, 2560])]; tensor wrapped_model_language_model_layers_19_mlp_down_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1266264384))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1279371648))), name = tensor("wrapped_model_language_model_layers_19_mlp_down_proj_weight_palettized"), shape = tensor([2560, 10240])]; tensor wrapped_model_language_model_layers_20_self_attn_q_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1279371776))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1281993280))), name = tensor("wrapped_model_language_model_layers_20_self_attn_q_proj_weight_palettized"), shape = tensor([2048, 2560])]; tensor wrapped_model_language_model_layers_20_self_attn_k_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1281993408))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1283304192))), name = tensor("wrapped_model_language_model_layers_20_self_attn_k_proj_weight_palettized"), shape = tensor([1024, 2560])]; tensor wrapped_model_language_model_layers_20_self_attn_v_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1283304320))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1284615104))), name = tensor("wrapped_model_language_model_layers_20_self_attn_v_proj_weight_palettized"), shape = tensor([1024, 2560])]; tensor wrapped_model_language_model_layers_20_self_attn_o_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1284615232))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1287236736))), name = tensor("wrapped_model_language_model_layers_20_self_attn_o_proj_weight_palettized"), shape = tensor([2560, 2048])]; tensor wrapped_model_language_model_layers_20_mlp_gate_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1287236864))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1300344128))), name = tensor("wrapped_model_language_model_layers_20_mlp_gate_proj_weight_palettized"), shape = tensor([10240, 2560])]; tensor wrapped_model_language_model_layers_20_mlp_up_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1300344256))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1313451520))), name = tensor("wrapped_model_language_model_layers_20_mlp_up_proj_weight_palettized"), shape = tensor([10240, 2560])]; tensor wrapped_model_language_model_layers_20_mlp_down_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1313451648))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1326558912))), name = tensor("wrapped_model_language_model_layers_20_mlp_down_proj_weight_palettized"), shape = tensor([2560, 10240])]; tensor wrapped_model_language_model_layers_21_self_attn_q_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1326559040))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1329180544))), name = tensor("wrapped_model_language_model_layers_21_self_attn_q_proj_weight_palettized"), shape = tensor([2048, 2560])]; tensor wrapped_model_language_model_layers_21_self_attn_k_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1329180672))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1330491456))), name = tensor("wrapped_model_language_model_layers_21_self_attn_k_proj_weight_palettized"), shape = tensor([1024, 2560])]; tensor wrapped_model_language_model_layers_21_self_attn_v_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1330491584))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1331802368))), name = tensor("wrapped_model_language_model_layers_21_self_attn_v_proj_weight_palettized"), shape = tensor([1024, 2560])]; tensor wrapped_model_language_model_layers_21_self_attn_o_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1331802496))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1334424000))), name = tensor("wrapped_model_language_model_layers_21_self_attn_o_proj_weight_palettized"), shape = tensor([2560, 2048])]; tensor wrapped_model_language_model_layers_21_mlp_gate_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1334424128))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1347531392))), name = tensor("wrapped_model_language_model_layers_21_mlp_gate_proj_weight_palettized"), shape = tensor([10240, 2560])]; tensor wrapped_model_language_model_layers_21_mlp_up_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1347531520))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1360638784))), name = tensor("wrapped_model_language_model_layers_21_mlp_up_proj_weight_palettized"), shape = tensor([10240, 2560])]; tensor wrapped_model_language_model_layers_21_mlp_down_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1360638912))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1373746176))), name = tensor("wrapped_model_language_model_layers_21_mlp_down_proj_weight_palettized"), shape = tensor([2560, 10240])]; tensor wrapped_model_language_model_layers_22_self_attn_q_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1373746304))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1376367808))), name = tensor("wrapped_model_language_model_layers_22_self_attn_q_proj_weight_palettized"), shape = tensor([2048, 2560])]; tensor wrapped_model_language_model_layers_22_self_attn_k_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1376367936))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1377678720))), name = tensor("wrapped_model_language_model_layers_22_self_attn_k_proj_weight_palettized"), shape = tensor([1024, 2560])]; tensor wrapped_model_language_model_layers_22_self_attn_v_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1377678848))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1378989632))), name = tensor("wrapped_model_language_model_layers_22_self_attn_v_proj_weight_palettized"), shape = tensor([1024, 2560])]; tensor wrapped_model_language_model_layers_22_self_attn_o_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1378989760))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1381611264))), name = tensor("wrapped_model_language_model_layers_22_self_attn_o_proj_weight_palettized"), shape = tensor([2560, 2048])]; tensor wrapped_model_language_model_layers_22_mlp_gate_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1381611392))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1394718656))), name = tensor("wrapped_model_language_model_layers_22_mlp_gate_proj_weight_palettized"), shape = tensor([10240, 2560])]; tensor wrapped_model_language_model_layers_22_mlp_up_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1394718784))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1407826048))), name = tensor("wrapped_model_language_model_layers_22_mlp_up_proj_weight_palettized"), shape = tensor([10240, 2560])]; tensor wrapped_model_language_model_layers_22_mlp_down_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1407826176))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1420933440))), name = tensor("wrapped_model_language_model_layers_22_mlp_down_proj_weight_palettized"), shape = tensor([2560, 10240])]; tensor wrapped_model_language_model_layers_23_self_attn_q_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1420933568))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1423555072))), name = tensor("wrapped_model_language_model_layers_23_self_attn_q_proj_weight_palettized"), shape = tensor([2048, 2560])]; tensor wrapped_model_language_model_layers_23_self_attn_k_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1423555200))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1424865984))), name = tensor("wrapped_model_language_model_layers_23_self_attn_k_proj_weight_palettized"), shape = tensor([1024, 2560])]; tensor wrapped_model_language_model_layers_23_self_attn_v_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1424866112))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1426176896))), name = tensor("wrapped_model_language_model_layers_23_self_attn_v_proj_weight_palettized"), shape = tensor([1024, 2560])]; tensor wrapped_model_language_model_layers_23_self_attn_o_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1426177024))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1428798528))), name = tensor("wrapped_model_language_model_layers_23_self_attn_o_proj_weight_palettized"), shape = tensor([2560, 2048])]; tensor wrapped_model_language_model_layers_23_mlp_gate_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1428798656))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1441905920))), name = tensor("wrapped_model_language_model_layers_23_mlp_gate_proj_weight_palettized"), shape = tensor([10240, 2560])]; tensor wrapped_model_language_model_layers_23_mlp_up_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1441906048))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1455013312))), name = tensor("wrapped_model_language_model_layers_23_mlp_up_proj_weight_palettized"), shape = tensor([10240, 2560])]; tensor wrapped_model_language_model_layers_23_mlp_down_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1455013440))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1468120704))), name = tensor("wrapped_model_language_model_layers_23_mlp_down_proj_weight_palettized"), shape = tensor([2560, 10240])]; tensor wrapped_model_language_model_layers_24_self_attn_q_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1468120832))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1470742336))), name = tensor("wrapped_model_language_model_layers_24_self_attn_q_proj_weight_palettized"), shape = tensor([2048, 2560])]; tensor wrapped_model_language_model_layers_24_self_attn_k_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1470742464))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1472053248))), name = tensor("wrapped_model_language_model_layers_24_self_attn_k_proj_weight_palettized"), shape = tensor([1024, 2560])]; tensor wrapped_model_language_model_layers_24_self_attn_v_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1472053376))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1473364160))), name = tensor("wrapped_model_language_model_layers_24_self_attn_v_proj_weight_palettized"), shape = tensor([1024, 2560])]; tensor wrapped_model_language_model_layers_24_self_attn_o_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1473364288))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1475985792))), name = tensor("wrapped_model_language_model_layers_24_self_attn_o_proj_weight_palettized"), shape = tensor([2560, 2048])]; tensor wrapped_model_language_model_layers_24_mlp_gate_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1475985920))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1489093184))), name = tensor("wrapped_model_language_model_layers_24_mlp_gate_proj_weight_palettized"), shape = tensor([10240, 2560])]; tensor wrapped_model_language_model_layers_24_mlp_up_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1489093312))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1502200576))), name = tensor("wrapped_model_language_model_layers_24_mlp_up_proj_weight_palettized"), shape = tensor([10240, 2560])]; tensor wrapped_model_language_model_layers_24_mlp_down_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1502200704))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1515307968))), name = tensor("wrapped_model_language_model_layers_24_mlp_down_proj_weight_palettized"), shape = tensor([2560, 10240])]; tensor wrapped_model_language_model_layers_25_self_attn_q_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1515308096))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1517929600))), name = tensor("wrapped_model_language_model_layers_25_self_attn_q_proj_weight_palettized"), shape = tensor([2048, 2560])]; tensor wrapped_model_language_model_layers_25_self_attn_k_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1517929728))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1519240512))), name = tensor("wrapped_model_language_model_layers_25_self_attn_k_proj_weight_palettized"), shape = tensor([1024, 2560])]; tensor wrapped_model_language_model_layers_25_self_attn_v_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1519240640))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1520551424))), name = tensor("wrapped_model_language_model_layers_25_self_attn_v_proj_weight_palettized"), shape = tensor([1024, 2560])]; tensor wrapped_model_language_model_layers_25_self_attn_o_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1520551552))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1523173056))), name = tensor("wrapped_model_language_model_layers_25_self_attn_o_proj_weight_palettized"), shape = tensor([2560, 2048])]; tensor wrapped_model_language_model_layers_25_mlp_gate_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1523173184))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1536280448))), name = tensor("wrapped_model_language_model_layers_25_mlp_gate_proj_weight_palettized"), shape = tensor([10240, 2560])]; tensor wrapped_model_language_model_layers_25_mlp_up_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1536280576))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1549387840))), name = tensor("wrapped_model_language_model_layers_25_mlp_up_proj_weight_palettized"), shape = tensor([10240, 2560])]; tensor wrapped_model_language_model_layers_25_mlp_down_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1549387968))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1562495232))), name = tensor("wrapped_model_language_model_layers_25_mlp_down_proj_weight_palettized"), shape = tensor([2560, 10240])]; tensor wrapped_model_language_model_layers_26_self_attn_q_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1562495360))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1565116864))), name = tensor("wrapped_model_language_model_layers_26_self_attn_q_proj_weight_palettized"), shape = tensor([2048, 2560])]; tensor wrapped_model_language_model_layers_26_self_attn_k_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1565116992))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1566427776))), name = tensor("wrapped_model_language_model_layers_26_self_attn_k_proj_weight_palettized"), shape = tensor([1024, 2560])]; tensor wrapped_model_language_model_layers_26_self_attn_v_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1566427904))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1567738688))), name = tensor("wrapped_model_language_model_layers_26_self_attn_v_proj_weight_palettized"), shape = tensor([1024, 2560])]; tensor wrapped_model_language_model_layers_26_self_attn_o_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1567738816))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1570360320))), name = tensor("wrapped_model_language_model_layers_26_self_attn_o_proj_weight_palettized"), shape = tensor([2560, 2048])]; tensor wrapped_model_language_model_layers_26_mlp_gate_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1570360448))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1583467712))), name = tensor("wrapped_model_language_model_layers_26_mlp_gate_proj_weight_palettized"), shape = tensor([10240, 2560])]; tensor wrapped_model_language_model_layers_26_mlp_up_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1583467840))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1596575104))), name = tensor("wrapped_model_language_model_layers_26_mlp_up_proj_weight_palettized"), shape = tensor([10240, 2560])]; tensor wrapped_model_language_model_layers_26_mlp_down_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1596575232))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1609682496))), name = tensor("wrapped_model_language_model_layers_26_mlp_down_proj_weight_palettized"), shape = tensor([2560, 10240])]; tensor wrapped_model_language_model_layers_27_self_attn_q_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1609682624))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1612304128))), name = tensor("wrapped_model_language_model_layers_27_self_attn_q_proj_weight_palettized"), shape = tensor([2048, 2560])]; tensor wrapped_model_language_model_layers_27_self_attn_k_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1612304256))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1613615040))), name = tensor("wrapped_model_language_model_layers_27_self_attn_k_proj_weight_palettized"), shape = tensor([1024, 2560])]; tensor wrapped_model_language_model_layers_27_self_attn_v_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1613615168))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1614925952))), name = tensor("wrapped_model_language_model_layers_27_self_attn_v_proj_weight_palettized"), shape = tensor([1024, 2560])]; tensor wrapped_model_language_model_layers_27_self_attn_o_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1614926080))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1617547584))), name = tensor("wrapped_model_language_model_layers_27_self_attn_o_proj_weight_palettized"), shape = tensor([2560, 2048])]; tensor wrapped_model_language_model_layers_27_mlp_gate_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1617547712))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1630654976))), name = tensor("wrapped_model_language_model_layers_27_mlp_gate_proj_weight_palettized"), shape = tensor([10240, 2560])]; tensor wrapped_model_language_model_layers_27_mlp_up_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1630655104))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1643762368))), name = tensor("wrapped_model_language_model_layers_27_mlp_up_proj_weight_palettized"), shape = tensor([10240, 2560])]; tensor wrapped_model_language_model_layers_27_mlp_down_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1643762496))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1656869760))), name = tensor("wrapped_model_language_model_layers_27_mlp_down_proj_weight_palettized"), shape = tensor([2560, 10240])]; tensor wrapped_model_language_model_layers_28_self_attn_q_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1656869888))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1659491392))), name = tensor("wrapped_model_language_model_layers_28_self_attn_q_proj_weight_palettized"), shape = tensor([2048, 2560])]; tensor wrapped_model_language_model_layers_28_self_attn_k_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1659491520))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1660802304))), name = tensor("wrapped_model_language_model_layers_28_self_attn_k_proj_weight_palettized"), shape = tensor([1024, 2560])]; tensor wrapped_model_language_model_layers_28_self_attn_v_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1660802432))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1662113216))), name = tensor("wrapped_model_language_model_layers_28_self_attn_v_proj_weight_palettized"), shape = tensor([1024, 2560])]; tensor wrapped_model_language_model_layers_28_self_attn_o_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1662113344))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1664734848))), name = tensor("wrapped_model_language_model_layers_28_self_attn_o_proj_weight_palettized"), shape = tensor([2560, 2048])]; tensor wrapped_model_language_model_layers_28_mlp_gate_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1664734976))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1677842240))), name = tensor("wrapped_model_language_model_layers_28_mlp_gate_proj_weight_palettized"), shape = tensor([10240, 2560])]; tensor wrapped_model_language_model_layers_28_mlp_up_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1677842368))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1690949632))), name = tensor("wrapped_model_language_model_layers_28_mlp_up_proj_weight_palettized"), shape = tensor([10240, 2560])]; tensor wrapped_model_language_model_layers_28_mlp_down_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1690949760))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1704057024))), name = tensor("wrapped_model_language_model_layers_28_mlp_down_proj_weight_palettized"), shape = tensor([2560, 10240])]; tensor wrapped_model_language_model_layers_29_self_attn_q_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1704057152))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1706678656))), name = tensor("wrapped_model_language_model_layers_29_self_attn_q_proj_weight_palettized"), shape = tensor([2048, 2560])]; tensor wrapped_model_language_model_layers_29_self_attn_k_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1706678784))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1707989568))), name = tensor("wrapped_model_language_model_layers_29_self_attn_k_proj_weight_palettized"), shape = tensor([1024, 2560])]; tensor wrapped_model_language_model_layers_29_self_attn_v_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1707989696))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1709300480))), name = tensor("wrapped_model_language_model_layers_29_self_attn_v_proj_weight_palettized"), shape = tensor([1024, 2560])]; tensor wrapped_model_language_model_layers_29_self_attn_o_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1709300608))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1711922112))), name = tensor("wrapped_model_language_model_layers_29_self_attn_o_proj_weight_palettized"), shape = tensor([2560, 2048])]; tensor wrapped_model_language_model_layers_29_mlp_gate_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1711922240))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1725029504))), name = tensor("wrapped_model_language_model_layers_29_mlp_gate_proj_weight_palettized"), shape = tensor([10240, 2560])]; tensor wrapped_model_language_model_layers_29_mlp_up_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1725029632))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1738136896))), name = tensor("wrapped_model_language_model_layers_29_mlp_up_proj_weight_palettized"), shape = tensor([10240, 2560])]; tensor wrapped_model_language_model_layers_29_mlp_down_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1738137024))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1751244288))), name = tensor("wrapped_model_language_model_layers_29_mlp_down_proj_weight_palettized"), shape = tensor([2560, 10240])]; tensor wrapped_model_language_model_layers_30_self_attn_q_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1751244416))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1753865920))), name = tensor("wrapped_model_language_model_layers_30_self_attn_q_proj_weight_palettized"), shape = tensor([2048, 2560])]; tensor wrapped_model_language_model_layers_30_self_attn_k_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1753866048))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1755176832))), name = tensor("wrapped_model_language_model_layers_30_self_attn_k_proj_weight_palettized"), shape = tensor([1024, 2560])]; tensor wrapped_model_language_model_layers_30_self_attn_v_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1755176960))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1756487744))), name = tensor("wrapped_model_language_model_layers_30_self_attn_v_proj_weight_palettized"), shape = tensor([1024, 2560])]; tensor wrapped_model_language_model_layers_30_self_attn_o_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1756487872))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1759109376))), name = tensor("wrapped_model_language_model_layers_30_self_attn_o_proj_weight_palettized"), shape = tensor([2560, 2048])]; tensor wrapped_model_language_model_layers_30_mlp_gate_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1759109504))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1772216768))), name = tensor("wrapped_model_language_model_layers_30_mlp_gate_proj_weight_palettized"), shape = tensor([10240, 2560])]; tensor wrapped_model_language_model_layers_30_mlp_up_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1772216896))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1785324160))), name = tensor("wrapped_model_language_model_layers_30_mlp_up_proj_weight_palettized"), shape = tensor([10240, 2560])]; tensor wrapped_model_language_model_layers_30_mlp_down_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1785324288))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1798431552))), name = tensor("wrapped_model_language_model_layers_30_mlp_down_proj_weight_palettized"), shape = tensor([2560, 10240])]; tensor wrapped_model_language_model_layers_31_self_attn_q_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1798431680))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1801053184))), name = tensor("wrapped_model_language_model_layers_31_self_attn_q_proj_weight_palettized"), shape = tensor([2048, 2560])]; tensor wrapped_model_language_model_layers_31_self_attn_k_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1801053312))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1802364096))), name = tensor("wrapped_model_language_model_layers_31_self_attn_k_proj_weight_palettized"), shape = tensor([1024, 2560])]; tensor wrapped_model_language_model_layers_31_self_attn_v_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1802364224))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1803675008))), name = tensor("wrapped_model_language_model_layers_31_self_attn_v_proj_weight_palettized"), shape = tensor([1024, 2560])]; tensor wrapped_model_language_model_layers_31_self_attn_o_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1803675136))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1806296640))), name = tensor("wrapped_model_language_model_layers_31_self_attn_o_proj_weight_palettized"), shape = tensor([2560, 2048])]; tensor wrapped_model_language_model_layers_31_mlp_gate_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1806296768))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1819404032))), name = tensor("wrapped_model_language_model_layers_31_mlp_gate_proj_weight_palettized"), shape = tensor([10240, 2560])]; tensor wrapped_model_language_model_layers_31_mlp_up_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1819404160))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1832511424))), name = tensor("wrapped_model_language_model_layers_31_mlp_up_proj_weight_palettized"), shape = tensor([10240, 2560])]; tensor wrapped_model_language_model_layers_31_mlp_down_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1832511552))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1845618816))), name = tensor("wrapped_model_language_model_layers_31_mlp_down_proj_weight_palettized"), shape = tensor([2560, 10240])]; tensor wrapped_model_language_model_layers_32_self_attn_q_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1845618944))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1848240448))), name = tensor("wrapped_model_language_model_layers_32_self_attn_q_proj_weight_palettized"), shape = tensor([2048, 2560])]; tensor wrapped_model_language_model_layers_32_self_attn_k_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1848240576))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1849551360))), name = tensor("wrapped_model_language_model_layers_32_self_attn_k_proj_weight_palettized"), shape = tensor([1024, 2560])]; tensor wrapped_model_language_model_layers_32_self_attn_v_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1849551488))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1850862272))), name = tensor("wrapped_model_language_model_layers_32_self_attn_v_proj_weight_palettized"), shape = tensor([1024, 2560])]; tensor wrapped_model_language_model_layers_32_self_attn_o_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1850862400))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1853483904))), name = tensor("wrapped_model_language_model_layers_32_self_attn_o_proj_weight_palettized"), shape = tensor([2560, 2048])]; tensor wrapped_model_language_model_layers_32_mlp_gate_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1853484032))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1866591296))), name = tensor("wrapped_model_language_model_layers_32_mlp_gate_proj_weight_palettized"), shape = tensor([10240, 2560])]; tensor wrapped_model_language_model_layers_32_mlp_up_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1866591424))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1879698688))), name = tensor("wrapped_model_language_model_layers_32_mlp_up_proj_weight_palettized"), shape = tensor([10240, 2560])]; tensor wrapped_model_language_model_layers_32_mlp_down_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1879698816))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1892806080))), name = tensor("wrapped_model_language_model_layers_32_mlp_down_proj_weight_palettized"), shape = tensor([2560, 10240])]; tensor wrapped_model_language_model_layers_33_self_attn_q_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1892806208))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1895427712))), name = tensor("wrapped_model_language_model_layers_33_self_attn_q_proj_weight_palettized"), shape = tensor([2048, 2560])]; tensor wrapped_model_language_model_layers_33_self_attn_k_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1895427840))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1896738624))), name = tensor("wrapped_model_language_model_layers_33_self_attn_k_proj_weight_palettized"), shape = tensor([1024, 2560])]; tensor wrapped_model_language_model_layers_33_self_attn_v_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1896738752))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1898049536))), name = tensor("wrapped_model_language_model_layers_33_self_attn_v_proj_weight_palettized"), shape = tensor([1024, 2560])]; tensor wrapped_model_language_model_layers_33_self_attn_o_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1898049664))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1900671168))), name = tensor("wrapped_model_language_model_layers_33_self_attn_o_proj_weight_palettized"), shape = tensor([2560, 2048])]; tensor wrapped_model_language_model_layers_33_mlp_gate_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1900671296))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1913778560))), name = tensor("wrapped_model_language_model_layers_33_mlp_gate_proj_weight_palettized"), shape = tensor([10240, 2560])]; tensor wrapped_model_language_model_layers_33_mlp_up_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1913778688))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1926885952))), name = tensor("wrapped_model_language_model_layers_33_mlp_up_proj_weight_palettized"), shape = tensor([10240, 2560])]; tensor wrapped_model_language_model_layers_33_mlp_down_proj_weight_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1926886080))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1939993344))), name = tensor("wrapped_model_language_model_layers_33_mlp_down_proj_weight_palettized"), shape = tensor([2560, 10240])]; tensor var_24 = const()[name = tensor("op_24"), val = tensor(-1)]; tensor var_35_batch_dims_0 = const()[name = tensor("op_35_batch_dims_0"), val = tensor(0)]; tensor var_35_validate_indices_0 = const()[name = tensor("op_35_validate_indices_0"), val = tensor(false)]; tensor greater_equal_0_y_0 = const()[name = tensor("greater_equal_0_y_0"), val = tensor(0)]; tensor greater_equal_0 = greater_equal(x = input_ids, y = greater_equal_0_y_0)[name = tensor("greater_equal_0")]; tensor slice_by_index_0 = const()[name = tensor("slice_by_index_0"), val = tensor(262208)]; tensor add_0 = add(x = input_ids, y = slice_by_index_0)[name = tensor("add_0")]; tensor select_0 = select(a = input_ids, b = add_0, cond = greater_equal_0)[name = tensor("select_0")]; tensor greater_equal_0_y_0_1 = const()[name = tensor("greater_equal_0_y_0_1"), val = tensor(0)]; tensor greater_equal_0_1 = greater_equal(x = select_0, y = greater_equal_0_y_0_1)[name = tensor("greater_equal_0_1")]; tensor slice_by_index_0_1 = const()[name = tensor("slice_by_index_0_1"), val = tensor(262208)]; tensor add_0_1 = add(x = select_0, y = slice_by_index_0_1)[name = tensor("add_0_1")]; tensor select_0_1 = select(a = select_0, b = add_0_1, cond = greater_equal_0_1)[name = tensor("select_0_1")]; tensor op_35_axis_0 = const()[name = tensor("op_35_axis_0"), val = tensor(0)]; tensor op_35 = gather(axis = op_35_axis_0, batch_dims = var_35_batch_dims_0, indices = select_0_1, validate_indices = var_35_validate_indices_0, x = wrapped_model_language_model_embed_tokens_weight_palettized)[name = tensor("op_35")]; tensor const_0 = const()[name = tensor("const_0"), val = tensor(0x1.94cp+5)]; tensor inputs_embeds = mul(x = op_35, y = const_0)[name = tensor("inputs_embeds")]; tensor var_22_promoted_to_fp16 = const()[name = tensor("op_22_promoted_to_fp16"), val = tensor(0x1p+1)]; tensor var_219_cast_fp16 = pow(x = inputs_embeds, y = var_22_promoted_to_fp16)[name = tensor("op_219_cast_fp16")]; tensor var_221_axes_0 = const()[name = tensor("op_221_axes_0"), val = tensor([-1])]; tensor var_221_keep_dims_0 = const()[name = tensor("op_221_keep_dims_0"), val = tensor(true)]; tensor var_221_cast_fp16 = reduce_mean(axes = var_221_axes_0, keep_dims = var_221_keep_dims_0, x = var_219_cast_fp16)[name = tensor("op_221_cast_fp16")]; tensor var_222_to_fp16 = const()[name = tensor("op_222_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_223_cast_fp16 = add(x = var_221_cast_fp16, y = var_222_to_fp16)[name = tensor("op_223_cast_fp16")]; tensor var_224_epsilon_0 = const()[name = tensor("op_224_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_224_cast_fp16 = rsqrt(epsilon = var_224_epsilon_0, x = var_223_cast_fp16)[name = tensor("op_224_cast_fp16")]; tensor output_1_cast_fp16 = mul(x = inputs_embeds, y = var_224_cast_fp16)[name = tensor("output_1_cast_fp16")]; tensor var_228_to_fp16 = const()[name = tensor("op_228_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1939993472)))]; tensor output_3_cast_fp16 = mul(x = output_1_cast_fp16, y = var_228_to_fp16)[name = tensor("output_3_cast_fp16")]; tensor linear_0_bias_0 = const()[name = tensor("linear_0_bias_0"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1939998656)))]; tensor var_240 = linear(bias = linear_0_bias_0, weight = wrapped_model_language_model_layers_0_self_attn_q_proj_weight_palettized, x = output_3_cast_fp16)[name = tensor("linear_0")]; tensor var_241 = const()[name = tensor("op_241"), val = tensor([1, 256, -1, 256])]; tensor var_242 = reshape(shape = var_241, x = var_240)[name = tensor("op_242")]; tensor x_3_perm_0 = const()[name = tensor("x_3_perm_0"), val = tensor([0, 2, 1, 3])]; tensor linear_1_bias_0 = const()[name = tensor("linear_1_bias_0"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940002816)))]; tensor var_245 = linear(bias = linear_1_bias_0, weight = wrapped_model_language_model_layers_0_self_attn_k_proj_weight_palettized, x = output_3_cast_fp16)[name = tensor("linear_1")]; tensor var_246 = const()[name = tensor("op_246"), val = tensor([1, 256, -1, 256])]; tensor var_247 = reshape(shape = var_246, x = var_245)[name = tensor("op_247")]; tensor x_7_perm_0 = const()[name = tensor("x_7_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_250 = linear(bias = linear_1_bias_0, weight = wrapped_model_language_model_layers_0_self_attn_v_proj_weight_palettized, x = output_3_cast_fp16)[name = tensor("linear_2")]; tensor var_251 = const()[name = tensor("op_251"), val = tensor([1, 256, -1, 256])]; tensor var_252 = reshape(shape = var_251, x = var_250)[name = tensor("op_252")]; tensor hidden_states_7_perm_0 = const()[name = tensor("hidden_states_7_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_22_promoted_1_to_fp16 = const()[name = tensor("op_22_promoted_1_to_fp16"), val = tensor(0x1p+1)]; tensor x_3 = transpose(perm = x_3_perm_0, x = var_242)[name = tensor("transpose_135")]; tensor var_256_cast_fp16 = pow(x = x_3, y = var_22_promoted_1_to_fp16)[name = tensor("op_256_cast_fp16")]; tensor var_258_axes_0 = const()[name = tensor("op_258_axes_0"), val = tensor([-1])]; tensor var_258_keep_dims_0 = const()[name = tensor("op_258_keep_dims_0"), val = tensor(true)]; tensor var_258_cast_fp16 = reduce_mean(axes = var_258_axes_0, keep_dims = var_258_keep_dims_0, x = var_256_cast_fp16)[name = tensor("op_258_cast_fp16")]; tensor var_259_to_fp16 = const()[name = tensor("op_259_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_260_cast_fp16 = add(x = var_258_cast_fp16, y = var_259_to_fp16)[name = tensor("op_260_cast_fp16")]; tensor var_261_epsilon_0 = const()[name = tensor("op_261_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_261_cast_fp16 = rsqrt(epsilon = var_261_epsilon_0, x = var_260_cast_fp16)[name = tensor("op_261_cast_fp16")]; tensor output_5_cast_fp16 = mul(x = x_3, y = var_261_cast_fp16)[name = tensor("output_5_cast_fp16")]; tensor var_265_to_fp16 = const()[name = tensor("op_265_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940004928)))]; tensor output_7_cast_fp16 = mul(x = output_5_cast_fp16, y = var_265_to_fp16)[name = tensor("output_7_cast_fp16")]; tensor var_22_promoted_2_to_fp16 = const()[name = tensor("op_22_promoted_2_to_fp16"), val = tensor(0x1p+1)]; tensor x_7 = transpose(perm = x_7_perm_0, x = var_247)[name = tensor("transpose_134")]; tensor var_270_cast_fp16 = pow(x = x_7, y = var_22_promoted_2_to_fp16)[name = tensor("op_270_cast_fp16")]; tensor var_272_axes_0 = const()[name = tensor("op_272_axes_0"), val = tensor([-1])]; tensor var_272_keep_dims_0 = const()[name = tensor("op_272_keep_dims_0"), val = tensor(true)]; tensor var_272_cast_fp16 = reduce_mean(axes = var_272_axes_0, keep_dims = var_272_keep_dims_0, x = var_270_cast_fp16)[name = tensor("op_272_cast_fp16")]; tensor var_273_to_fp16 = const()[name = tensor("op_273_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_274_cast_fp16 = add(x = var_272_cast_fp16, y = var_273_to_fp16)[name = tensor("op_274_cast_fp16")]; tensor var_275_epsilon_0 = const()[name = tensor("op_275_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_275_cast_fp16 = rsqrt(epsilon = var_275_epsilon_0, x = var_274_cast_fp16)[name = tensor("op_275_cast_fp16")]; tensor output_9_cast_fp16 = mul(x = x_7, y = var_275_cast_fp16)[name = tensor("output_9_cast_fp16")]; tensor var_279_to_fp16 = const()[name = tensor("op_279_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940005504)))]; tensor output_11_cast_fp16 = mul(x = output_9_cast_fp16, y = var_279_to_fp16)[name = tensor("output_11_cast_fp16")]; tensor cos_7_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940006080))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940038912))), name = tensor("cos_7_palettized"), shape = tensor([1, 1, 256, 256])]; tensor sin_7_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940039040))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940071872))), name = tensor("sin_7_palettized"), shape = tensor([1, 1, 256, 256])]; tensor var_284 = mul(x = output_7_cast_fp16, y = cos_7_palettized)[name = tensor("op_284")]; tensor x1_1_begin_0 = const()[name = tensor("x1_1_begin_0"), val = tensor([0, 0, 0, 0])]; tensor x1_1_end_0 = const()[name = tensor("x1_1_end_0"), val = tensor([1, 8, 256, 128])]; tensor x1_1_end_mask_0 = const()[name = tensor("x1_1_end_mask_0"), val = tensor([true, true, true, false])]; tensor x1_1 = slice_by_index(begin = x1_1_begin_0, end = x1_1_end_0, end_mask = x1_1_end_mask_0, x = output_7_cast_fp16)[name = tensor("x1_1")]; tensor x2_1_begin_0 = const()[name = tensor("x2_1_begin_0"), val = tensor([0, 0, 0, 128])]; tensor x2_1_end_0 = const()[name = tensor("x2_1_end_0"), val = tensor([1, 8, 256, 256])]; tensor x2_1_end_mask_0 = const()[name = tensor("x2_1_end_mask_0"), val = tensor([true, true, true, true])]; tensor x2_1 = slice_by_index(begin = x2_1_begin_0, end = x2_1_end_0, end_mask = x2_1_end_mask_0, x = output_7_cast_fp16)[name = tensor("x2_1")]; tensor const_35_promoted = const()[name = tensor("const_35_promoted"), val = tensor(-0x1p+0)]; tensor var_295 = mul(x = x2_1, y = const_35_promoted)[name = tensor("op_295")]; tensor var_297_interleave_0 = const()[name = tensor("op_297_interleave_0"), val = tensor(false)]; tensor var_297 = concat(axis = var_24, interleave = var_297_interleave_0, values = (var_295, x1_1))[name = tensor("op_297")]; tensor var_298 = mul(x = var_297, y = sin_7_palettized)[name = tensor("op_298")]; tensor query_1 = add(x = var_284, y = var_298)[name = tensor("query_1")]; tensor var_300 = mul(x = output_11_cast_fp16, y = cos_7_palettized)[name = tensor("op_300")]; tensor x1_3_begin_0 = const()[name = tensor("x1_3_begin_0"), val = tensor([0, 0, 0, 0])]; tensor x1_3_end_0 = const()[name = tensor("x1_3_end_0"), val = tensor([1, 4, 256, 128])]; tensor x1_3_end_mask_0 = const()[name = tensor("x1_3_end_mask_0"), val = tensor([true, true, true, false])]; tensor x1_3 = slice_by_index(begin = x1_3_begin_0, end = x1_3_end_0, end_mask = x1_3_end_mask_0, x = output_11_cast_fp16)[name = tensor("x1_3")]; tensor x2_3_begin_0 = const()[name = tensor("x2_3_begin_0"), val = tensor([0, 0, 0, 128])]; tensor x2_3_end_0 = const()[name = tensor("x2_3_end_0"), val = tensor([1, 4, 256, 256])]; tensor x2_3_end_mask_0 = const()[name = tensor("x2_3_end_mask_0"), val = tensor([true, true, true, true])]; tensor x2_3 = slice_by_index(begin = x2_3_begin_0, end = x2_3_end_0, end_mask = x2_3_end_mask_0, x = output_11_cast_fp16)[name = tensor("x2_3")]; tensor const_38_promoted = const()[name = tensor("const_38_promoted"), val = tensor(-0x1p+0)]; tensor var_311 = mul(x = x2_3, y = const_38_promoted)[name = tensor("op_311")]; tensor var_313_interleave_0 = const()[name = tensor("op_313_interleave_0"), val = tensor(false)]; tensor var_313 = concat(axis = var_24, interleave = var_313_interleave_0, values = (var_311, x1_3))[name = tensor("op_313")]; tensor var_314 = mul(x = var_313, y = sin_7_palettized)[name = tensor("op_314")]; tensor hidden_states_3 = add(x = var_300, y = var_314)[name = tensor("hidden_states_3")]; tensor var_323_axes_0 = const()[name = tensor("op_323_axes_0"), val = tensor([2])]; tensor var_323 = expand_dims(axes = var_323_axes_0, x = hidden_states_3)[name = tensor("op_323")]; tensor hidden_states_5_reps_0 = const()[name = tensor("hidden_states_5_reps_0"), val = tensor([1, 1, 2, 1, 1])]; tensor hidden_states_5 = tile(reps = hidden_states_5_reps_0, x = var_323)[name = tensor("hidden_states_5")]; tensor var_331 = const()[name = tensor("op_331"), val = tensor([1, 8, 256, 256])]; tensor key_states_1 = reshape(shape = var_331, x = hidden_states_5)[name = tensor("key_states_1")]; tensor var_340_axes_0 = const()[name = tensor("op_340_axes_0"), val = tensor([2])]; tensor hidden_states_7 = transpose(perm = hidden_states_7_perm_0, x = var_252)[name = tensor("transpose_133")]; tensor var_340 = expand_dims(axes = var_340_axes_0, x = hidden_states_7)[name = tensor("op_340")]; tensor hidden_states_9_reps_0 = const()[name = tensor("hidden_states_9_reps_0"), val = tensor([1, 1, 2, 1, 1])]; tensor hidden_states_9 = tile(reps = hidden_states_9_reps_0, x = var_340)[name = tensor("hidden_states_9")]; tensor var_348 = const()[name = tensor("op_348"), val = tensor([1, 8, 256, 256])]; tensor value_states_1 = reshape(shape = var_348, x = hidden_states_9)[name = tensor("value_states_1")]; tensor var_351_transpose_x_1 = const()[name = tensor("op_351_transpose_x_1"), val = tensor(false)]; tensor var_351_transpose_y_1 = const()[name = tensor("op_351_transpose_y_1"), val = tensor(true)]; tensor var_351 = matmul(transpose_x = var_351_transpose_x_1, transpose_y = var_351_transpose_y_1, x = query_1, y = key_states_1)[name = tensor("op_351")]; tensor var_352_to_fp16 = const()[name = tensor("op_352_to_fp16"), val = tensor(0x1p-4)]; tensor attn_weights_1_cast_fp16 = mul(x = var_351, y = var_352_to_fp16)[name = tensor("attn_weights_1_cast_fp16")]; tensor attention_mask_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940072000))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940104832))), name = tensor("attention_mask_to_fp16_palettized"), shape = tensor([1, 1, 256, 256])]; tensor input_1_cast_fp16 = add(x = attn_weights_1_cast_fp16, y = attention_mask_to_fp16_palettized)[name = tensor("input_1_cast_fp16")]; tensor var_360_cast_fp16 = softmax(axis = var_24, x = input_1_cast_fp16)[name = tensor("op_360_cast_fp16")]; tensor attn_output_1_transpose_x_0 = const()[name = tensor("attn_output_1_transpose_x_0"), val = tensor(false)]; tensor attn_output_1_transpose_y_0 = const()[name = tensor("attn_output_1_transpose_y_0"), val = tensor(false)]; tensor attn_output_1 = matmul(transpose_x = attn_output_1_transpose_x_0, transpose_y = attn_output_1_transpose_y_0, x = var_360_cast_fp16, y = value_states_1)[name = tensor("attn_output_1")]; tensor var_364_perm_0 = const()[name = tensor("op_364_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_366 = const()[name = tensor("op_366"), val = tensor([1, 256, -1])]; tensor var_364 = transpose(perm = var_364_perm_0, x = attn_output_1)[name = tensor("transpose_132")]; tensor var_367 = reshape(shape = var_366, x = var_364)[name = tensor("op_367")]; tensor linear_3_bias_0 = const()[name = tensor("linear_3_bias_0"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940104960)))]; tensor x_11 = linear(bias = linear_3_bias_0, weight = wrapped_model_language_model_layers_0_self_attn_o_proj_weight_palettized, x = var_367)[name = tensor("linear_3")]; tensor var_22_promoted_3_to_fp16 = const()[name = tensor("op_22_promoted_3_to_fp16"), val = tensor(0x1p+1)]; tensor var_373_cast_fp16 = pow(x = x_11, y = var_22_promoted_3_to_fp16)[name = tensor("op_373_cast_fp16")]; tensor var_375_axes_0 = const()[name = tensor("op_375_axes_0"), val = tensor([-1])]; tensor var_375_keep_dims_0 = const()[name = tensor("op_375_keep_dims_0"), val = tensor(true)]; tensor var_375_cast_fp16 = reduce_mean(axes = var_375_axes_0, keep_dims = var_375_keep_dims_0, x = var_373_cast_fp16)[name = tensor("op_375_cast_fp16")]; tensor var_376_to_fp16 = const()[name = tensor("op_376_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_377_cast_fp16 = add(x = var_375_cast_fp16, y = var_376_to_fp16)[name = tensor("op_377_cast_fp16")]; tensor var_378_epsilon_0 = const()[name = tensor("op_378_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_378_cast_fp16 = rsqrt(epsilon = var_378_epsilon_0, x = var_377_cast_fp16)[name = tensor("op_378_cast_fp16")]; tensor output_13_cast_fp16 = mul(x = x_11, y = var_378_cast_fp16)[name = tensor("output_13_cast_fp16")]; tensor var_382_to_fp16 = const()[name = tensor("op_382_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940110144)))]; tensor output_15_cast_fp16 = mul(x = output_13_cast_fp16, y = var_382_to_fp16)[name = tensor("output_15_cast_fp16")]; tensor x_15 = add(x = inputs_embeds, y = output_15_cast_fp16)[name = tensor("x_15")]; tensor var_22_promoted_4_to_fp16 = const()[name = tensor("op_22_promoted_4_to_fp16"), val = tensor(0x1p+1)]; tensor var_388_cast_fp16 = pow(x = x_15, y = var_22_promoted_4_to_fp16)[name = tensor("op_388_cast_fp16")]; tensor var_390_axes_0 = const()[name = tensor("op_390_axes_0"), val = tensor([-1])]; tensor var_390_keep_dims_0 = const()[name = tensor("op_390_keep_dims_0"), val = tensor(true)]; tensor var_390_cast_fp16 = reduce_mean(axes = var_390_axes_0, keep_dims = var_390_keep_dims_0, x = var_388_cast_fp16)[name = tensor("op_390_cast_fp16")]; tensor var_391_to_fp16 = const()[name = tensor("op_391_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_392_cast_fp16 = add(x = var_390_cast_fp16, y = var_391_to_fp16)[name = tensor("op_392_cast_fp16")]; tensor var_393_epsilon_0 = const()[name = tensor("op_393_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_393_cast_fp16 = rsqrt(epsilon = var_393_epsilon_0, x = var_392_cast_fp16)[name = tensor("op_393_cast_fp16")]; tensor output_17_cast_fp16 = mul(x = x_15, y = var_393_cast_fp16)[name = tensor("output_17_cast_fp16")]; tensor var_397_to_fp16 = const()[name = tensor("op_397_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940115328)))]; tensor output_19_cast_fp16 = mul(x = output_17_cast_fp16, y = var_397_to_fp16)[name = tensor("output_19_cast_fp16")]; tensor linear_4_bias_0 = const()[name = tensor("linear_4_bias_0"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940120512)))]; tensor input_9 = linear(bias = linear_4_bias_0, weight = wrapped_model_language_model_layers_0_mlp_gate_proj_weight_palettized, x = output_19_cast_fp16)[name = tensor("linear_4")]; tensor var_405_mode_0 = const()[name = tensor("op_405_mode_0"), val = tensor("TANH_APPROXIMATION")]; tensor var_405 = gelu(mode = var_405_mode_0, x = input_9)[name = tensor("op_405")]; tensor var_407 = linear(bias = linear_4_bias_0, weight = wrapped_model_language_model_layers_0_mlp_up_proj_weight_palettized, x = output_19_cast_fp16)[name = tensor("linear_5")]; tensor input_11 = mul(x = var_405, y = var_407)[name = tensor("input_11")]; tensor x_19 = linear(bias = linear_3_bias_0, weight = wrapped_model_language_model_layers_0_mlp_down_proj_weight_palettized, x = input_11)[name = tensor("linear_6")]; tensor var_22_promoted_5_to_fp16 = const()[name = tensor("op_22_promoted_5_to_fp16"), val = tensor(0x1p+1)]; tensor var_413_cast_fp16 = pow(x = x_19, y = var_22_promoted_5_to_fp16)[name = tensor("op_413_cast_fp16")]; tensor var_415_axes_0 = const()[name = tensor("op_415_axes_0"), val = tensor([-1])]; tensor var_415_keep_dims_0 = const()[name = tensor("op_415_keep_dims_0"), val = tensor(true)]; tensor var_415_cast_fp16 = reduce_mean(axes = var_415_axes_0, keep_dims = var_415_keep_dims_0, x = var_413_cast_fp16)[name = tensor("op_415_cast_fp16")]; tensor var_416_to_fp16 = const()[name = tensor("op_416_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_417_cast_fp16 = add(x = var_415_cast_fp16, y = var_416_to_fp16)[name = tensor("op_417_cast_fp16")]; tensor var_418_epsilon_0 = const()[name = tensor("op_418_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_418_cast_fp16 = rsqrt(epsilon = var_418_epsilon_0, x = var_417_cast_fp16)[name = tensor("op_418_cast_fp16")]; tensor output_21_cast_fp16 = mul(x = x_19, y = var_418_cast_fp16)[name = tensor("output_21_cast_fp16")]; tensor var_422_to_fp16 = const()[name = tensor("op_422_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940141056)))]; tensor output_23_cast_fp16 = mul(x = output_21_cast_fp16, y = var_422_to_fp16)[name = tensor("output_23_cast_fp16")]; tensor x_23 = add(x = x_15, y = output_23_cast_fp16)[name = tensor("x_23")]; tensor var_22_promoted_6_to_fp16 = const()[name = tensor("op_22_promoted_6_to_fp16"), val = tensor(0x1p+1)]; tensor var_434_cast_fp16 = pow(x = x_23, y = var_22_promoted_6_to_fp16)[name = tensor("op_434_cast_fp16")]; tensor var_436_axes_0 = const()[name = tensor("op_436_axes_0"), val = tensor([-1])]; tensor var_436_keep_dims_0 = const()[name = tensor("op_436_keep_dims_0"), val = tensor(true)]; tensor var_436_cast_fp16 = reduce_mean(axes = var_436_axes_0, keep_dims = var_436_keep_dims_0, x = var_434_cast_fp16)[name = tensor("op_436_cast_fp16")]; tensor var_437_to_fp16 = const()[name = tensor("op_437_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_438_cast_fp16 = add(x = var_436_cast_fp16, y = var_437_to_fp16)[name = tensor("op_438_cast_fp16")]; tensor var_439_epsilon_0 = const()[name = tensor("op_439_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_439_cast_fp16 = rsqrt(epsilon = var_439_epsilon_0, x = var_438_cast_fp16)[name = tensor("op_439_cast_fp16")]; tensor output_25_cast_fp16 = mul(x = x_23, y = var_439_cast_fp16)[name = tensor("output_25_cast_fp16")]; tensor var_443_to_fp16 = const()[name = tensor("op_443_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940146240)))]; tensor output_27_cast_fp16 = mul(x = output_25_cast_fp16, y = var_443_to_fp16)[name = tensor("output_27_cast_fp16")]; tensor var_455 = linear(bias = linear_0_bias_0, weight = wrapped_model_language_model_layers_1_self_attn_q_proj_weight_palettized, x = output_27_cast_fp16)[name = tensor("linear_7")]; tensor var_456 = const()[name = tensor("op_456"), val = tensor([1, 256, -1, 256])]; tensor var_457 = reshape(shape = var_456, x = var_455)[name = tensor("op_457")]; tensor x_27_perm_0 = const()[name = tensor("x_27_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_460 = linear(bias = linear_1_bias_0, weight = wrapped_model_language_model_layers_1_self_attn_k_proj_weight_palettized, x = output_27_cast_fp16)[name = tensor("linear_8")]; tensor var_461 = const()[name = tensor("op_461"), val = tensor([1, 256, -1, 256])]; tensor var_462 = reshape(shape = var_461, x = var_460)[name = tensor("op_462")]; tensor x_31_perm_0 = const()[name = tensor("x_31_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_465 = linear(bias = linear_1_bias_0, weight = wrapped_model_language_model_layers_1_self_attn_v_proj_weight_palettized, x = output_27_cast_fp16)[name = tensor("linear_9")]; tensor var_466 = const()[name = tensor("op_466"), val = tensor([1, 256, -1, 256])]; tensor var_467 = reshape(shape = var_466, x = var_465)[name = tensor("op_467")]; tensor hidden_states_21_perm_0 = const()[name = tensor("hidden_states_21_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_22_promoted_7_to_fp16 = const()[name = tensor("op_22_promoted_7_to_fp16"), val = tensor(0x1p+1)]; tensor x_27 = transpose(perm = x_27_perm_0, x = var_457)[name = tensor("transpose_131")]; tensor var_471_cast_fp16 = pow(x = x_27, y = var_22_promoted_7_to_fp16)[name = tensor("op_471_cast_fp16")]; tensor var_473_axes_0 = const()[name = tensor("op_473_axes_0"), val = tensor([-1])]; tensor var_473_keep_dims_0 = const()[name = tensor("op_473_keep_dims_0"), val = tensor(true)]; tensor var_473_cast_fp16 = reduce_mean(axes = var_473_axes_0, keep_dims = var_473_keep_dims_0, x = var_471_cast_fp16)[name = tensor("op_473_cast_fp16")]; tensor var_474_to_fp16 = const()[name = tensor("op_474_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_475_cast_fp16 = add(x = var_473_cast_fp16, y = var_474_to_fp16)[name = tensor("op_475_cast_fp16")]; tensor var_476_epsilon_0 = const()[name = tensor("op_476_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_476_cast_fp16 = rsqrt(epsilon = var_476_epsilon_0, x = var_475_cast_fp16)[name = tensor("op_476_cast_fp16")]; tensor output_29_cast_fp16 = mul(x = x_27, y = var_476_cast_fp16)[name = tensor("output_29_cast_fp16")]; tensor var_480_to_fp16 = const()[name = tensor("op_480_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940151424)))]; tensor output_31_cast_fp16 = mul(x = output_29_cast_fp16, y = var_480_to_fp16)[name = tensor("output_31_cast_fp16")]; tensor var_22_promoted_8_to_fp16 = const()[name = tensor("op_22_promoted_8_to_fp16"), val = tensor(0x1p+1)]; tensor x_31 = transpose(perm = x_31_perm_0, x = var_462)[name = tensor("transpose_130")]; tensor var_485_cast_fp16 = pow(x = x_31, y = var_22_promoted_8_to_fp16)[name = tensor("op_485_cast_fp16")]; tensor var_487_axes_0 = const()[name = tensor("op_487_axes_0"), val = tensor([-1])]; tensor var_487_keep_dims_0 = const()[name = tensor("op_487_keep_dims_0"), val = tensor(true)]; tensor var_487_cast_fp16 = reduce_mean(axes = var_487_axes_0, keep_dims = var_487_keep_dims_0, x = var_485_cast_fp16)[name = tensor("op_487_cast_fp16")]; tensor var_488_to_fp16 = const()[name = tensor("op_488_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_489_cast_fp16 = add(x = var_487_cast_fp16, y = var_488_to_fp16)[name = tensor("op_489_cast_fp16")]; tensor var_490_epsilon_0 = const()[name = tensor("op_490_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_490_cast_fp16 = rsqrt(epsilon = var_490_epsilon_0, x = var_489_cast_fp16)[name = tensor("op_490_cast_fp16")]; tensor output_33_cast_fp16 = mul(x = x_31, y = var_490_cast_fp16)[name = tensor("output_33_cast_fp16")]; tensor var_494_to_fp16 = const()[name = tensor("op_494_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940152000)))]; tensor output_35_cast_fp16 = mul(x = output_33_cast_fp16, y = var_494_to_fp16)[name = tensor("output_35_cast_fp16")]; tensor var_499 = mul(x = output_31_cast_fp16, y = cos_7_palettized)[name = tensor("op_499")]; tensor x1_5_begin_0 = const()[name = tensor("x1_5_begin_0"), val = tensor([0, 0, 0, 0])]; tensor x1_5_end_0 = const()[name = tensor("x1_5_end_0"), val = tensor([1, 8, 256, 128])]; tensor x1_5_end_mask_0 = const()[name = tensor("x1_5_end_mask_0"), val = tensor([true, true, true, false])]; tensor x1_5 = slice_by_index(begin = x1_5_begin_0, end = x1_5_end_0, end_mask = x1_5_end_mask_0, x = output_31_cast_fp16)[name = tensor("x1_5")]; tensor x2_5_begin_0 = const()[name = tensor("x2_5_begin_0"), val = tensor([0, 0, 0, 128])]; tensor x2_5_end_0 = const()[name = tensor("x2_5_end_0"), val = tensor([1, 8, 256, 256])]; tensor x2_5_end_mask_0 = const()[name = tensor("x2_5_end_mask_0"), val = tensor([true, true, true, true])]; tensor x2_5 = slice_by_index(begin = x2_5_begin_0, end = x2_5_end_0, end_mask = x2_5_end_mask_0, x = output_31_cast_fp16)[name = tensor("x2_5")]; tensor const_58_promoted = const()[name = tensor("const_58_promoted"), val = tensor(-0x1p+0)]; tensor var_510 = mul(x = x2_5, y = const_58_promoted)[name = tensor("op_510")]; tensor var_512_interleave_0 = const()[name = tensor("op_512_interleave_0"), val = tensor(false)]; tensor var_512 = concat(axis = var_24, interleave = var_512_interleave_0, values = (var_510, x1_5))[name = tensor("op_512")]; tensor var_513 = mul(x = var_512, y = sin_7_palettized)[name = tensor("op_513")]; tensor query_3 = add(x = var_499, y = var_513)[name = tensor("query_3")]; tensor var_515 = mul(x = output_35_cast_fp16, y = cos_7_palettized)[name = tensor("op_515")]; tensor x1_7_begin_0 = const()[name = tensor("x1_7_begin_0"), val = tensor([0, 0, 0, 0])]; tensor x1_7_end_0 = const()[name = tensor("x1_7_end_0"), val = tensor([1, 4, 256, 128])]; tensor x1_7_end_mask_0 = const()[name = tensor("x1_7_end_mask_0"), val = tensor([true, true, true, false])]; tensor x1_7 = slice_by_index(begin = x1_7_begin_0, end = x1_7_end_0, end_mask = x1_7_end_mask_0, x = output_35_cast_fp16)[name = tensor("x1_7")]; tensor x2_7_begin_0 = const()[name = tensor("x2_7_begin_0"), val = tensor([0, 0, 0, 128])]; tensor x2_7_end_0 = const()[name = tensor("x2_7_end_0"), val = tensor([1, 4, 256, 256])]; tensor x2_7_end_mask_0 = const()[name = tensor("x2_7_end_mask_0"), val = tensor([true, true, true, true])]; tensor x2_7 = slice_by_index(begin = x2_7_begin_0, end = x2_7_end_0, end_mask = x2_7_end_mask_0, x = output_35_cast_fp16)[name = tensor("x2_7")]; tensor const_61_promoted = const()[name = tensor("const_61_promoted"), val = tensor(-0x1p+0)]; tensor var_526 = mul(x = x2_7, y = const_61_promoted)[name = tensor("op_526")]; tensor var_528_interleave_0 = const()[name = tensor("op_528_interleave_0"), val = tensor(false)]; tensor var_528 = concat(axis = var_24, interleave = var_528_interleave_0, values = (var_526, x1_7))[name = tensor("op_528")]; tensor var_529 = mul(x = var_528, y = sin_7_palettized)[name = tensor("op_529")]; tensor hidden_states_17 = add(x = var_515, y = var_529)[name = tensor("hidden_states_17")]; tensor var_538_axes_0 = const()[name = tensor("op_538_axes_0"), val = tensor([2])]; tensor var_538 = expand_dims(axes = var_538_axes_0, x = hidden_states_17)[name = tensor("op_538")]; tensor hidden_states_19_reps_0 = const()[name = tensor("hidden_states_19_reps_0"), val = tensor([1, 1, 2, 1, 1])]; tensor hidden_states_19 = tile(reps = hidden_states_19_reps_0, x = var_538)[name = tensor("hidden_states_19")]; tensor var_546 = const()[name = tensor("op_546"), val = tensor([1, 8, 256, 256])]; tensor key_states_3 = reshape(shape = var_546, x = hidden_states_19)[name = tensor("key_states_3")]; tensor var_555_axes_0 = const()[name = tensor("op_555_axes_0"), val = tensor([2])]; tensor hidden_states_21 = transpose(perm = hidden_states_21_perm_0, x = var_467)[name = tensor("transpose_129")]; tensor var_555 = expand_dims(axes = var_555_axes_0, x = hidden_states_21)[name = tensor("op_555")]; tensor hidden_states_23_reps_0 = const()[name = tensor("hidden_states_23_reps_0"), val = tensor([1, 1, 2, 1, 1])]; tensor hidden_states_23 = tile(reps = hidden_states_23_reps_0, x = var_555)[name = tensor("hidden_states_23")]; tensor var_563 = const()[name = tensor("op_563"), val = tensor([1, 8, 256, 256])]; tensor value_states_3 = reshape(shape = var_563, x = hidden_states_23)[name = tensor("value_states_3")]; tensor var_566_transpose_x_1 = const()[name = tensor("op_566_transpose_x_1"), val = tensor(false)]; tensor var_566_transpose_y_1 = const()[name = tensor("op_566_transpose_y_1"), val = tensor(true)]; tensor var_566 = matmul(transpose_x = var_566_transpose_x_1, transpose_y = var_566_transpose_y_1, x = query_3, y = key_states_3)[name = tensor("op_566")]; tensor var_567_to_fp16 = const()[name = tensor("op_567_to_fp16"), val = tensor(0x1p-4)]; tensor attn_weights_5_cast_fp16 = mul(x = var_566, y = var_567_to_fp16)[name = tensor("attn_weights_5_cast_fp16")]; tensor input_13_cast_fp16 = add(x = attn_weights_5_cast_fp16, y = attention_mask_to_fp16_palettized)[name = tensor("input_13_cast_fp16")]; tensor var_575_cast_fp16 = softmax(axis = var_24, x = input_13_cast_fp16)[name = tensor("op_575_cast_fp16")]; tensor attn_output_5_transpose_x_0 = const()[name = tensor("attn_output_5_transpose_x_0"), val = tensor(false)]; tensor attn_output_5_transpose_y_0 = const()[name = tensor("attn_output_5_transpose_y_0"), val = tensor(false)]; tensor attn_output_5 = matmul(transpose_x = attn_output_5_transpose_x_0, transpose_y = attn_output_5_transpose_y_0, x = var_575_cast_fp16, y = value_states_3)[name = tensor("attn_output_5")]; tensor var_579_perm_0 = const()[name = tensor("op_579_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_581 = const()[name = tensor("op_581"), val = tensor([1, 256, -1])]; tensor var_579 = transpose(perm = var_579_perm_0, x = attn_output_5)[name = tensor("transpose_128")]; tensor var_582 = reshape(shape = var_581, x = var_579)[name = tensor("op_582")]; tensor x_35 = linear(bias = linear_3_bias_0, weight = wrapped_model_language_model_layers_1_self_attn_o_proj_weight_palettized, x = var_582)[name = tensor("linear_10")]; tensor var_22_promoted_9_to_fp16 = const()[name = tensor("op_22_promoted_9_to_fp16"), val = tensor(0x1p+1)]; tensor var_588_cast_fp16 = pow(x = x_35, y = var_22_promoted_9_to_fp16)[name = tensor("op_588_cast_fp16")]; tensor var_590_axes_0 = const()[name = tensor("op_590_axes_0"), val = tensor([-1])]; tensor var_590_keep_dims_0 = const()[name = tensor("op_590_keep_dims_0"), val = tensor(true)]; tensor var_590_cast_fp16 = reduce_mean(axes = var_590_axes_0, keep_dims = var_590_keep_dims_0, x = var_588_cast_fp16)[name = tensor("op_590_cast_fp16")]; tensor var_591_to_fp16 = const()[name = tensor("op_591_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_592_cast_fp16 = add(x = var_590_cast_fp16, y = var_591_to_fp16)[name = tensor("op_592_cast_fp16")]; tensor var_593_epsilon_0 = const()[name = tensor("op_593_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_593_cast_fp16 = rsqrt(epsilon = var_593_epsilon_0, x = var_592_cast_fp16)[name = tensor("op_593_cast_fp16")]; tensor output_37_cast_fp16 = mul(x = x_35, y = var_593_cast_fp16)[name = tensor("output_37_cast_fp16")]; tensor var_597_to_fp16 = const()[name = tensor("op_597_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940152576)))]; tensor output_39_cast_fp16 = mul(x = output_37_cast_fp16, y = var_597_to_fp16)[name = tensor("output_39_cast_fp16")]; tensor x_39 = add(x = x_23, y = output_39_cast_fp16)[name = tensor("x_39")]; tensor var_22_promoted_10_to_fp16 = const()[name = tensor("op_22_promoted_10_to_fp16"), val = tensor(0x1p+1)]; tensor var_603_cast_fp16 = pow(x = x_39, y = var_22_promoted_10_to_fp16)[name = tensor("op_603_cast_fp16")]; tensor var_605_axes_0 = const()[name = tensor("op_605_axes_0"), val = tensor([-1])]; tensor var_605_keep_dims_0 = const()[name = tensor("op_605_keep_dims_0"), val = tensor(true)]; tensor var_605_cast_fp16 = reduce_mean(axes = var_605_axes_0, keep_dims = var_605_keep_dims_0, x = var_603_cast_fp16)[name = tensor("op_605_cast_fp16")]; tensor var_606_to_fp16 = const()[name = tensor("op_606_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_607_cast_fp16 = add(x = var_605_cast_fp16, y = var_606_to_fp16)[name = tensor("op_607_cast_fp16")]; tensor var_608_epsilon_0 = const()[name = tensor("op_608_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_608_cast_fp16 = rsqrt(epsilon = var_608_epsilon_0, x = var_607_cast_fp16)[name = tensor("op_608_cast_fp16")]; tensor output_41_cast_fp16 = mul(x = x_39, y = var_608_cast_fp16)[name = tensor("output_41_cast_fp16")]; tensor var_612_to_fp16 = const()[name = tensor("op_612_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940157760)))]; tensor output_43_cast_fp16 = mul(x = output_41_cast_fp16, y = var_612_to_fp16)[name = tensor("output_43_cast_fp16")]; tensor input_21 = linear(bias = linear_4_bias_0, weight = wrapped_model_language_model_layers_1_mlp_gate_proj_weight_palettized, x = output_43_cast_fp16)[name = tensor("linear_11")]; tensor var_620_mode_0 = const()[name = tensor("op_620_mode_0"), val = tensor("TANH_APPROXIMATION")]; tensor var_620 = gelu(mode = var_620_mode_0, x = input_21)[name = tensor("op_620")]; tensor var_622 = linear(bias = linear_4_bias_0, weight = wrapped_model_language_model_layers_1_mlp_up_proj_weight_palettized, x = output_43_cast_fp16)[name = tensor("linear_12")]; tensor input_23 = mul(x = var_620, y = var_622)[name = tensor("input_23")]; tensor x_43 = linear(bias = linear_3_bias_0, weight = wrapped_model_language_model_layers_1_mlp_down_proj_weight_palettized, x = input_23)[name = tensor("linear_13")]; tensor var_22_promoted_11_to_fp16 = const()[name = tensor("op_22_promoted_11_to_fp16"), val = tensor(0x1p+1)]; tensor var_628_cast_fp16 = pow(x = x_43, y = var_22_promoted_11_to_fp16)[name = tensor("op_628_cast_fp16")]; tensor var_630_axes_0 = const()[name = tensor("op_630_axes_0"), val = tensor([-1])]; tensor var_630_keep_dims_0 = const()[name = tensor("op_630_keep_dims_0"), val = tensor(true)]; tensor var_630_cast_fp16 = reduce_mean(axes = var_630_axes_0, keep_dims = var_630_keep_dims_0, x = var_628_cast_fp16)[name = tensor("op_630_cast_fp16")]; tensor var_631_to_fp16 = const()[name = tensor("op_631_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_632_cast_fp16 = add(x = var_630_cast_fp16, y = var_631_to_fp16)[name = tensor("op_632_cast_fp16")]; tensor var_633_epsilon_0 = const()[name = tensor("op_633_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_633_cast_fp16 = rsqrt(epsilon = var_633_epsilon_0, x = var_632_cast_fp16)[name = tensor("op_633_cast_fp16")]; tensor output_45_cast_fp16 = mul(x = x_43, y = var_633_cast_fp16)[name = tensor("output_45_cast_fp16")]; tensor var_637_to_fp16 = const()[name = tensor("op_637_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940162944)))]; tensor output_47_cast_fp16 = mul(x = output_45_cast_fp16, y = var_637_to_fp16)[name = tensor("output_47_cast_fp16")]; tensor x_47 = add(x = x_39, y = output_47_cast_fp16)[name = tensor("x_47")]; tensor var_22_promoted_12_to_fp16 = const()[name = tensor("op_22_promoted_12_to_fp16"), val = tensor(0x1p+1)]; tensor var_649_cast_fp16 = pow(x = x_47, y = var_22_promoted_12_to_fp16)[name = tensor("op_649_cast_fp16")]; tensor var_651_axes_0 = const()[name = tensor("op_651_axes_0"), val = tensor([-1])]; tensor var_651_keep_dims_0 = const()[name = tensor("op_651_keep_dims_0"), val = tensor(true)]; tensor var_651_cast_fp16 = reduce_mean(axes = var_651_axes_0, keep_dims = var_651_keep_dims_0, x = var_649_cast_fp16)[name = tensor("op_651_cast_fp16")]; tensor var_652_to_fp16 = const()[name = tensor("op_652_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_653_cast_fp16 = add(x = var_651_cast_fp16, y = var_652_to_fp16)[name = tensor("op_653_cast_fp16")]; tensor var_654_epsilon_0 = const()[name = tensor("op_654_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_654_cast_fp16 = rsqrt(epsilon = var_654_epsilon_0, x = var_653_cast_fp16)[name = tensor("op_654_cast_fp16")]; tensor output_49_cast_fp16 = mul(x = x_47, y = var_654_cast_fp16)[name = tensor("output_49_cast_fp16")]; tensor var_658_to_fp16 = const()[name = tensor("op_658_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940168128)))]; tensor output_51_cast_fp16 = mul(x = output_49_cast_fp16, y = var_658_to_fp16)[name = tensor("output_51_cast_fp16")]; tensor var_670 = linear(bias = linear_0_bias_0, weight = wrapped_model_language_model_layers_2_self_attn_q_proj_weight_palettized, x = output_51_cast_fp16)[name = tensor("linear_14")]; tensor var_671 = const()[name = tensor("op_671"), val = tensor([1, 256, -1, 256])]; tensor var_672 = reshape(shape = var_671, x = var_670)[name = tensor("op_672")]; tensor x_51_perm_0 = const()[name = tensor("x_51_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_675 = linear(bias = linear_1_bias_0, weight = wrapped_model_language_model_layers_2_self_attn_k_proj_weight_palettized, x = output_51_cast_fp16)[name = tensor("linear_15")]; tensor var_676 = const()[name = tensor("op_676"), val = tensor([1, 256, -1, 256])]; tensor var_677 = reshape(shape = var_676, x = var_675)[name = tensor("op_677")]; tensor x_55_perm_0 = const()[name = tensor("x_55_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_680 = linear(bias = linear_1_bias_0, weight = wrapped_model_language_model_layers_2_self_attn_v_proj_weight_palettized, x = output_51_cast_fp16)[name = tensor("linear_16")]; tensor var_681 = const()[name = tensor("op_681"), val = tensor([1, 256, -1, 256])]; tensor var_682 = reshape(shape = var_681, x = var_680)[name = tensor("op_682")]; tensor hidden_states_35_perm_0 = const()[name = tensor("hidden_states_35_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_22_promoted_13_to_fp16 = const()[name = tensor("op_22_promoted_13_to_fp16"), val = tensor(0x1p+1)]; tensor x_51 = transpose(perm = x_51_perm_0, x = var_672)[name = tensor("transpose_127")]; tensor var_686_cast_fp16 = pow(x = x_51, y = var_22_promoted_13_to_fp16)[name = tensor("op_686_cast_fp16")]; tensor var_688_axes_0 = const()[name = tensor("op_688_axes_0"), val = tensor([-1])]; tensor var_688_keep_dims_0 = const()[name = tensor("op_688_keep_dims_0"), val = tensor(true)]; tensor var_688_cast_fp16 = reduce_mean(axes = var_688_axes_0, keep_dims = var_688_keep_dims_0, x = var_686_cast_fp16)[name = tensor("op_688_cast_fp16")]; tensor var_689_to_fp16 = const()[name = tensor("op_689_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_690_cast_fp16 = add(x = var_688_cast_fp16, y = var_689_to_fp16)[name = tensor("op_690_cast_fp16")]; tensor var_691_epsilon_0 = const()[name = tensor("op_691_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_691_cast_fp16 = rsqrt(epsilon = var_691_epsilon_0, x = var_690_cast_fp16)[name = tensor("op_691_cast_fp16")]; tensor output_53_cast_fp16 = mul(x = x_51, y = var_691_cast_fp16)[name = tensor("output_53_cast_fp16")]; tensor var_695_to_fp16 = const()[name = tensor("op_695_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940173312)))]; tensor output_55_cast_fp16 = mul(x = output_53_cast_fp16, y = var_695_to_fp16)[name = tensor("output_55_cast_fp16")]; tensor var_22_promoted_14_to_fp16 = const()[name = tensor("op_22_promoted_14_to_fp16"), val = tensor(0x1p+1)]; tensor x_55 = transpose(perm = x_55_perm_0, x = var_677)[name = tensor("transpose_126")]; tensor var_700_cast_fp16 = pow(x = x_55, y = var_22_promoted_14_to_fp16)[name = tensor("op_700_cast_fp16")]; tensor var_702_axes_0 = const()[name = tensor("op_702_axes_0"), val = tensor([-1])]; tensor var_702_keep_dims_0 = const()[name = tensor("op_702_keep_dims_0"), val = tensor(true)]; tensor var_702_cast_fp16 = reduce_mean(axes = var_702_axes_0, keep_dims = var_702_keep_dims_0, x = var_700_cast_fp16)[name = tensor("op_702_cast_fp16")]; tensor var_703_to_fp16 = const()[name = tensor("op_703_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_704_cast_fp16 = add(x = var_702_cast_fp16, y = var_703_to_fp16)[name = tensor("op_704_cast_fp16")]; tensor var_705_epsilon_0 = const()[name = tensor("op_705_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_705_cast_fp16 = rsqrt(epsilon = var_705_epsilon_0, x = var_704_cast_fp16)[name = tensor("op_705_cast_fp16")]; tensor output_57_cast_fp16 = mul(x = x_55, y = var_705_cast_fp16)[name = tensor("output_57_cast_fp16")]; tensor var_709_to_fp16 = const()[name = tensor("op_709_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940173888)))]; tensor output_59_cast_fp16 = mul(x = output_57_cast_fp16, y = var_709_to_fp16)[name = tensor("output_59_cast_fp16")]; tensor var_714 = mul(x = output_55_cast_fp16, y = cos_7_palettized)[name = tensor("op_714")]; tensor x1_9_begin_0 = const()[name = tensor("x1_9_begin_0"), val = tensor([0, 0, 0, 0])]; tensor x1_9_end_0 = const()[name = tensor("x1_9_end_0"), val = tensor([1, 8, 256, 128])]; tensor x1_9_end_mask_0 = const()[name = tensor("x1_9_end_mask_0"), val = tensor([true, true, true, false])]; tensor x1_9 = slice_by_index(begin = x1_9_begin_0, end = x1_9_end_0, end_mask = x1_9_end_mask_0, x = output_55_cast_fp16)[name = tensor("x1_9")]; tensor x2_9_begin_0 = const()[name = tensor("x2_9_begin_0"), val = tensor([0, 0, 0, 128])]; tensor x2_9_end_0 = const()[name = tensor("x2_9_end_0"), val = tensor([1, 8, 256, 256])]; tensor x2_9_end_mask_0 = const()[name = tensor("x2_9_end_mask_0"), val = tensor([true, true, true, true])]; tensor x2_9 = slice_by_index(begin = x2_9_begin_0, end = x2_9_end_0, end_mask = x2_9_end_mask_0, x = output_55_cast_fp16)[name = tensor("x2_9")]; tensor const_81_promoted = const()[name = tensor("const_81_promoted"), val = tensor(-0x1p+0)]; tensor var_725 = mul(x = x2_9, y = const_81_promoted)[name = tensor("op_725")]; tensor var_727_interleave_0 = const()[name = tensor("op_727_interleave_0"), val = tensor(false)]; tensor var_727 = concat(axis = var_24, interleave = var_727_interleave_0, values = (var_725, x1_9))[name = tensor("op_727")]; tensor var_728 = mul(x = var_727, y = sin_7_palettized)[name = tensor("op_728")]; tensor query_5 = add(x = var_714, y = var_728)[name = tensor("query_5")]; tensor var_730 = mul(x = output_59_cast_fp16, y = cos_7_palettized)[name = tensor("op_730")]; tensor x1_11_begin_0 = const()[name = tensor("x1_11_begin_0"), val = tensor([0, 0, 0, 0])]; tensor x1_11_end_0 = const()[name = tensor("x1_11_end_0"), val = tensor([1, 4, 256, 128])]; tensor x1_11_end_mask_0 = const()[name = tensor("x1_11_end_mask_0"), val = tensor([true, true, true, false])]; tensor x1_11 = slice_by_index(begin = x1_11_begin_0, end = x1_11_end_0, end_mask = x1_11_end_mask_0, x = output_59_cast_fp16)[name = tensor("x1_11")]; tensor x2_11_begin_0 = const()[name = tensor("x2_11_begin_0"), val = tensor([0, 0, 0, 128])]; tensor x2_11_end_0 = const()[name = tensor("x2_11_end_0"), val = tensor([1, 4, 256, 256])]; tensor x2_11_end_mask_0 = const()[name = tensor("x2_11_end_mask_0"), val = tensor([true, true, true, true])]; tensor x2_11 = slice_by_index(begin = x2_11_begin_0, end = x2_11_end_0, end_mask = x2_11_end_mask_0, x = output_59_cast_fp16)[name = tensor("x2_11")]; tensor const_84_promoted = const()[name = tensor("const_84_promoted"), val = tensor(-0x1p+0)]; tensor var_741 = mul(x = x2_11, y = const_84_promoted)[name = tensor("op_741")]; tensor var_743_interleave_0 = const()[name = tensor("op_743_interleave_0"), val = tensor(false)]; tensor var_743 = concat(axis = var_24, interleave = var_743_interleave_0, values = (var_741, x1_11))[name = tensor("op_743")]; tensor var_744 = mul(x = var_743, y = sin_7_palettized)[name = tensor("op_744")]; tensor hidden_states_31 = add(x = var_730, y = var_744)[name = tensor("hidden_states_31")]; tensor var_753_axes_0 = const()[name = tensor("op_753_axes_0"), val = tensor([2])]; tensor var_753 = expand_dims(axes = var_753_axes_0, x = hidden_states_31)[name = tensor("op_753")]; tensor hidden_states_33_reps_0 = const()[name = tensor("hidden_states_33_reps_0"), val = tensor([1, 1, 2, 1, 1])]; tensor hidden_states_33 = tile(reps = hidden_states_33_reps_0, x = var_753)[name = tensor("hidden_states_33")]; tensor var_761 = const()[name = tensor("op_761"), val = tensor([1, 8, 256, 256])]; tensor key_states_5 = reshape(shape = var_761, x = hidden_states_33)[name = tensor("key_states_5")]; tensor var_770_axes_0 = const()[name = tensor("op_770_axes_0"), val = tensor([2])]; tensor hidden_states_35 = transpose(perm = hidden_states_35_perm_0, x = var_682)[name = tensor("transpose_125")]; tensor var_770 = expand_dims(axes = var_770_axes_0, x = hidden_states_35)[name = tensor("op_770")]; tensor hidden_states_37_reps_0 = const()[name = tensor("hidden_states_37_reps_0"), val = tensor([1, 1, 2, 1, 1])]; tensor hidden_states_37 = tile(reps = hidden_states_37_reps_0, x = var_770)[name = tensor("hidden_states_37")]; tensor var_778 = const()[name = tensor("op_778"), val = tensor([1, 8, 256, 256])]; tensor value_states_5 = reshape(shape = var_778, x = hidden_states_37)[name = tensor("value_states_5")]; tensor var_781_transpose_x_1 = const()[name = tensor("op_781_transpose_x_1"), val = tensor(false)]; tensor var_781_transpose_y_1 = const()[name = tensor("op_781_transpose_y_1"), val = tensor(true)]; tensor var_781 = matmul(transpose_x = var_781_transpose_x_1, transpose_y = var_781_transpose_y_1, x = query_5, y = key_states_5)[name = tensor("op_781")]; tensor var_782_to_fp16 = const()[name = tensor("op_782_to_fp16"), val = tensor(0x1p-4)]; tensor attn_weights_9_cast_fp16 = mul(x = var_781, y = var_782_to_fp16)[name = tensor("attn_weights_9_cast_fp16")]; tensor input_25_cast_fp16 = add(x = attn_weights_9_cast_fp16, y = attention_mask_to_fp16_palettized)[name = tensor("input_25_cast_fp16")]; tensor var_790_cast_fp16 = softmax(axis = var_24, x = input_25_cast_fp16)[name = tensor("op_790_cast_fp16")]; tensor attn_output_9_transpose_x_0 = const()[name = tensor("attn_output_9_transpose_x_0"), val = tensor(false)]; tensor attn_output_9_transpose_y_0 = const()[name = tensor("attn_output_9_transpose_y_0"), val = tensor(false)]; tensor attn_output_9 = matmul(transpose_x = attn_output_9_transpose_x_0, transpose_y = attn_output_9_transpose_y_0, x = var_790_cast_fp16, y = value_states_5)[name = tensor("attn_output_9")]; tensor var_794_perm_0 = const()[name = tensor("op_794_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_796 = const()[name = tensor("op_796"), val = tensor([1, 256, -1])]; tensor var_794 = transpose(perm = var_794_perm_0, x = attn_output_9)[name = tensor("transpose_124")]; tensor var_797 = reshape(shape = var_796, x = var_794)[name = tensor("op_797")]; tensor x_59 = linear(bias = linear_3_bias_0, weight = wrapped_model_language_model_layers_2_self_attn_o_proj_weight_palettized, x = var_797)[name = tensor("linear_17")]; tensor var_22_promoted_15_to_fp16 = const()[name = tensor("op_22_promoted_15_to_fp16"), val = tensor(0x1p+1)]; tensor var_803_cast_fp16 = pow(x = x_59, y = var_22_promoted_15_to_fp16)[name = tensor("op_803_cast_fp16")]; tensor var_805_axes_0 = const()[name = tensor("op_805_axes_0"), val = tensor([-1])]; tensor var_805_keep_dims_0 = const()[name = tensor("op_805_keep_dims_0"), val = tensor(true)]; tensor var_805_cast_fp16 = reduce_mean(axes = var_805_axes_0, keep_dims = var_805_keep_dims_0, x = var_803_cast_fp16)[name = tensor("op_805_cast_fp16")]; tensor var_806_to_fp16 = const()[name = tensor("op_806_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_807_cast_fp16 = add(x = var_805_cast_fp16, y = var_806_to_fp16)[name = tensor("op_807_cast_fp16")]; tensor var_808_epsilon_0 = const()[name = tensor("op_808_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_808_cast_fp16 = rsqrt(epsilon = var_808_epsilon_0, x = var_807_cast_fp16)[name = tensor("op_808_cast_fp16")]; tensor output_61_cast_fp16 = mul(x = x_59, y = var_808_cast_fp16)[name = tensor("output_61_cast_fp16")]; tensor var_812_to_fp16 = const()[name = tensor("op_812_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940174464)))]; tensor output_63_cast_fp16 = mul(x = output_61_cast_fp16, y = var_812_to_fp16)[name = tensor("output_63_cast_fp16")]; tensor x_63 = add(x = x_47, y = output_63_cast_fp16)[name = tensor("x_63")]; tensor var_22_promoted_16_to_fp16 = const()[name = tensor("op_22_promoted_16_to_fp16"), val = tensor(0x1p+1)]; tensor var_818_cast_fp16 = pow(x = x_63, y = var_22_promoted_16_to_fp16)[name = tensor("op_818_cast_fp16")]; tensor var_820_axes_0 = const()[name = tensor("op_820_axes_0"), val = tensor([-1])]; tensor var_820_keep_dims_0 = const()[name = tensor("op_820_keep_dims_0"), val = tensor(true)]; tensor var_820_cast_fp16 = reduce_mean(axes = var_820_axes_0, keep_dims = var_820_keep_dims_0, x = var_818_cast_fp16)[name = tensor("op_820_cast_fp16")]; tensor var_821_to_fp16 = const()[name = tensor("op_821_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_822_cast_fp16 = add(x = var_820_cast_fp16, y = var_821_to_fp16)[name = tensor("op_822_cast_fp16")]; tensor var_823_epsilon_0 = const()[name = tensor("op_823_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_823_cast_fp16 = rsqrt(epsilon = var_823_epsilon_0, x = var_822_cast_fp16)[name = tensor("op_823_cast_fp16")]; tensor output_65_cast_fp16 = mul(x = x_63, y = var_823_cast_fp16)[name = tensor("output_65_cast_fp16")]; tensor var_827_to_fp16 = const()[name = tensor("op_827_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940179648)))]; tensor output_67_cast_fp16 = mul(x = output_65_cast_fp16, y = var_827_to_fp16)[name = tensor("output_67_cast_fp16")]; tensor input_33 = linear(bias = linear_4_bias_0, weight = wrapped_model_language_model_layers_2_mlp_gate_proj_weight_palettized, x = output_67_cast_fp16)[name = tensor("linear_18")]; tensor var_835_mode_0 = const()[name = tensor("op_835_mode_0"), val = tensor("TANH_APPROXIMATION")]; tensor var_835 = gelu(mode = var_835_mode_0, x = input_33)[name = tensor("op_835")]; tensor var_837 = linear(bias = linear_4_bias_0, weight = wrapped_model_language_model_layers_2_mlp_up_proj_weight_palettized, x = output_67_cast_fp16)[name = tensor("linear_19")]; tensor input_35 = mul(x = var_835, y = var_837)[name = tensor("input_35")]; tensor x_67 = linear(bias = linear_3_bias_0, weight = wrapped_model_language_model_layers_2_mlp_down_proj_weight_palettized, x = input_35)[name = tensor("linear_20")]; tensor var_22_promoted_17_to_fp16 = const()[name = tensor("op_22_promoted_17_to_fp16"), val = tensor(0x1p+1)]; tensor var_843_cast_fp16 = pow(x = x_67, y = var_22_promoted_17_to_fp16)[name = tensor("op_843_cast_fp16")]; tensor var_845_axes_0 = const()[name = tensor("op_845_axes_0"), val = tensor([-1])]; tensor var_845_keep_dims_0 = const()[name = tensor("op_845_keep_dims_0"), val = tensor(true)]; tensor var_845_cast_fp16 = reduce_mean(axes = var_845_axes_0, keep_dims = var_845_keep_dims_0, x = var_843_cast_fp16)[name = tensor("op_845_cast_fp16")]; tensor var_846_to_fp16 = const()[name = tensor("op_846_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_847_cast_fp16 = add(x = var_845_cast_fp16, y = var_846_to_fp16)[name = tensor("op_847_cast_fp16")]; tensor var_848_epsilon_0 = const()[name = tensor("op_848_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_848_cast_fp16 = rsqrt(epsilon = var_848_epsilon_0, x = var_847_cast_fp16)[name = tensor("op_848_cast_fp16")]; tensor output_69_cast_fp16 = mul(x = x_67, y = var_848_cast_fp16)[name = tensor("output_69_cast_fp16")]; tensor var_852_to_fp16 = const()[name = tensor("op_852_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940184832)))]; tensor output_71_cast_fp16 = mul(x = output_69_cast_fp16, y = var_852_to_fp16)[name = tensor("output_71_cast_fp16")]; tensor x_71 = add(x = x_63, y = output_71_cast_fp16)[name = tensor("x_71")]; tensor var_22_promoted_18_to_fp16 = const()[name = tensor("op_22_promoted_18_to_fp16"), val = tensor(0x1p+1)]; tensor var_864_cast_fp16 = pow(x = x_71, y = var_22_promoted_18_to_fp16)[name = tensor("op_864_cast_fp16")]; tensor var_866_axes_0 = const()[name = tensor("op_866_axes_0"), val = tensor([-1])]; tensor var_866_keep_dims_0 = const()[name = tensor("op_866_keep_dims_0"), val = tensor(true)]; tensor var_866_cast_fp16 = reduce_mean(axes = var_866_axes_0, keep_dims = var_866_keep_dims_0, x = var_864_cast_fp16)[name = tensor("op_866_cast_fp16")]; tensor var_867_to_fp16 = const()[name = tensor("op_867_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_868_cast_fp16 = add(x = var_866_cast_fp16, y = var_867_to_fp16)[name = tensor("op_868_cast_fp16")]; tensor var_869_epsilon_0 = const()[name = tensor("op_869_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_869_cast_fp16 = rsqrt(epsilon = var_869_epsilon_0, x = var_868_cast_fp16)[name = tensor("op_869_cast_fp16")]; tensor output_73_cast_fp16 = mul(x = x_71, y = var_869_cast_fp16)[name = tensor("output_73_cast_fp16")]; tensor var_873_to_fp16 = const()[name = tensor("op_873_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940190016)))]; tensor output_75_cast_fp16 = mul(x = output_73_cast_fp16, y = var_873_to_fp16)[name = tensor("output_75_cast_fp16")]; tensor var_885 = linear(bias = linear_0_bias_0, weight = wrapped_model_language_model_layers_3_self_attn_q_proj_weight_palettized, x = output_75_cast_fp16)[name = tensor("linear_21")]; tensor var_886 = const()[name = tensor("op_886"), val = tensor([1, 256, -1, 256])]; tensor var_887 = reshape(shape = var_886, x = var_885)[name = tensor("op_887")]; tensor x_75_perm_0 = const()[name = tensor("x_75_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_890 = linear(bias = linear_1_bias_0, weight = wrapped_model_language_model_layers_3_self_attn_k_proj_weight_palettized, x = output_75_cast_fp16)[name = tensor("linear_22")]; tensor var_891 = const()[name = tensor("op_891"), val = tensor([1, 256, -1, 256])]; tensor var_892 = reshape(shape = var_891, x = var_890)[name = tensor("op_892")]; tensor x_79_perm_0 = const()[name = tensor("x_79_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_895 = linear(bias = linear_1_bias_0, weight = wrapped_model_language_model_layers_3_self_attn_v_proj_weight_palettized, x = output_75_cast_fp16)[name = tensor("linear_23")]; tensor var_896 = const()[name = tensor("op_896"), val = tensor([1, 256, -1, 256])]; tensor var_897 = reshape(shape = var_896, x = var_895)[name = tensor("op_897")]; tensor hidden_states_49_perm_0 = const()[name = tensor("hidden_states_49_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_22_promoted_19_to_fp16 = const()[name = tensor("op_22_promoted_19_to_fp16"), val = tensor(0x1p+1)]; tensor x_75 = transpose(perm = x_75_perm_0, x = var_887)[name = tensor("transpose_123")]; tensor var_901_cast_fp16 = pow(x = x_75, y = var_22_promoted_19_to_fp16)[name = tensor("op_901_cast_fp16")]; tensor var_903_axes_0 = const()[name = tensor("op_903_axes_0"), val = tensor([-1])]; tensor var_903_keep_dims_0 = const()[name = tensor("op_903_keep_dims_0"), val = tensor(true)]; tensor var_903_cast_fp16 = reduce_mean(axes = var_903_axes_0, keep_dims = var_903_keep_dims_0, x = var_901_cast_fp16)[name = tensor("op_903_cast_fp16")]; tensor var_904_to_fp16 = const()[name = tensor("op_904_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_905_cast_fp16 = add(x = var_903_cast_fp16, y = var_904_to_fp16)[name = tensor("op_905_cast_fp16")]; tensor var_906_epsilon_0 = const()[name = tensor("op_906_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_906_cast_fp16 = rsqrt(epsilon = var_906_epsilon_0, x = var_905_cast_fp16)[name = tensor("op_906_cast_fp16")]; tensor output_77_cast_fp16 = mul(x = x_75, y = var_906_cast_fp16)[name = tensor("output_77_cast_fp16")]; tensor var_910_to_fp16 = const()[name = tensor("op_910_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940195200)))]; tensor output_79_cast_fp16 = mul(x = output_77_cast_fp16, y = var_910_to_fp16)[name = tensor("output_79_cast_fp16")]; tensor var_22_promoted_20_to_fp16 = const()[name = tensor("op_22_promoted_20_to_fp16"), val = tensor(0x1p+1)]; tensor x_79 = transpose(perm = x_79_perm_0, x = var_892)[name = tensor("transpose_122")]; tensor var_915_cast_fp16 = pow(x = x_79, y = var_22_promoted_20_to_fp16)[name = tensor("op_915_cast_fp16")]; tensor var_917_axes_0 = const()[name = tensor("op_917_axes_0"), val = tensor([-1])]; tensor var_917_keep_dims_0 = const()[name = tensor("op_917_keep_dims_0"), val = tensor(true)]; tensor var_917_cast_fp16 = reduce_mean(axes = var_917_axes_0, keep_dims = var_917_keep_dims_0, x = var_915_cast_fp16)[name = tensor("op_917_cast_fp16")]; tensor var_918_to_fp16 = const()[name = tensor("op_918_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_919_cast_fp16 = add(x = var_917_cast_fp16, y = var_918_to_fp16)[name = tensor("op_919_cast_fp16")]; tensor var_920_epsilon_0 = const()[name = tensor("op_920_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_920_cast_fp16 = rsqrt(epsilon = var_920_epsilon_0, x = var_919_cast_fp16)[name = tensor("op_920_cast_fp16")]; tensor output_81_cast_fp16 = mul(x = x_79, y = var_920_cast_fp16)[name = tensor("output_81_cast_fp16")]; tensor var_924_to_fp16 = const()[name = tensor("op_924_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940195776)))]; tensor output_83_cast_fp16 = mul(x = output_81_cast_fp16, y = var_924_to_fp16)[name = tensor("output_83_cast_fp16")]; tensor var_929 = mul(x = output_79_cast_fp16, y = cos_7_palettized)[name = tensor("op_929")]; tensor x1_13_begin_0 = const()[name = tensor("x1_13_begin_0"), val = tensor([0, 0, 0, 0])]; tensor x1_13_end_0 = const()[name = tensor("x1_13_end_0"), val = tensor([1, 8, 256, 128])]; tensor x1_13_end_mask_0 = const()[name = tensor("x1_13_end_mask_0"), val = tensor([true, true, true, false])]; tensor x1_13 = slice_by_index(begin = x1_13_begin_0, end = x1_13_end_0, end_mask = x1_13_end_mask_0, x = output_79_cast_fp16)[name = tensor("x1_13")]; tensor x2_13_begin_0 = const()[name = tensor("x2_13_begin_0"), val = tensor([0, 0, 0, 128])]; tensor x2_13_end_0 = const()[name = tensor("x2_13_end_0"), val = tensor([1, 8, 256, 256])]; tensor x2_13_end_mask_0 = const()[name = tensor("x2_13_end_mask_0"), val = tensor([true, true, true, true])]; tensor x2_13 = slice_by_index(begin = x2_13_begin_0, end = x2_13_end_0, end_mask = x2_13_end_mask_0, x = output_79_cast_fp16)[name = tensor("x2_13")]; tensor const_104_promoted = const()[name = tensor("const_104_promoted"), val = tensor(-0x1p+0)]; tensor var_940 = mul(x = x2_13, y = const_104_promoted)[name = tensor("op_940")]; tensor var_942_interleave_0 = const()[name = tensor("op_942_interleave_0"), val = tensor(false)]; tensor var_942 = concat(axis = var_24, interleave = var_942_interleave_0, values = (var_940, x1_13))[name = tensor("op_942")]; tensor var_943 = mul(x = var_942, y = sin_7_palettized)[name = tensor("op_943")]; tensor query_7 = add(x = var_929, y = var_943)[name = tensor("query_7")]; tensor var_945 = mul(x = output_83_cast_fp16, y = cos_7_palettized)[name = tensor("op_945")]; tensor x1_15_begin_0 = const()[name = tensor("x1_15_begin_0"), val = tensor([0, 0, 0, 0])]; tensor x1_15_end_0 = const()[name = tensor("x1_15_end_0"), val = tensor([1, 4, 256, 128])]; tensor x1_15_end_mask_0 = const()[name = tensor("x1_15_end_mask_0"), val = tensor([true, true, true, false])]; tensor x1_15 = slice_by_index(begin = x1_15_begin_0, end = x1_15_end_0, end_mask = x1_15_end_mask_0, x = output_83_cast_fp16)[name = tensor("x1_15")]; tensor x2_15_begin_0 = const()[name = tensor("x2_15_begin_0"), val = tensor([0, 0, 0, 128])]; tensor x2_15_end_0 = const()[name = tensor("x2_15_end_0"), val = tensor([1, 4, 256, 256])]; tensor x2_15_end_mask_0 = const()[name = tensor("x2_15_end_mask_0"), val = tensor([true, true, true, true])]; tensor x2_15 = slice_by_index(begin = x2_15_begin_0, end = x2_15_end_0, end_mask = x2_15_end_mask_0, x = output_83_cast_fp16)[name = tensor("x2_15")]; tensor const_107_promoted = const()[name = tensor("const_107_promoted"), val = tensor(-0x1p+0)]; tensor var_956 = mul(x = x2_15, y = const_107_promoted)[name = tensor("op_956")]; tensor var_958_interleave_0 = const()[name = tensor("op_958_interleave_0"), val = tensor(false)]; tensor var_958 = concat(axis = var_24, interleave = var_958_interleave_0, values = (var_956, x1_15))[name = tensor("op_958")]; tensor var_959 = mul(x = var_958, y = sin_7_palettized)[name = tensor("op_959")]; tensor hidden_states_45 = add(x = var_945, y = var_959)[name = tensor("hidden_states_45")]; tensor var_968_axes_0 = const()[name = tensor("op_968_axes_0"), val = tensor([2])]; tensor var_968 = expand_dims(axes = var_968_axes_0, x = hidden_states_45)[name = tensor("op_968")]; tensor hidden_states_47_reps_0 = const()[name = tensor("hidden_states_47_reps_0"), val = tensor([1, 1, 2, 1, 1])]; tensor hidden_states_47 = tile(reps = hidden_states_47_reps_0, x = var_968)[name = tensor("hidden_states_47")]; tensor var_976 = const()[name = tensor("op_976"), val = tensor([1, 8, 256, 256])]; tensor key_states_7 = reshape(shape = var_976, x = hidden_states_47)[name = tensor("key_states_7")]; tensor var_985_axes_0 = const()[name = tensor("op_985_axes_0"), val = tensor([2])]; tensor hidden_states_49 = transpose(perm = hidden_states_49_perm_0, x = var_897)[name = tensor("transpose_121")]; tensor var_985 = expand_dims(axes = var_985_axes_0, x = hidden_states_49)[name = tensor("op_985")]; tensor hidden_states_51_reps_0 = const()[name = tensor("hidden_states_51_reps_0"), val = tensor([1, 1, 2, 1, 1])]; tensor hidden_states_51 = tile(reps = hidden_states_51_reps_0, x = var_985)[name = tensor("hidden_states_51")]; tensor var_993 = const()[name = tensor("op_993"), val = tensor([1, 8, 256, 256])]; tensor value_states_7 = reshape(shape = var_993, x = hidden_states_51)[name = tensor("value_states_7")]; tensor var_996_transpose_x_1 = const()[name = tensor("op_996_transpose_x_1"), val = tensor(false)]; tensor var_996_transpose_y_1 = const()[name = tensor("op_996_transpose_y_1"), val = tensor(true)]; tensor var_996 = matmul(transpose_x = var_996_transpose_x_1, transpose_y = var_996_transpose_y_1, x = query_7, y = key_states_7)[name = tensor("op_996")]; tensor var_997_to_fp16 = const()[name = tensor("op_997_to_fp16"), val = tensor(0x1p-4)]; tensor attn_weights_13_cast_fp16 = mul(x = var_996, y = var_997_to_fp16)[name = tensor("attn_weights_13_cast_fp16")]; tensor input_37_cast_fp16 = add(x = attn_weights_13_cast_fp16, y = attention_mask_to_fp16_palettized)[name = tensor("input_37_cast_fp16")]; tensor var_1005_cast_fp16 = softmax(axis = var_24, x = input_37_cast_fp16)[name = tensor("op_1005_cast_fp16")]; tensor attn_output_13_transpose_x_0 = const()[name = tensor("attn_output_13_transpose_x_0"), val = tensor(false)]; tensor attn_output_13_transpose_y_0 = const()[name = tensor("attn_output_13_transpose_y_0"), val = tensor(false)]; tensor attn_output_13 = matmul(transpose_x = attn_output_13_transpose_x_0, transpose_y = attn_output_13_transpose_y_0, x = var_1005_cast_fp16, y = value_states_7)[name = tensor("attn_output_13")]; tensor var_1009_perm_0 = const()[name = tensor("op_1009_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1011 = const()[name = tensor("op_1011"), val = tensor([1, 256, -1])]; tensor var_1009 = transpose(perm = var_1009_perm_0, x = attn_output_13)[name = tensor("transpose_120")]; tensor var_1012 = reshape(shape = var_1011, x = var_1009)[name = tensor("op_1012")]; tensor x_83 = linear(bias = linear_3_bias_0, weight = wrapped_model_language_model_layers_3_self_attn_o_proj_weight_palettized, x = var_1012)[name = tensor("linear_24")]; tensor var_22_promoted_21_to_fp16 = const()[name = tensor("op_22_promoted_21_to_fp16"), val = tensor(0x1p+1)]; tensor var_1018_cast_fp16 = pow(x = x_83, y = var_22_promoted_21_to_fp16)[name = tensor("op_1018_cast_fp16")]; tensor var_1020_axes_0 = const()[name = tensor("op_1020_axes_0"), val = tensor([-1])]; tensor var_1020_keep_dims_0 = const()[name = tensor("op_1020_keep_dims_0"), val = tensor(true)]; tensor var_1020_cast_fp16 = reduce_mean(axes = var_1020_axes_0, keep_dims = var_1020_keep_dims_0, x = var_1018_cast_fp16)[name = tensor("op_1020_cast_fp16")]; tensor var_1021_to_fp16 = const()[name = tensor("op_1021_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_1022_cast_fp16 = add(x = var_1020_cast_fp16, y = var_1021_to_fp16)[name = tensor("op_1022_cast_fp16")]; tensor var_1023_epsilon_0 = const()[name = tensor("op_1023_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_1023_cast_fp16 = rsqrt(epsilon = var_1023_epsilon_0, x = var_1022_cast_fp16)[name = tensor("op_1023_cast_fp16")]; tensor output_85_cast_fp16 = mul(x = x_83, y = var_1023_cast_fp16)[name = tensor("output_85_cast_fp16")]; tensor var_1027_to_fp16 = const()[name = tensor("op_1027_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940196352)))]; tensor output_87_cast_fp16 = mul(x = output_85_cast_fp16, y = var_1027_to_fp16)[name = tensor("output_87_cast_fp16")]; tensor x_87 = add(x = x_71, y = output_87_cast_fp16)[name = tensor("x_87")]; tensor var_22_promoted_22_to_fp16 = const()[name = tensor("op_22_promoted_22_to_fp16"), val = tensor(0x1p+1)]; tensor var_1033_cast_fp16 = pow(x = x_87, y = var_22_promoted_22_to_fp16)[name = tensor("op_1033_cast_fp16")]; tensor var_1035_axes_0 = const()[name = tensor("op_1035_axes_0"), val = tensor([-1])]; tensor var_1035_keep_dims_0 = const()[name = tensor("op_1035_keep_dims_0"), val = tensor(true)]; tensor var_1035_cast_fp16 = reduce_mean(axes = var_1035_axes_0, keep_dims = var_1035_keep_dims_0, x = var_1033_cast_fp16)[name = tensor("op_1035_cast_fp16")]; tensor var_1036_to_fp16 = const()[name = tensor("op_1036_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_1037_cast_fp16 = add(x = var_1035_cast_fp16, y = var_1036_to_fp16)[name = tensor("op_1037_cast_fp16")]; tensor var_1038_epsilon_0 = const()[name = tensor("op_1038_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_1038_cast_fp16 = rsqrt(epsilon = var_1038_epsilon_0, x = var_1037_cast_fp16)[name = tensor("op_1038_cast_fp16")]; tensor output_89_cast_fp16 = mul(x = x_87, y = var_1038_cast_fp16)[name = tensor("output_89_cast_fp16")]; tensor var_1042_to_fp16 = const()[name = tensor("op_1042_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940201536)))]; tensor output_91_cast_fp16 = mul(x = output_89_cast_fp16, y = var_1042_to_fp16)[name = tensor("output_91_cast_fp16")]; tensor input_45 = linear(bias = linear_4_bias_0, weight = wrapped_model_language_model_layers_3_mlp_gate_proj_weight_palettized, x = output_91_cast_fp16)[name = tensor("linear_25")]; tensor var_1050_mode_0 = const()[name = tensor("op_1050_mode_0"), val = tensor("TANH_APPROXIMATION")]; tensor var_1050 = gelu(mode = var_1050_mode_0, x = input_45)[name = tensor("op_1050")]; tensor var_1052 = linear(bias = linear_4_bias_0, weight = wrapped_model_language_model_layers_3_mlp_up_proj_weight_palettized, x = output_91_cast_fp16)[name = tensor("linear_26")]; tensor input_47 = mul(x = var_1050, y = var_1052)[name = tensor("input_47")]; tensor x_91 = linear(bias = linear_3_bias_0, weight = wrapped_model_language_model_layers_3_mlp_down_proj_weight_palettized, x = input_47)[name = tensor("linear_27")]; tensor var_22_promoted_23_to_fp16 = const()[name = tensor("op_22_promoted_23_to_fp16"), val = tensor(0x1p+1)]; tensor var_1058_cast_fp16 = pow(x = x_91, y = var_22_promoted_23_to_fp16)[name = tensor("op_1058_cast_fp16")]; tensor var_1060_axes_0 = const()[name = tensor("op_1060_axes_0"), val = tensor([-1])]; tensor var_1060_keep_dims_0 = const()[name = tensor("op_1060_keep_dims_0"), val = tensor(true)]; tensor var_1060_cast_fp16 = reduce_mean(axes = var_1060_axes_0, keep_dims = var_1060_keep_dims_0, x = var_1058_cast_fp16)[name = tensor("op_1060_cast_fp16")]; tensor var_1061_to_fp16 = const()[name = tensor("op_1061_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_1062_cast_fp16 = add(x = var_1060_cast_fp16, y = var_1061_to_fp16)[name = tensor("op_1062_cast_fp16")]; tensor var_1063_epsilon_0 = const()[name = tensor("op_1063_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_1063_cast_fp16 = rsqrt(epsilon = var_1063_epsilon_0, x = var_1062_cast_fp16)[name = tensor("op_1063_cast_fp16")]; tensor output_93_cast_fp16 = mul(x = x_91, y = var_1063_cast_fp16)[name = tensor("output_93_cast_fp16")]; tensor var_1067_to_fp16 = const()[name = tensor("op_1067_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940206720)))]; tensor output_95_cast_fp16 = mul(x = output_93_cast_fp16, y = var_1067_to_fp16)[name = tensor("output_95_cast_fp16")]; tensor x_95 = add(x = x_87, y = output_95_cast_fp16)[name = tensor("x_95")]; tensor var_22_promoted_24_to_fp16 = const()[name = tensor("op_22_promoted_24_to_fp16"), val = tensor(0x1p+1)]; tensor var_1079_cast_fp16 = pow(x = x_95, y = var_22_promoted_24_to_fp16)[name = tensor("op_1079_cast_fp16")]; tensor var_1081_axes_0 = const()[name = tensor("op_1081_axes_0"), val = tensor([-1])]; tensor var_1081_keep_dims_0 = const()[name = tensor("op_1081_keep_dims_0"), val = tensor(true)]; tensor var_1081_cast_fp16 = reduce_mean(axes = var_1081_axes_0, keep_dims = var_1081_keep_dims_0, x = var_1079_cast_fp16)[name = tensor("op_1081_cast_fp16")]; tensor var_1082_to_fp16 = const()[name = tensor("op_1082_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_1083_cast_fp16 = add(x = var_1081_cast_fp16, y = var_1082_to_fp16)[name = tensor("op_1083_cast_fp16")]; tensor var_1084_epsilon_0 = const()[name = tensor("op_1084_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_1084_cast_fp16 = rsqrt(epsilon = var_1084_epsilon_0, x = var_1083_cast_fp16)[name = tensor("op_1084_cast_fp16")]; tensor output_97_cast_fp16 = mul(x = x_95, y = var_1084_cast_fp16)[name = tensor("output_97_cast_fp16")]; tensor var_1088_to_fp16 = const()[name = tensor("op_1088_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940211904)))]; tensor output_99_cast_fp16 = mul(x = output_97_cast_fp16, y = var_1088_to_fp16)[name = tensor("output_99_cast_fp16")]; tensor var_1100 = linear(bias = linear_0_bias_0, weight = wrapped_model_language_model_layers_4_self_attn_q_proj_weight_palettized, x = output_99_cast_fp16)[name = tensor("linear_28")]; tensor var_1101 = const()[name = tensor("op_1101"), val = tensor([1, 256, -1, 256])]; tensor var_1102 = reshape(shape = var_1101, x = var_1100)[name = tensor("op_1102")]; tensor x_99_perm_0 = const()[name = tensor("x_99_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1105 = linear(bias = linear_1_bias_0, weight = wrapped_model_language_model_layers_4_self_attn_k_proj_weight_palettized, x = output_99_cast_fp16)[name = tensor("linear_29")]; tensor var_1106 = const()[name = tensor("op_1106"), val = tensor([1, 256, -1, 256])]; tensor var_1107 = reshape(shape = var_1106, x = var_1105)[name = tensor("op_1107")]; tensor x_103_perm_0 = const()[name = tensor("x_103_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1110 = linear(bias = linear_1_bias_0, weight = wrapped_model_language_model_layers_4_self_attn_v_proj_weight_palettized, x = output_99_cast_fp16)[name = tensor("linear_30")]; tensor var_1111 = const()[name = tensor("op_1111"), val = tensor([1, 256, -1, 256])]; tensor var_1112 = reshape(shape = var_1111, x = var_1110)[name = tensor("op_1112")]; tensor hidden_states_63_perm_0 = const()[name = tensor("hidden_states_63_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_22_promoted_25_to_fp16 = const()[name = tensor("op_22_promoted_25_to_fp16"), val = tensor(0x1p+1)]; tensor x_99 = transpose(perm = x_99_perm_0, x = var_1102)[name = tensor("transpose_119")]; tensor var_1116_cast_fp16 = pow(x = x_99, y = var_22_promoted_25_to_fp16)[name = tensor("op_1116_cast_fp16")]; tensor var_1118_axes_0 = const()[name = tensor("op_1118_axes_0"), val = tensor([-1])]; tensor var_1118_keep_dims_0 = const()[name = tensor("op_1118_keep_dims_0"), val = tensor(true)]; tensor var_1118_cast_fp16 = reduce_mean(axes = var_1118_axes_0, keep_dims = var_1118_keep_dims_0, x = var_1116_cast_fp16)[name = tensor("op_1118_cast_fp16")]; tensor var_1119_to_fp16 = const()[name = tensor("op_1119_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_1120_cast_fp16 = add(x = var_1118_cast_fp16, y = var_1119_to_fp16)[name = tensor("op_1120_cast_fp16")]; tensor var_1121_epsilon_0 = const()[name = tensor("op_1121_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_1121_cast_fp16 = rsqrt(epsilon = var_1121_epsilon_0, x = var_1120_cast_fp16)[name = tensor("op_1121_cast_fp16")]; tensor output_101_cast_fp16 = mul(x = x_99, y = var_1121_cast_fp16)[name = tensor("output_101_cast_fp16")]; tensor var_1125_to_fp16 = const()[name = tensor("op_1125_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940217088)))]; tensor output_103_cast_fp16 = mul(x = output_101_cast_fp16, y = var_1125_to_fp16)[name = tensor("output_103_cast_fp16")]; tensor var_22_promoted_26_to_fp16 = const()[name = tensor("op_22_promoted_26_to_fp16"), val = tensor(0x1p+1)]; tensor x_103 = transpose(perm = x_103_perm_0, x = var_1107)[name = tensor("transpose_118")]; tensor var_1130_cast_fp16 = pow(x = x_103, y = var_22_promoted_26_to_fp16)[name = tensor("op_1130_cast_fp16")]; tensor var_1132_axes_0 = const()[name = tensor("op_1132_axes_0"), val = tensor([-1])]; tensor var_1132_keep_dims_0 = const()[name = tensor("op_1132_keep_dims_0"), val = tensor(true)]; tensor var_1132_cast_fp16 = reduce_mean(axes = var_1132_axes_0, keep_dims = var_1132_keep_dims_0, x = var_1130_cast_fp16)[name = tensor("op_1132_cast_fp16")]; tensor var_1133_to_fp16 = const()[name = tensor("op_1133_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_1134_cast_fp16 = add(x = var_1132_cast_fp16, y = var_1133_to_fp16)[name = tensor("op_1134_cast_fp16")]; tensor var_1135_epsilon_0 = const()[name = tensor("op_1135_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_1135_cast_fp16 = rsqrt(epsilon = var_1135_epsilon_0, x = var_1134_cast_fp16)[name = tensor("op_1135_cast_fp16")]; tensor output_105_cast_fp16 = mul(x = x_103, y = var_1135_cast_fp16)[name = tensor("output_105_cast_fp16")]; tensor var_1139_to_fp16 = const()[name = tensor("op_1139_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940217664)))]; tensor output_107_cast_fp16 = mul(x = output_105_cast_fp16, y = var_1139_to_fp16)[name = tensor("output_107_cast_fp16")]; tensor var_1144 = mul(x = output_103_cast_fp16, y = cos_7_palettized)[name = tensor("op_1144")]; tensor x1_17_begin_0 = const()[name = tensor("x1_17_begin_0"), val = tensor([0, 0, 0, 0])]; tensor x1_17_end_0 = const()[name = tensor("x1_17_end_0"), val = tensor([1, 8, 256, 128])]; tensor x1_17_end_mask_0 = const()[name = tensor("x1_17_end_mask_0"), val = tensor([true, true, true, false])]; tensor x1_17 = slice_by_index(begin = x1_17_begin_0, end = x1_17_end_0, end_mask = x1_17_end_mask_0, x = output_103_cast_fp16)[name = tensor("x1_17")]; tensor x2_17_begin_0 = const()[name = tensor("x2_17_begin_0"), val = tensor([0, 0, 0, 128])]; tensor x2_17_end_0 = const()[name = tensor("x2_17_end_0"), val = tensor([1, 8, 256, 256])]; tensor x2_17_end_mask_0 = const()[name = tensor("x2_17_end_mask_0"), val = tensor([true, true, true, true])]; tensor x2_17 = slice_by_index(begin = x2_17_begin_0, end = x2_17_end_0, end_mask = x2_17_end_mask_0, x = output_103_cast_fp16)[name = tensor("x2_17")]; tensor const_127_promoted = const()[name = tensor("const_127_promoted"), val = tensor(-0x1p+0)]; tensor var_1155 = mul(x = x2_17, y = const_127_promoted)[name = tensor("op_1155")]; tensor var_1157_interleave_0 = const()[name = tensor("op_1157_interleave_0"), val = tensor(false)]; tensor var_1157 = concat(axis = var_24, interleave = var_1157_interleave_0, values = (var_1155, x1_17))[name = tensor("op_1157")]; tensor var_1158 = mul(x = var_1157, y = sin_7_palettized)[name = tensor("op_1158")]; tensor query_9 = add(x = var_1144, y = var_1158)[name = tensor("query_9")]; tensor var_1160 = mul(x = output_107_cast_fp16, y = cos_7_palettized)[name = tensor("op_1160")]; tensor x1_19_begin_0 = const()[name = tensor("x1_19_begin_0"), val = tensor([0, 0, 0, 0])]; tensor x1_19_end_0 = const()[name = tensor("x1_19_end_0"), val = tensor([1, 4, 256, 128])]; tensor x1_19_end_mask_0 = const()[name = tensor("x1_19_end_mask_0"), val = tensor([true, true, true, false])]; tensor x1_19 = slice_by_index(begin = x1_19_begin_0, end = x1_19_end_0, end_mask = x1_19_end_mask_0, x = output_107_cast_fp16)[name = tensor("x1_19")]; tensor x2_19_begin_0 = const()[name = tensor("x2_19_begin_0"), val = tensor([0, 0, 0, 128])]; tensor x2_19_end_0 = const()[name = tensor("x2_19_end_0"), val = tensor([1, 4, 256, 256])]; tensor x2_19_end_mask_0 = const()[name = tensor("x2_19_end_mask_0"), val = tensor([true, true, true, true])]; tensor x2_19 = slice_by_index(begin = x2_19_begin_0, end = x2_19_end_0, end_mask = x2_19_end_mask_0, x = output_107_cast_fp16)[name = tensor("x2_19")]; tensor const_130_promoted = const()[name = tensor("const_130_promoted"), val = tensor(-0x1p+0)]; tensor var_1171 = mul(x = x2_19, y = const_130_promoted)[name = tensor("op_1171")]; tensor var_1173_interleave_0 = const()[name = tensor("op_1173_interleave_0"), val = tensor(false)]; tensor var_1173 = concat(axis = var_24, interleave = var_1173_interleave_0, values = (var_1171, x1_19))[name = tensor("op_1173")]; tensor var_1174 = mul(x = var_1173, y = sin_7_palettized)[name = tensor("op_1174")]; tensor hidden_states_59 = add(x = var_1160, y = var_1174)[name = tensor("hidden_states_59")]; tensor var_1183_axes_0 = const()[name = tensor("op_1183_axes_0"), val = tensor([2])]; tensor var_1183 = expand_dims(axes = var_1183_axes_0, x = hidden_states_59)[name = tensor("op_1183")]; tensor hidden_states_61_reps_0 = const()[name = tensor("hidden_states_61_reps_0"), val = tensor([1, 1, 2, 1, 1])]; tensor hidden_states_61 = tile(reps = hidden_states_61_reps_0, x = var_1183)[name = tensor("hidden_states_61")]; tensor var_1191 = const()[name = tensor("op_1191"), val = tensor([1, 8, 256, 256])]; tensor key_states_9 = reshape(shape = var_1191, x = hidden_states_61)[name = tensor("key_states_9")]; tensor var_1200_axes_0 = const()[name = tensor("op_1200_axes_0"), val = tensor([2])]; tensor hidden_states_63 = transpose(perm = hidden_states_63_perm_0, x = var_1112)[name = tensor("transpose_117")]; tensor var_1200 = expand_dims(axes = var_1200_axes_0, x = hidden_states_63)[name = tensor("op_1200")]; tensor hidden_states_65_reps_0 = const()[name = tensor("hidden_states_65_reps_0"), val = tensor([1, 1, 2, 1, 1])]; tensor hidden_states_65 = tile(reps = hidden_states_65_reps_0, x = var_1200)[name = tensor("hidden_states_65")]; tensor var_1208 = const()[name = tensor("op_1208"), val = tensor([1, 8, 256, 256])]; tensor value_states_9 = reshape(shape = var_1208, x = hidden_states_65)[name = tensor("value_states_9")]; tensor var_1211_transpose_x_1 = const()[name = tensor("op_1211_transpose_x_1"), val = tensor(false)]; tensor var_1211_transpose_y_1 = const()[name = tensor("op_1211_transpose_y_1"), val = tensor(true)]; tensor var_1211 = matmul(transpose_x = var_1211_transpose_x_1, transpose_y = var_1211_transpose_y_1, x = query_9, y = key_states_9)[name = tensor("op_1211")]; tensor var_1212_to_fp16 = const()[name = tensor("op_1212_to_fp16"), val = tensor(0x1p-4)]; tensor attn_weights_17_cast_fp16 = mul(x = var_1211, y = var_1212_to_fp16)[name = tensor("attn_weights_17_cast_fp16")]; tensor input_49_cast_fp16 = add(x = attn_weights_17_cast_fp16, y = attention_mask_to_fp16_palettized)[name = tensor("input_49_cast_fp16")]; tensor var_1220_cast_fp16 = softmax(axis = var_24, x = input_49_cast_fp16)[name = tensor("op_1220_cast_fp16")]; tensor attn_output_17_transpose_x_0 = const()[name = tensor("attn_output_17_transpose_x_0"), val = tensor(false)]; tensor attn_output_17_transpose_y_0 = const()[name = tensor("attn_output_17_transpose_y_0"), val = tensor(false)]; tensor attn_output_17 = matmul(transpose_x = attn_output_17_transpose_x_0, transpose_y = attn_output_17_transpose_y_0, x = var_1220_cast_fp16, y = value_states_9)[name = tensor("attn_output_17")]; tensor var_1224_perm_0 = const()[name = tensor("op_1224_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1226 = const()[name = tensor("op_1226"), val = tensor([1, 256, -1])]; tensor var_1224 = transpose(perm = var_1224_perm_0, x = attn_output_17)[name = tensor("transpose_116")]; tensor var_1227 = reshape(shape = var_1226, x = var_1224)[name = tensor("op_1227")]; tensor x_107 = linear(bias = linear_3_bias_0, weight = wrapped_model_language_model_layers_4_self_attn_o_proj_weight_palettized, x = var_1227)[name = tensor("linear_31")]; tensor var_22_promoted_27_to_fp16 = const()[name = tensor("op_22_promoted_27_to_fp16"), val = tensor(0x1p+1)]; tensor var_1233_cast_fp16 = pow(x = x_107, y = var_22_promoted_27_to_fp16)[name = tensor("op_1233_cast_fp16")]; tensor var_1235_axes_0 = const()[name = tensor("op_1235_axes_0"), val = tensor([-1])]; tensor var_1235_keep_dims_0 = const()[name = tensor("op_1235_keep_dims_0"), val = tensor(true)]; tensor var_1235_cast_fp16 = reduce_mean(axes = var_1235_axes_0, keep_dims = var_1235_keep_dims_0, x = var_1233_cast_fp16)[name = tensor("op_1235_cast_fp16")]; tensor var_1236_to_fp16 = const()[name = tensor("op_1236_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_1237_cast_fp16 = add(x = var_1235_cast_fp16, y = var_1236_to_fp16)[name = tensor("op_1237_cast_fp16")]; tensor var_1238_epsilon_0 = const()[name = tensor("op_1238_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_1238_cast_fp16 = rsqrt(epsilon = var_1238_epsilon_0, x = var_1237_cast_fp16)[name = tensor("op_1238_cast_fp16")]; tensor output_109_cast_fp16 = mul(x = x_107, y = var_1238_cast_fp16)[name = tensor("output_109_cast_fp16")]; tensor var_1242_to_fp16 = const()[name = tensor("op_1242_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940218240)))]; tensor output_111_cast_fp16 = mul(x = output_109_cast_fp16, y = var_1242_to_fp16)[name = tensor("output_111_cast_fp16")]; tensor x_111 = add(x = x_95, y = output_111_cast_fp16)[name = tensor("x_111")]; tensor var_22_promoted_28_to_fp16 = const()[name = tensor("op_22_promoted_28_to_fp16"), val = tensor(0x1p+1)]; tensor var_1248_cast_fp16 = pow(x = x_111, y = var_22_promoted_28_to_fp16)[name = tensor("op_1248_cast_fp16")]; tensor var_1250_axes_0 = const()[name = tensor("op_1250_axes_0"), val = tensor([-1])]; tensor var_1250_keep_dims_0 = const()[name = tensor("op_1250_keep_dims_0"), val = tensor(true)]; tensor var_1250_cast_fp16 = reduce_mean(axes = var_1250_axes_0, keep_dims = var_1250_keep_dims_0, x = var_1248_cast_fp16)[name = tensor("op_1250_cast_fp16")]; tensor var_1251_to_fp16 = const()[name = tensor("op_1251_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_1252_cast_fp16 = add(x = var_1250_cast_fp16, y = var_1251_to_fp16)[name = tensor("op_1252_cast_fp16")]; tensor var_1253_epsilon_0 = const()[name = tensor("op_1253_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_1253_cast_fp16 = rsqrt(epsilon = var_1253_epsilon_0, x = var_1252_cast_fp16)[name = tensor("op_1253_cast_fp16")]; tensor output_113_cast_fp16 = mul(x = x_111, y = var_1253_cast_fp16)[name = tensor("output_113_cast_fp16")]; tensor var_1257_to_fp16 = const()[name = tensor("op_1257_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940223424)))]; tensor output_115_cast_fp16 = mul(x = output_113_cast_fp16, y = var_1257_to_fp16)[name = tensor("output_115_cast_fp16")]; tensor input_57 = linear(bias = linear_4_bias_0, weight = wrapped_model_language_model_layers_4_mlp_gate_proj_weight_palettized, x = output_115_cast_fp16)[name = tensor("linear_32")]; tensor var_1265_mode_0 = const()[name = tensor("op_1265_mode_0"), val = tensor("TANH_APPROXIMATION")]; tensor var_1265 = gelu(mode = var_1265_mode_0, x = input_57)[name = tensor("op_1265")]; tensor var_1267 = linear(bias = linear_4_bias_0, weight = wrapped_model_language_model_layers_4_mlp_up_proj_weight_palettized, x = output_115_cast_fp16)[name = tensor("linear_33")]; tensor input_59 = mul(x = var_1265, y = var_1267)[name = tensor("input_59")]; tensor x_115 = linear(bias = linear_3_bias_0, weight = wrapped_model_language_model_layers_4_mlp_down_proj_weight_palettized, x = input_59)[name = tensor("linear_34")]; tensor var_22_promoted_29_to_fp16 = const()[name = tensor("op_22_promoted_29_to_fp16"), val = tensor(0x1p+1)]; tensor var_1273_cast_fp16 = pow(x = x_115, y = var_22_promoted_29_to_fp16)[name = tensor("op_1273_cast_fp16")]; tensor var_1275_axes_0 = const()[name = tensor("op_1275_axes_0"), val = tensor([-1])]; tensor var_1275_keep_dims_0 = const()[name = tensor("op_1275_keep_dims_0"), val = tensor(true)]; tensor var_1275_cast_fp16 = reduce_mean(axes = var_1275_axes_0, keep_dims = var_1275_keep_dims_0, x = var_1273_cast_fp16)[name = tensor("op_1275_cast_fp16")]; tensor var_1276_to_fp16 = const()[name = tensor("op_1276_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_1277_cast_fp16 = add(x = var_1275_cast_fp16, y = var_1276_to_fp16)[name = tensor("op_1277_cast_fp16")]; tensor var_1278_epsilon_0 = const()[name = tensor("op_1278_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_1278_cast_fp16 = rsqrt(epsilon = var_1278_epsilon_0, x = var_1277_cast_fp16)[name = tensor("op_1278_cast_fp16")]; tensor output_117_cast_fp16 = mul(x = x_115, y = var_1278_cast_fp16)[name = tensor("output_117_cast_fp16")]; tensor var_1282_to_fp16 = const()[name = tensor("op_1282_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940228608)))]; tensor output_119_cast_fp16 = mul(x = output_117_cast_fp16, y = var_1282_to_fp16)[name = tensor("output_119_cast_fp16")]; tensor x_119 = add(x = x_111, y = output_119_cast_fp16)[name = tensor("x_119")]; tensor var_22_promoted_30_to_fp16 = const()[name = tensor("op_22_promoted_30_to_fp16"), val = tensor(0x1p+1)]; tensor var_1294_cast_fp16 = pow(x = x_119, y = var_22_promoted_30_to_fp16)[name = tensor("op_1294_cast_fp16")]; tensor var_1296_axes_0 = const()[name = tensor("op_1296_axes_0"), val = tensor([-1])]; tensor var_1296_keep_dims_0 = const()[name = tensor("op_1296_keep_dims_0"), val = tensor(true)]; tensor var_1296_cast_fp16 = reduce_mean(axes = var_1296_axes_0, keep_dims = var_1296_keep_dims_0, x = var_1294_cast_fp16)[name = tensor("op_1296_cast_fp16")]; tensor var_1297_to_fp16 = const()[name = tensor("op_1297_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_1298_cast_fp16 = add(x = var_1296_cast_fp16, y = var_1297_to_fp16)[name = tensor("op_1298_cast_fp16")]; tensor var_1299_epsilon_0 = const()[name = tensor("op_1299_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_1299_cast_fp16 = rsqrt(epsilon = var_1299_epsilon_0, x = var_1298_cast_fp16)[name = tensor("op_1299_cast_fp16")]; tensor output_121_cast_fp16 = mul(x = x_119, y = var_1299_cast_fp16)[name = tensor("output_121_cast_fp16")]; tensor var_1303_to_fp16 = const()[name = tensor("op_1303_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940233792)))]; tensor output_123_cast_fp16 = mul(x = output_121_cast_fp16, y = var_1303_to_fp16)[name = tensor("output_123_cast_fp16")]; tensor var_1315 = linear(bias = linear_0_bias_0, weight = wrapped_model_language_model_layers_5_self_attn_q_proj_weight_palettized, x = output_123_cast_fp16)[name = tensor("linear_35")]; tensor var_1316 = const()[name = tensor("op_1316"), val = tensor([1, 256, -1, 256])]; tensor var_1317 = reshape(shape = var_1316, x = var_1315)[name = tensor("op_1317")]; tensor x_123_perm_0 = const()[name = tensor("x_123_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1320 = linear(bias = linear_1_bias_0, weight = wrapped_model_language_model_layers_5_self_attn_k_proj_weight_palettized, x = output_123_cast_fp16)[name = tensor("linear_36")]; tensor var_1321 = const()[name = tensor("op_1321"), val = tensor([1, 256, -1, 256])]; tensor var_1322 = reshape(shape = var_1321, x = var_1320)[name = tensor("op_1322")]; tensor x_127_perm_0 = const()[name = tensor("x_127_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1325 = linear(bias = linear_1_bias_0, weight = wrapped_model_language_model_layers_5_self_attn_v_proj_weight_palettized, x = output_123_cast_fp16)[name = tensor("linear_37")]; tensor var_1326 = const()[name = tensor("op_1326"), val = tensor([1, 256, -1, 256])]; tensor var_1327 = reshape(shape = var_1326, x = var_1325)[name = tensor("op_1327")]; tensor hidden_states_77_perm_0 = const()[name = tensor("hidden_states_77_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_22_promoted_31_to_fp16 = const()[name = tensor("op_22_promoted_31_to_fp16"), val = tensor(0x1p+1)]; tensor x_123 = transpose(perm = x_123_perm_0, x = var_1317)[name = tensor("transpose_115")]; tensor var_1331_cast_fp16 = pow(x = x_123, y = var_22_promoted_31_to_fp16)[name = tensor("op_1331_cast_fp16")]; tensor var_1333_axes_0 = const()[name = tensor("op_1333_axes_0"), val = tensor([-1])]; tensor var_1333_keep_dims_0 = const()[name = tensor("op_1333_keep_dims_0"), val = tensor(true)]; tensor var_1333_cast_fp16 = reduce_mean(axes = var_1333_axes_0, keep_dims = var_1333_keep_dims_0, x = var_1331_cast_fp16)[name = tensor("op_1333_cast_fp16")]; tensor var_1334_to_fp16 = const()[name = tensor("op_1334_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_1335_cast_fp16 = add(x = var_1333_cast_fp16, y = var_1334_to_fp16)[name = tensor("op_1335_cast_fp16")]; tensor var_1336_epsilon_0 = const()[name = tensor("op_1336_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_1336_cast_fp16 = rsqrt(epsilon = var_1336_epsilon_0, x = var_1335_cast_fp16)[name = tensor("op_1336_cast_fp16")]; tensor output_125_cast_fp16 = mul(x = x_123, y = var_1336_cast_fp16)[name = tensor("output_125_cast_fp16")]; tensor var_1340_to_fp16 = const()[name = tensor("op_1340_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940238976)))]; tensor output_127_cast_fp16 = mul(x = output_125_cast_fp16, y = var_1340_to_fp16)[name = tensor("output_127_cast_fp16")]; tensor var_22_promoted_32_to_fp16 = const()[name = tensor("op_22_promoted_32_to_fp16"), val = tensor(0x1p+1)]; tensor x_127 = transpose(perm = x_127_perm_0, x = var_1322)[name = tensor("transpose_114")]; tensor var_1345_cast_fp16 = pow(x = x_127, y = var_22_promoted_32_to_fp16)[name = tensor("op_1345_cast_fp16")]; tensor var_1347_axes_0 = const()[name = tensor("op_1347_axes_0"), val = tensor([-1])]; tensor var_1347_keep_dims_0 = const()[name = tensor("op_1347_keep_dims_0"), val = tensor(true)]; tensor var_1347_cast_fp16 = reduce_mean(axes = var_1347_axes_0, keep_dims = var_1347_keep_dims_0, x = var_1345_cast_fp16)[name = tensor("op_1347_cast_fp16")]; tensor var_1348_to_fp16 = const()[name = tensor("op_1348_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_1349_cast_fp16 = add(x = var_1347_cast_fp16, y = var_1348_to_fp16)[name = tensor("op_1349_cast_fp16")]; tensor var_1350_epsilon_0 = const()[name = tensor("op_1350_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_1350_cast_fp16 = rsqrt(epsilon = var_1350_epsilon_0, x = var_1349_cast_fp16)[name = tensor("op_1350_cast_fp16")]; tensor output_129_cast_fp16 = mul(x = x_127, y = var_1350_cast_fp16)[name = tensor("output_129_cast_fp16")]; tensor var_1354_to_fp16 = const()[name = tensor("op_1354_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940239552)))]; tensor output_131_cast_fp16 = mul(x = output_129_cast_fp16, y = var_1354_to_fp16)[name = tensor("output_131_cast_fp16")]; tensor cos_19_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940240128))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940272960))), name = tensor("cos_19_palettized"), shape = tensor([1, 1, 256, 256])]; tensor sin_19_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940273088))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940305920))), name = tensor("sin_19_palettized"), shape = tensor([1, 1, 256, 256])]; tensor var_1359 = mul(x = output_127_cast_fp16, y = cos_19_palettized)[name = tensor("op_1359")]; tensor x1_21_begin_0 = const()[name = tensor("x1_21_begin_0"), val = tensor([0, 0, 0, 0])]; tensor x1_21_end_0 = const()[name = tensor("x1_21_end_0"), val = tensor([1, 8, 256, 128])]; tensor x1_21_end_mask_0 = const()[name = tensor("x1_21_end_mask_0"), val = tensor([true, true, true, false])]; tensor x1_21 = slice_by_index(begin = x1_21_begin_0, end = x1_21_end_0, end_mask = x1_21_end_mask_0, x = output_127_cast_fp16)[name = tensor("x1_21")]; tensor x2_21_begin_0 = const()[name = tensor("x2_21_begin_0"), val = tensor([0, 0, 0, 128])]; tensor x2_21_end_0 = const()[name = tensor("x2_21_end_0"), val = tensor([1, 8, 256, 256])]; tensor x2_21_end_mask_0 = const()[name = tensor("x2_21_end_mask_0"), val = tensor([true, true, true, true])]; tensor x2_21 = slice_by_index(begin = x2_21_begin_0, end = x2_21_end_0, end_mask = x2_21_end_mask_0, x = output_127_cast_fp16)[name = tensor("x2_21")]; tensor const_150_promoted = const()[name = tensor("const_150_promoted"), val = tensor(-0x1p+0)]; tensor var_1370 = mul(x = x2_21, y = const_150_promoted)[name = tensor("op_1370")]; tensor var_1372_interleave_0 = const()[name = tensor("op_1372_interleave_0"), val = tensor(false)]; tensor var_1372 = concat(axis = var_24, interleave = var_1372_interleave_0, values = (var_1370, x1_21))[name = tensor("op_1372")]; tensor var_1373 = mul(x = var_1372, y = sin_19_palettized)[name = tensor("op_1373")]; tensor query_11 = add(x = var_1359, y = var_1373)[name = tensor("query_11")]; tensor var_1375 = mul(x = output_131_cast_fp16, y = cos_19_palettized)[name = tensor("op_1375")]; tensor x1_23_begin_0 = const()[name = tensor("x1_23_begin_0"), val = tensor([0, 0, 0, 0])]; tensor x1_23_end_0 = const()[name = tensor("x1_23_end_0"), val = tensor([1, 4, 256, 128])]; tensor x1_23_end_mask_0 = const()[name = tensor("x1_23_end_mask_0"), val = tensor([true, true, true, false])]; tensor x1_23 = slice_by_index(begin = x1_23_begin_0, end = x1_23_end_0, end_mask = x1_23_end_mask_0, x = output_131_cast_fp16)[name = tensor("x1_23")]; tensor x2_23_begin_0 = const()[name = tensor("x2_23_begin_0"), val = tensor([0, 0, 0, 128])]; tensor x2_23_end_0 = const()[name = tensor("x2_23_end_0"), val = tensor([1, 4, 256, 256])]; tensor x2_23_end_mask_0 = const()[name = tensor("x2_23_end_mask_0"), val = tensor([true, true, true, true])]; tensor x2_23 = slice_by_index(begin = x2_23_begin_0, end = x2_23_end_0, end_mask = x2_23_end_mask_0, x = output_131_cast_fp16)[name = tensor("x2_23")]; tensor const_153_promoted = const()[name = tensor("const_153_promoted"), val = tensor(-0x1p+0)]; tensor var_1386 = mul(x = x2_23, y = const_153_promoted)[name = tensor("op_1386")]; tensor var_1388_interleave_0 = const()[name = tensor("op_1388_interleave_0"), val = tensor(false)]; tensor var_1388 = concat(axis = var_24, interleave = var_1388_interleave_0, values = (var_1386, x1_23))[name = tensor("op_1388")]; tensor var_1389 = mul(x = var_1388, y = sin_19_palettized)[name = tensor("op_1389")]; tensor hidden_states_73 = add(x = var_1375, y = var_1389)[name = tensor("hidden_states_73")]; tensor var_1398_axes_0 = const()[name = tensor("op_1398_axes_0"), val = tensor([2])]; tensor var_1398 = expand_dims(axes = var_1398_axes_0, x = hidden_states_73)[name = tensor("op_1398")]; tensor hidden_states_75_reps_0 = const()[name = tensor("hidden_states_75_reps_0"), val = tensor([1, 1, 2, 1, 1])]; tensor hidden_states_75 = tile(reps = hidden_states_75_reps_0, x = var_1398)[name = tensor("hidden_states_75")]; tensor var_1406 = const()[name = tensor("op_1406"), val = tensor([1, 8, 256, 256])]; tensor key_states_11 = reshape(shape = var_1406, x = hidden_states_75)[name = tensor("key_states_11")]; tensor var_1415_axes_0 = const()[name = tensor("op_1415_axes_0"), val = tensor([2])]; tensor hidden_states_77 = transpose(perm = hidden_states_77_perm_0, x = var_1327)[name = tensor("transpose_113")]; tensor var_1415 = expand_dims(axes = var_1415_axes_0, x = hidden_states_77)[name = tensor("op_1415")]; tensor hidden_states_79_reps_0 = const()[name = tensor("hidden_states_79_reps_0"), val = tensor([1, 1, 2, 1, 1])]; tensor hidden_states_79 = tile(reps = hidden_states_79_reps_0, x = var_1415)[name = tensor("hidden_states_79")]; tensor var_1423 = const()[name = tensor("op_1423"), val = tensor([1, 8, 256, 256])]; tensor value_states_11 = reshape(shape = var_1423, x = hidden_states_79)[name = tensor("value_states_11")]; tensor var_1426_transpose_x_1 = const()[name = tensor("op_1426_transpose_x_1"), val = tensor(false)]; tensor var_1426_transpose_y_1 = const()[name = tensor("op_1426_transpose_y_1"), val = tensor(true)]; tensor var_1426 = matmul(transpose_x = var_1426_transpose_x_1, transpose_y = var_1426_transpose_y_1, x = query_11, y = key_states_11)[name = tensor("op_1426")]; tensor var_1427_to_fp16 = const()[name = tensor("op_1427_to_fp16"), val = tensor(0x1p-4)]; tensor attn_weights_21_cast_fp16 = mul(x = var_1426, y = var_1427_to_fp16)[name = tensor("attn_weights_21_cast_fp16")]; tensor input_61_cast_fp16 = add(x = attn_weights_21_cast_fp16, y = attention_mask_to_fp16_palettized)[name = tensor("input_61_cast_fp16")]; tensor var_1435_cast_fp16 = softmax(axis = var_24, x = input_61_cast_fp16)[name = tensor("op_1435_cast_fp16")]; tensor attn_output_21_transpose_x_0 = const()[name = tensor("attn_output_21_transpose_x_0"), val = tensor(false)]; tensor attn_output_21_transpose_y_0 = const()[name = tensor("attn_output_21_transpose_y_0"), val = tensor(false)]; tensor attn_output_21 = matmul(transpose_x = attn_output_21_transpose_x_0, transpose_y = attn_output_21_transpose_y_0, x = var_1435_cast_fp16, y = value_states_11)[name = tensor("attn_output_21")]; tensor var_1439_perm_0 = const()[name = tensor("op_1439_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1441 = const()[name = tensor("op_1441"), val = tensor([1, 256, -1])]; tensor var_1439 = transpose(perm = var_1439_perm_0, x = attn_output_21)[name = tensor("transpose_112")]; tensor var_1442 = reshape(shape = var_1441, x = var_1439)[name = tensor("op_1442")]; tensor x_131 = linear(bias = linear_3_bias_0, weight = wrapped_model_language_model_layers_5_self_attn_o_proj_weight_palettized, x = var_1442)[name = tensor("linear_38")]; tensor var_22_promoted_33_to_fp16 = const()[name = tensor("op_22_promoted_33_to_fp16"), val = tensor(0x1p+1)]; tensor var_1448_cast_fp16 = pow(x = x_131, y = var_22_promoted_33_to_fp16)[name = tensor("op_1448_cast_fp16")]; tensor var_1450_axes_0 = const()[name = tensor("op_1450_axes_0"), val = tensor([-1])]; tensor var_1450_keep_dims_0 = const()[name = tensor("op_1450_keep_dims_0"), val = tensor(true)]; tensor var_1450_cast_fp16 = reduce_mean(axes = var_1450_axes_0, keep_dims = var_1450_keep_dims_0, x = var_1448_cast_fp16)[name = tensor("op_1450_cast_fp16")]; tensor var_1451_to_fp16 = const()[name = tensor("op_1451_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_1452_cast_fp16 = add(x = var_1450_cast_fp16, y = var_1451_to_fp16)[name = tensor("op_1452_cast_fp16")]; tensor var_1453_epsilon_0 = const()[name = tensor("op_1453_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_1453_cast_fp16 = rsqrt(epsilon = var_1453_epsilon_0, x = var_1452_cast_fp16)[name = tensor("op_1453_cast_fp16")]; tensor output_133_cast_fp16 = mul(x = x_131, y = var_1453_cast_fp16)[name = tensor("output_133_cast_fp16")]; tensor var_1457_to_fp16 = const()[name = tensor("op_1457_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940306048)))]; tensor output_135_cast_fp16 = mul(x = output_133_cast_fp16, y = var_1457_to_fp16)[name = tensor("output_135_cast_fp16")]; tensor x_135 = add(x = x_119, y = output_135_cast_fp16)[name = tensor("x_135")]; tensor var_22_promoted_34_to_fp16 = const()[name = tensor("op_22_promoted_34_to_fp16"), val = tensor(0x1p+1)]; tensor var_1463_cast_fp16 = pow(x = x_135, y = var_22_promoted_34_to_fp16)[name = tensor("op_1463_cast_fp16")]; tensor var_1465_axes_0 = const()[name = tensor("op_1465_axes_0"), val = tensor([-1])]; tensor var_1465_keep_dims_0 = const()[name = tensor("op_1465_keep_dims_0"), val = tensor(true)]; tensor var_1465_cast_fp16 = reduce_mean(axes = var_1465_axes_0, keep_dims = var_1465_keep_dims_0, x = var_1463_cast_fp16)[name = tensor("op_1465_cast_fp16")]; tensor var_1466_to_fp16 = const()[name = tensor("op_1466_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_1467_cast_fp16 = add(x = var_1465_cast_fp16, y = var_1466_to_fp16)[name = tensor("op_1467_cast_fp16")]; tensor var_1468_epsilon_0 = const()[name = tensor("op_1468_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_1468_cast_fp16 = rsqrt(epsilon = var_1468_epsilon_0, x = var_1467_cast_fp16)[name = tensor("op_1468_cast_fp16")]; tensor output_137_cast_fp16 = mul(x = x_135, y = var_1468_cast_fp16)[name = tensor("output_137_cast_fp16")]; tensor var_1472_to_fp16 = const()[name = tensor("op_1472_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940311232)))]; tensor output_139_cast_fp16 = mul(x = output_137_cast_fp16, y = var_1472_to_fp16)[name = tensor("output_139_cast_fp16")]; tensor input_69 = linear(bias = linear_4_bias_0, weight = wrapped_model_language_model_layers_5_mlp_gate_proj_weight_palettized, x = output_139_cast_fp16)[name = tensor("linear_39")]; tensor var_1480_mode_0 = const()[name = tensor("op_1480_mode_0"), val = tensor("TANH_APPROXIMATION")]; tensor var_1480 = gelu(mode = var_1480_mode_0, x = input_69)[name = tensor("op_1480")]; tensor var_1482 = linear(bias = linear_4_bias_0, weight = wrapped_model_language_model_layers_5_mlp_up_proj_weight_palettized, x = output_139_cast_fp16)[name = tensor("linear_40")]; tensor input_71 = mul(x = var_1480, y = var_1482)[name = tensor("input_71")]; tensor x_139 = linear(bias = linear_3_bias_0, weight = wrapped_model_language_model_layers_5_mlp_down_proj_weight_palettized, x = input_71)[name = tensor("linear_41")]; tensor var_22_promoted_35_to_fp16 = const()[name = tensor("op_22_promoted_35_to_fp16"), val = tensor(0x1p+1)]; tensor var_1488_cast_fp16 = pow(x = x_139, y = var_22_promoted_35_to_fp16)[name = tensor("op_1488_cast_fp16")]; tensor var_1490_axes_0 = const()[name = tensor("op_1490_axes_0"), val = tensor([-1])]; tensor var_1490_keep_dims_0 = const()[name = tensor("op_1490_keep_dims_0"), val = tensor(true)]; tensor var_1490_cast_fp16 = reduce_mean(axes = var_1490_axes_0, keep_dims = var_1490_keep_dims_0, x = var_1488_cast_fp16)[name = tensor("op_1490_cast_fp16")]; tensor var_1491_to_fp16 = const()[name = tensor("op_1491_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_1492_cast_fp16 = add(x = var_1490_cast_fp16, y = var_1491_to_fp16)[name = tensor("op_1492_cast_fp16")]; tensor var_1493_epsilon_0 = const()[name = tensor("op_1493_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_1493_cast_fp16 = rsqrt(epsilon = var_1493_epsilon_0, x = var_1492_cast_fp16)[name = tensor("op_1493_cast_fp16")]; tensor output_141_cast_fp16 = mul(x = x_139, y = var_1493_cast_fp16)[name = tensor("output_141_cast_fp16")]; tensor var_1497_to_fp16 = const()[name = tensor("op_1497_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940316416)))]; tensor output_143_cast_fp16 = mul(x = output_141_cast_fp16, y = var_1497_to_fp16)[name = tensor("output_143_cast_fp16")]; tensor x_143 = add(x = x_135, y = output_143_cast_fp16)[name = tensor("x_143")]; tensor var_22_promoted_36_to_fp16 = const()[name = tensor("op_22_promoted_36_to_fp16"), val = tensor(0x1p+1)]; tensor var_1509_cast_fp16 = pow(x = x_143, y = var_22_promoted_36_to_fp16)[name = tensor("op_1509_cast_fp16")]; tensor var_1511_axes_0 = const()[name = tensor("op_1511_axes_0"), val = tensor([-1])]; tensor var_1511_keep_dims_0 = const()[name = tensor("op_1511_keep_dims_0"), val = tensor(true)]; tensor var_1511_cast_fp16 = reduce_mean(axes = var_1511_axes_0, keep_dims = var_1511_keep_dims_0, x = var_1509_cast_fp16)[name = tensor("op_1511_cast_fp16")]; tensor var_1512_to_fp16 = const()[name = tensor("op_1512_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_1513_cast_fp16 = add(x = var_1511_cast_fp16, y = var_1512_to_fp16)[name = tensor("op_1513_cast_fp16")]; tensor var_1514_epsilon_0 = const()[name = tensor("op_1514_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_1514_cast_fp16 = rsqrt(epsilon = var_1514_epsilon_0, x = var_1513_cast_fp16)[name = tensor("op_1514_cast_fp16")]; tensor output_145_cast_fp16 = mul(x = x_143, y = var_1514_cast_fp16)[name = tensor("output_145_cast_fp16")]; tensor var_1518_to_fp16 = const()[name = tensor("op_1518_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940321600)))]; tensor output_147_cast_fp16 = mul(x = output_145_cast_fp16, y = var_1518_to_fp16)[name = tensor("output_147_cast_fp16")]; tensor var_1530 = linear(bias = linear_0_bias_0, weight = wrapped_model_language_model_layers_6_self_attn_q_proj_weight_palettized, x = output_147_cast_fp16)[name = tensor("linear_42")]; tensor var_1531 = const()[name = tensor("op_1531"), val = tensor([1, 256, -1, 256])]; tensor var_1532 = reshape(shape = var_1531, x = var_1530)[name = tensor("op_1532")]; tensor x_147_perm_0 = const()[name = tensor("x_147_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1535 = linear(bias = linear_1_bias_0, weight = wrapped_model_language_model_layers_6_self_attn_k_proj_weight_palettized, x = output_147_cast_fp16)[name = tensor("linear_43")]; tensor var_1536 = const()[name = tensor("op_1536"), val = tensor([1, 256, -1, 256])]; tensor var_1537 = reshape(shape = var_1536, x = var_1535)[name = tensor("op_1537")]; tensor x_151_perm_0 = const()[name = tensor("x_151_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1540 = linear(bias = linear_1_bias_0, weight = wrapped_model_language_model_layers_6_self_attn_v_proj_weight_palettized, x = output_147_cast_fp16)[name = tensor("linear_44")]; tensor var_1541 = const()[name = tensor("op_1541"), val = tensor([1, 256, -1, 256])]; tensor var_1542 = reshape(shape = var_1541, x = var_1540)[name = tensor("op_1542")]; tensor hidden_states_91_perm_0 = const()[name = tensor("hidden_states_91_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_22_promoted_37_to_fp16 = const()[name = tensor("op_22_promoted_37_to_fp16"), val = tensor(0x1p+1)]; tensor x_147 = transpose(perm = x_147_perm_0, x = var_1532)[name = tensor("transpose_111")]; tensor var_1546_cast_fp16 = pow(x = x_147, y = var_22_promoted_37_to_fp16)[name = tensor("op_1546_cast_fp16")]; tensor var_1548_axes_0 = const()[name = tensor("op_1548_axes_0"), val = tensor([-1])]; tensor var_1548_keep_dims_0 = const()[name = tensor("op_1548_keep_dims_0"), val = tensor(true)]; tensor var_1548_cast_fp16 = reduce_mean(axes = var_1548_axes_0, keep_dims = var_1548_keep_dims_0, x = var_1546_cast_fp16)[name = tensor("op_1548_cast_fp16")]; tensor var_1549_to_fp16 = const()[name = tensor("op_1549_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_1550_cast_fp16 = add(x = var_1548_cast_fp16, y = var_1549_to_fp16)[name = tensor("op_1550_cast_fp16")]; tensor var_1551_epsilon_0 = const()[name = tensor("op_1551_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_1551_cast_fp16 = rsqrt(epsilon = var_1551_epsilon_0, x = var_1550_cast_fp16)[name = tensor("op_1551_cast_fp16")]; tensor output_149_cast_fp16 = mul(x = x_147, y = var_1551_cast_fp16)[name = tensor("output_149_cast_fp16")]; tensor var_1555_to_fp16 = const()[name = tensor("op_1555_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940326784)))]; tensor output_151_cast_fp16 = mul(x = output_149_cast_fp16, y = var_1555_to_fp16)[name = tensor("output_151_cast_fp16")]; tensor var_22_promoted_38_to_fp16 = const()[name = tensor("op_22_promoted_38_to_fp16"), val = tensor(0x1p+1)]; tensor x_151 = transpose(perm = x_151_perm_0, x = var_1537)[name = tensor("transpose_110")]; tensor var_1560_cast_fp16 = pow(x = x_151, y = var_22_promoted_38_to_fp16)[name = tensor("op_1560_cast_fp16")]; tensor var_1562_axes_0 = const()[name = tensor("op_1562_axes_0"), val = tensor([-1])]; tensor var_1562_keep_dims_0 = const()[name = tensor("op_1562_keep_dims_0"), val = tensor(true)]; tensor var_1562_cast_fp16 = reduce_mean(axes = var_1562_axes_0, keep_dims = var_1562_keep_dims_0, x = var_1560_cast_fp16)[name = tensor("op_1562_cast_fp16")]; tensor var_1563_to_fp16 = const()[name = tensor("op_1563_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_1564_cast_fp16 = add(x = var_1562_cast_fp16, y = var_1563_to_fp16)[name = tensor("op_1564_cast_fp16")]; tensor var_1565_epsilon_0 = const()[name = tensor("op_1565_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_1565_cast_fp16 = rsqrt(epsilon = var_1565_epsilon_0, x = var_1564_cast_fp16)[name = tensor("op_1565_cast_fp16")]; tensor output_153_cast_fp16 = mul(x = x_151, y = var_1565_cast_fp16)[name = tensor("output_153_cast_fp16")]; tensor var_1569_to_fp16 = const()[name = tensor("op_1569_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940327360)))]; tensor output_155_cast_fp16 = mul(x = output_153_cast_fp16, y = var_1569_to_fp16)[name = tensor("output_155_cast_fp16")]; tensor var_1574 = mul(x = output_151_cast_fp16, y = cos_7_palettized)[name = tensor("op_1574")]; tensor x1_25_begin_0 = const()[name = tensor("x1_25_begin_0"), val = tensor([0, 0, 0, 0])]; tensor x1_25_end_0 = const()[name = tensor("x1_25_end_0"), val = tensor([1, 8, 256, 128])]; tensor x1_25_end_mask_0 = const()[name = tensor("x1_25_end_mask_0"), val = tensor([true, true, true, false])]; tensor x1_25 = slice_by_index(begin = x1_25_begin_0, end = x1_25_end_0, end_mask = x1_25_end_mask_0, x = output_151_cast_fp16)[name = tensor("x1_25")]; tensor x2_25_begin_0 = const()[name = tensor("x2_25_begin_0"), val = tensor([0, 0, 0, 128])]; tensor x2_25_end_0 = const()[name = tensor("x2_25_end_0"), val = tensor([1, 8, 256, 256])]; tensor x2_25_end_mask_0 = const()[name = tensor("x2_25_end_mask_0"), val = tensor([true, true, true, true])]; tensor x2_25 = slice_by_index(begin = x2_25_begin_0, end = x2_25_end_0, end_mask = x2_25_end_mask_0, x = output_151_cast_fp16)[name = tensor("x2_25")]; tensor const_173_promoted = const()[name = tensor("const_173_promoted"), val = tensor(-0x1p+0)]; tensor var_1585 = mul(x = x2_25, y = const_173_promoted)[name = tensor("op_1585")]; tensor var_1587_interleave_0 = const()[name = tensor("op_1587_interleave_0"), val = tensor(false)]; tensor var_1587 = concat(axis = var_24, interleave = var_1587_interleave_0, values = (var_1585, x1_25))[name = tensor("op_1587")]; tensor var_1588 = mul(x = var_1587, y = sin_7_palettized)[name = tensor("op_1588")]; tensor query_13 = add(x = var_1574, y = var_1588)[name = tensor("query_13")]; tensor var_1590 = mul(x = output_155_cast_fp16, y = cos_7_palettized)[name = tensor("op_1590")]; tensor x1_27_begin_0 = const()[name = tensor("x1_27_begin_0"), val = tensor([0, 0, 0, 0])]; tensor x1_27_end_0 = const()[name = tensor("x1_27_end_0"), val = tensor([1, 4, 256, 128])]; tensor x1_27_end_mask_0 = const()[name = tensor("x1_27_end_mask_0"), val = tensor([true, true, true, false])]; tensor x1_27 = slice_by_index(begin = x1_27_begin_0, end = x1_27_end_0, end_mask = x1_27_end_mask_0, x = output_155_cast_fp16)[name = tensor("x1_27")]; tensor x2_27_begin_0 = const()[name = tensor("x2_27_begin_0"), val = tensor([0, 0, 0, 128])]; tensor x2_27_end_0 = const()[name = tensor("x2_27_end_0"), val = tensor([1, 4, 256, 256])]; tensor x2_27_end_mask_0 = const()[name = tensor("x2_27_end_mask_0"), val = tensor([true, true, true, true])]; tensor x2_27 = slice_by_index(begin = x2_27_begin_0, end = x2_27_end_0, end_mask = x2_27_end_mask_0, x = output_155_cast_fp16)[name = tensor("x2_27")]; tensor const_176_promoted = const()[name = tensor("const_176_promoted"), val = tensor(-0x1p+0)]; tensor var_1601 = mul(x = x2_27, y = const_176_promoted)[name = tensor("op_1601")]; tensor var_1603_interleave_0 = const()[name = tensor("op_1603_interleave_0"), val = tensor(false)]; tensor var_1603 = concat(axis = var_24, interleave = var_1603_interleave_0, values = (var_1601, x1_27))[name = tensor("op_1603")]; tensor var_1604 = mul(x = var_1603, y = sin_7_palettized)[name = tensor("op_1604")]; tensor hidden_states_87 = add(x = var_1590, y = var_1604)[name = tensor("hidden_states_87")]; tensor var_1613_axes_0 = const()[name = tensor("op_1613_axes_0"), val = tensor([2])]; tensor var_1613 = expand_dims(axes = var_1613_axes_0, x = hidden_states_87)[name = tensor("op_1613")]; tensor hidden_states_89_reps_0 = const()[name = tensor("hidden_states_89_reps_0"), val = tensor([1, 1, 2, 1, 1])]; tensor hidden_states_89 = tile(reps = hidden_states_89_reps_0, x = var_1613)[name = tensor("hidden_states_89")]; tensor var_1621 = const()[name = tensor("op_1621"), val = tensor([1, 8, 256, 256])]; tensor key_states_13 = reshape(shape = var_1621, x = hidden_states_89)[name = tensor("key_states_13")]; tensor var_1630_axes_0 = const()[name = tensor("op_1630_axes_0"), val = tensor([2])]; tensor hidden_states_91 = transpose(perm = hidden_states_91_perm_0, x = var_1542)[name = tensor("transpose_109")]; tensor var_1630 = expand_dims(axes = var_1630_axes_0, x = hidden_states_91)[name = tensor("op_1630")]; tensor hidden_states_93_reps_0 = const()[name = tensor("hidden_states_93_reps_0"), val = tensor([1, 1, 2, 1, 1])]; tensor hidden_states_93 = tile(reps = hidden_states_93_reps_0, x = var_1630)[name = tensor("hidden_states_93")]; tensor var_1638 = const()[name = tensor("op_1638"), val = tensor([1, 8, 256, 256])]; tensor value_states_13 = reshape(shape = var_1638, x = hidden_states_93)[name = tensor("value_states_13")]; tensor var_1641_transpose_x_1 = const()[name = tensor("op_1641_transpose_x_1"), val = tensor(false)]; tensor var_1641_transpose_y_1 = const()[name = tensor("op_1641_transpose_y_1"), val = tensor(true)]; tensor var_1641 = matmul(transpose_x = var_1641_transpose_x_1, transpose_y = var_1641_transpose_y_1, x = query_13, y = key_states_13)[name = tensor("op_1641")]; tensor var_1642_to_fp16 = const()[name = tensor("op_1642_to_fp16"), val = tensor(0x1p-4)]; tensor attn_weights_25_cast_fp16 = mul(x = var_1641, y = var_1642_to_fp16)[name = tensor("attn_weights_25_cast_fp16")]; tensor input_73_cast_fp16 = add(x = attn_weights_25_cast_fp16, y = attention_mask_to_fp16_palettized)[name = tensor("input_73_cast_fp16")]; tensor var_1650_cast_fp16 = softmax(axis = var_24, x = input_73_cast_fp16)[name = tensor("op_1650_cast_fp16")]; tensor attn_output_25_transpose_x_0 = const()[name = tensor("attn_output_25_transpose_x_0"), val = tensor(false)]; tensor attn_output_25_transpose_y_0 = const()[name = tensor("attn_output_25_transpose_y_0"), val = tensor(false)]; tensor attn_output_25 = matmul(transpose_x = attn_output_25_transpose_x_0, transpose_y = attn_output_25_transpose_y_0, x = var_1650_cast_fp16, y = value_states_13)[name = tensor("attn_output_25")]; tensor var_1654_perm_0 = const()[name = tensor("op_1654_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1656 = const()[name = tensor("op_1656"), val = tensor([1, 256, -1])]; tensor var_1654 = transpose(perm = var_1654_perm_0, x = attn_output_25)[name = tensor("transpose_108")]; tensor var_1657 = reshape(shape = var_1656, x = var_1654)[name = tensor("op_1657")]; tensor x_155 = linear(bias = linear_3_bias_0, weight = wrapped_model_language_model_layers_6_self_attn_o_proj_weight_palettized, x = var_1657)[name = tensor("linear_45")]; tensor var_22_promoted_39_to_fp16 = const()[name = tensor("op_22_promoted_39_to_fp16"), val = tensor(0x1p+1)]; tensor var_1663_cast_fp16 = pow(x = x_155, y = var_22_promoted_39_to_fp16)[name = tensor("op_1663_cast_fp16")]; tensor var_1665_axes_0 = const()[name = tensor("op_1665_axes_0"), val = tensor([-1])]; tensor var_1665_keep_dims_0 = const()[name = tensor("op_1665_keep_dims_0"), val = tensor(true)]; tensor var_1665_cast_fp16 = reduce_mean(axes = var_1665_axes_0, keep_dims = var_1665_keep_dims_0, x = var_1663_cast_fp16)[name = tensor("op_1665_cast_fp16")]; tensor var_1666_to_fp16 = const()[name = tensor("op_1666_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_1667_cast_fp16 = add(x = var_1665_cast_fp16, y = var_1666_to_fp16)[name = tensor("op_1667_cast_fp16")]; tensor var_1668_epsilon_0 = const()[name = tensor("op_1668_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_1668_cast_fp16 = rsqrt(epsilon = var_1668_epsilon_0, x = var_1667_cast_fp16)[name = tensor("op_1668_cast_fp16")]; tensor output_157_cast_fp16 = mul(x = x_155, y = var_1668_cast_fp16)[name = tensor("output_157_cast_fp16")]; tensor var_1672_to_fp16 = const()[name = tensor("op_1672_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940327936)))]; tensor output_159_cast_fp16 = mul(x = output_157_cast_fp16, y = var_1672_to_fp16)[name = tensor("output_159_cast_fp16")]; tensor x_159 = add(x = x_143, y = output_159_cast_fp16)[name = tensor("x_159")]; tensor var_22_promoted_40_to_fp16 = const()[name = tensor("op_22_promoted_40_to_fp16"), val = tensor(0x1p+1)]; tensor var_1678_cast_fp16 = pow(x = x_159, y = var_22_promoted_40_to_fp16)[name = tensor("op_1678_cast_fp16")]; tensor var_1680_axes_0 = const()[name = tensor("op_1680_axes_0"), val = tensor([-1])]; tensor var_1680_keep_dims_0 = const()[name = tensor("op_1680_keep_dims_0"), val = tensor(true)]; tensor var_1680_cast_fp16 = reduce_mean(axes = var_1680_axes_0, keep_dims = var_1680_keep_dims_0, x = var_1678_cast_fp16)[name = tensor("op_1680_cast_fp16")]; tensor var_1681_to_fp16 = const()[name = tensor("op_1681_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_1682_cast_fp16 = add(x = var_1680_cast_fp16, y = var_1681_to_fp16)[name = tensor("op_1682_cast_fp16")]; tensor var_1683_epsilon_0 = const()[name = tensor("op_1683_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_1683_cast_fp16 = rsqrt(epsilon = var_1683_epsilon_0, x = var_1682_cast_fp16)[name = tensor("op_1683_cast_fp16")]; tensor output_161_cast_fp16 = mul(x = x_159, y = var_1683_cast_fp16)[name = tensor("output_161_cast_fp16")]; tensor var_1687_to_fp16 = const()[name = tensor("op_1687_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940333120)))]; tensor output_163_cast_fp16 = mul(x = output_161_cast_fp16, y = var_1687_to_fp16)[name = tensor("output_163_cast_fp16")]; tensor input_81 = linear(bias = linear_4_bias_0, weight = wrapped_model_language_model_layers_6_mlp_gate_proj_weight_palettized, x = output_163_cast_fp16)[name = tensor("linear_46")]; tensor var_1695_mode_0 = const()[name = tensor("op_1695_mode_0"), val = tensor("TANH_APPROXIMATION")]; tensor var_1695 = gelu(mode = var_1695_mode_0, x = input_81)[name = tensor("op_1695")]; tensor var_1697 = linear(bias = linear_4_bias_0, weight = wrapped_model_language_model_layers_6_mlp_up_proj_weight_palettized, x = output_163_cast_fp16)[name = tensor("linear_47")]; tensor input_83 = mul(x = var_1695, y = var_1697)[name = tensor("input_83")]; tensor x_163 = linear(bias = linear_3_bias_0, weight = wrapped_model_language_model_layers_6_mlp_down_proj_weight_palettized, x = input_83)[name = tensor("linear_48")]; tensor var_22_promoted_41_to_fp16 = const()[name = tensor("op_22_promoted_41_to_fp16"), val = tensor(0x1p+1)]; tensor var_1703_cast_fp16 = pow(x = x_163, y = var_22_promoted_41_to_fp16)[name = tensor("op_1703_cast_fp16")]; tensor var_1705_axes_0 = const()[name = tensor("op_1705_axes_0"), val = tensor([-1])]; tensor var_1705_keep_dims_0 = const()[name = tensor("op_1705_keep_dims_0"), val = tensor(true)]; tensor var_1705_cast_fp16 = reduce_mean(axes = var_1705_axes_0, keep_dims = var_1705_keep_dims_0, x = var_1703_cast_fp16)[name = tensor("op_1705_cast_fp16")]; tensor var_1706_to_fp16 = const()[name = tensor("op_1706_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_1707_cast_fp16 = add(x = var_1705_cast_fp16, y = var_1706_to_fp16)[name = tensor("op_1707_cast_fp16")]; tensor var_1708_epsilon_0 = const()[name = tensor("op_1708_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_1708_cast_fp16 = rsqrt(epsilon = var_1708_epsilon_0, x = var_1707_cast_fp16)[name = tensor("op_1708_cast_fp16")]; tensor output_165_cast_fp16 = mul(x = x_163, y = var_1708_cast_fp16)[name = tensor("output_165_cast_fp16")]; tensor var_1712_to_fp16 = const()[name = tensor("op_1712_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940338304)))]; tensor output_167_cast_fp16 = mul(x = output_165_cast_fp16, y = var_1712_to_fp16)[name = tensor("output_167_cast_fp16")]; tensor x_167 = add(x = x_159, y = output_167_cast_fp16)[name = tensor("x_167")]; tensor var_22_promoted_42_to_fp16 = const()[name = tensor("op_22_promoted_42_to_fp16"), val = tensor(0x1p+1)]; tensor var_1724_cast_fp16 = pow(x = x_167, y = var_22_promoted_42_to_fp16)[name = tensor("op_1724_cast_fp16")]; tensor var_1726_axes_0 = const()[name = tensor("op_1726_axes_0"), val = tensor([-1])]; tensor var_1726_keep_dims_0 = const()[name = tensor("op_1726_keep_dims_0"), val = tensor(true)]; tensor var_1726_cast_fp16 = reduce_mean(axes = var_1726_axes_0, keep_dims = var_1726_keep_dims_0, x = var_1724_cast_fp16)[name = tensor("op_1726_cast_fp16")]; tensor var_1727_to_fp16 = const()[name = tensor("op_1727_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_1728_cast_fp16 = add(x = var_1726_cast_fp16, y = var_1727_to_fp16)[name = tensor("op_1728_cast_fp16")]; tensor var_1729_epsilon_0 = const()[name = tensor("op_1729_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_1729_cast_fp16 = rsqrt(epsilon = var_1729_epsilon_0, x = var_1728_cast_fp16)[name = tensor("op_1729_cast_fp16")]; tensor output_169_cast_fp16 = mul(x = x_167, y = var_1729_cast_fp16)[name = tensor("output_169_cast_fp16")]; tensor var_1733_to_fp16 = const()[name = tensor("op_1733_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940343488)))]; tensor output_171_cast_fp16 = mul(x = output_169_cast_fp16, y = var_1733_to_fp16)[name = tensor("output_171_cast_fp16")]; tensor var_1745 = linear(bias = linear_0_bias_0, weight = wrapped_model_language_model_layers_7_self_attn_q_proj_weight_palettized, x = output_171_cast_fp16)[name = tensor("linear_49")]; tensor var_1746 = const()[name = tensor("op_1746"), val = tensor([1, 256, -1, 256])]; tensor var_1747 = reshape(shape = var_1746, x = var_1745)[name = tensor("op_1747")]; tensor x_171_perm_0 = const()[name = tensor("x_171_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1750 = linear(bias = linear_1_bias_0, weight = wrapped_model_language_model_layers_7_self_attn_k_proj_weight_palettized, x = output_171_cast_fp16)[name = tensor("linear_50")]; tensor var_1751 = const()[name = tensor("op_1751"), val = tensor([1, 256, -1, 256])]; tensor var_1752 = reshape(shape = var_1751, x = var_1750)[name = tensor("op_1752")]; tensor x_175_perm_0 = const()[name = tensor("x_175_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1755 = linear(bias = linear_1_bias_0, weight = wrapped_model_language_model_layers_7_self_attn_v_proj_weight_palettized, x = output_171_cast_fp16)[name = tensor("linear_51")]; tensor var_1756 = const()[name = tensor("op_1756"), val = tensor([1, 256, -1, 256])]; tensor var_1757 = reshape(shape = var_1756, x = var_1755)[name = tensor("op_1757")]; tensor hidden_states_105_perm_0 = const()[name = tensor("hidden_states_105_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_22_promoted_43_to_fp16 = const()[name = tensor("op_22_promoted_43_to_fp16"), val = tensor(0x1p+1)]; tensor x_171 = transpose(perm = x_171_perm_0, x = var_1747)[name = tensor("transpose_107")]; tensor var_1761_cast_fp16 = pow(x = x_171, y = var_22_promoted_43_to_fp16)[name = tensor("op_1761_cast_fp16")]; tensor var_1763_axes_0 = const()[name = tensor("op_1763_axes_0"), val = tensor([-1])]; tensor var_1763_keep_dims_0 = const()[name = tensor("op_1763_keep_dims_0"), val = tensor(true)]; tensor var_1763_cast_fp16 = reduce_mean(axes = var_1763_axes_0, keep_dims = var_1763_keep_dims_0, x = var_1761_cast_fp16)[name = tensor("op_1763_cast_fp16")]; tensor var_1764_to_fp16 = const()[name = tensor("op_1764_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_1765_cast_fp16 = add(x = var_1763_cast_fp16, y = var_1764_to_fp16)[name = tensor("op_1765_cast_fp16")]; tensor var_1766_epsilon_0 = const()[name = tensor("op_1766_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_1766_cast_fp16 = rsqrt(epsilon = var_1766_epsilon_0, x = var_1765_cast_fp16)[name = tensor("op_1766_cast_fp16")]; tensor output_173_cast_fp16 = mul(x = x_171, y = var_1766_cast_fp16)[name = tensor("output_173_cast_fp16")]; tensor var_1770_to_fp16 = const()[name = tensor("op_1770_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940348672)))]; tensor output_175_cast_fp16 = mul(x = output_173_cast_fp16, y = var_1770_to_fp16)[name = tensor("output_175_cast_fp16")]; tensor var_22_promoted_44_to_fp16 = const()[name = tensor("op_22_promoted_44_to_fp16"), val = tensor(0x1p+1)]; tensor x_175 = transpose(perm = x_175_perm_0, x = var_1752)[name = tensor("transpose_106")]; tensor var_1775_cast_fp16 = pow(x = x_175, y = var_22_promoted_44_to_fp16)[name = tensor("op_1775_cast_fp16")]; tensor var_1777_axes_0 = const()[name = tensor("op_1777_axes_0"), val = tensor([-1])]; tensor var_1777_keep_dims_0 = const()[name = tensor("op_1777_keep_dims_0"), val = tensor(true)]; tensor var_1777_cast_fp16 = reduce_mean(axes = var_1777_axes_0, keep_dims = var_1777_keep_dims_0, x = var_1775_cast_fp16)[name = tensor("op_1777_cast_fp16")]; tensor var_1778_to_fp16 = const()[name = tensor("op_1778_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_1779_cast_fp16 = add(x = var_1777_cast_fp16, y = var_1778_to_fp16)[name = tensor("op_1779_cast_fp16")]; tensor var_1780_epsilon_0 = const()[name = tensor("op_1780_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_1780_cast_fp16 = rsqrt(epsilon = var_1780_epsilon_0, x = var_1779_cast_fp16)[name = tensor("op_1780_cast_fp16")]; tensor output_177_cast_fp16 = mul(x = x_175, y = var_1780_cast_fp16)[name = tensor("output_177_cast_fp16")]; tensor var_1784_to_fp16 = const()[name = tensor("op_1784_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940349248)))]; tensor output_179_cast_fp16 = mul(x = output_177_cast_fp16, y = var_1784_to_fp16)[name = tensor("output_179_cast_fp16")]; tensor var_1789 = mul(x = output_175_cast_fp16, y = cos_7_palettized)[name = tensor("op_1789")]; tensor x1_29_begin_0 = const()[name = tensor("x1_29_begin_0"), val = tensor([0, 0, 0, 0])]; tensor x1_29_end_0 = const()[name = tensor("x1_29_end_0"), val = tensor([1, 8, 256, 128])]; tensor x1_29_end_mask_0 = const()[name = tensor("x1_29_end_mask_0"), val = tensor([true, true, true, false])]; tensor x1_29 = slice_by_index(begin = x1_29_begin_0, end = x1_29_end_0, end_mask = x1_29_end_mask_0, x = output_175_cast_fp16)[name = tensor("x1_29")]; tensor x2_29_begin_0 = const()[name = tensor("x2_29_begin_0"), val = tensor([0, 0, 0, 128])]; tensor x2_29_end_0 = const()[name = tensor("x2_29_end_0"), val = tensor([1, 8, 256, 256])]; tensor x2_29_end_mask_0 = const()[name = tensor("x2_29_end_mask_0"), val = tensor([true, true, true, true])]; tensor x2_29 = slice_by_index(begin = x2_29_begin_0, end = x2_29_end_0, end_mask = x2_29_end_mask_0, x = output_175_cast_fp16)[name = tensor("x2_29")]; tensor const_196_promoted = const()[name = tensor("const_196_promoted"), val = tensor(-0x1p+0)]; tensor var_1800 = mul(x = x2_29, y = const_196_promoted)[name = tensor("op_1800")]; tensor var_1802_interleave_0 = const()[name = tensor("op_1802_interleave_0"), val = tensor(false)]; tensor var_1802 = concat(axis = var_24, interleave = var_1802_interleave_0, values = (var_1800, x1_29))[name = tensor("op_1802")]; tensor var_1803 = mul(x = var_1802, y = sin_7_palettized)[name = tensor("op_1803")]; tensor query_15 = add(x = var_1789, y = var_1803)[name = tensor("query_15")]; tensor var_1805 = mul(x = output_179_cast_fp16, y = cos_7_palettized)[name = tensor("op_1805")]; tensor x1_31_begin_0 = const()[name = tensor("x1_31_begin_0"), val = tensor([0, 0, 0, 0])]; tensor x1_31_end_0 = const()[name = tensor("x1_31_end_0"), val = tensor([1, 4, 256, 128])]; tensor x1_31_end_mask_0 = const()[name = tensor("x1_31_end_mask_0"), val = tensor([true, true, true, false])]; tensor x1_31 = slice_by_index(begin = x1_31_begin_0, end = x1_31_end_0, end_mask = x1_31_end_mask_0, x = output_179_cast_fp16)[name = tensor("x1_31")]; tensor x2_31_begin_0 = const()[name = tensor("x2_31_begin_0"), val = tensor([0, 0, 0, 128])]; tensor x2_31_end_0 = const()[name = tensor("x2_31_end_0"), val = tensor([1, 4, 256, 256])]; tensor x2_31_end_mask_0 = const()[name = tensor("x2_31_end_mask_0"), val = tensor([true, true, true, true])]; tensor x2_31 = slice_by_index(begin = x2_31_begin_0, end = x2_31_end_0, end_mask = x2_31_end_mask_0, x = output_179_cast_fp16)[name = tensor("x2_31")]; tensor const_199_promoted = const()[name = tensor("const_199_promoted"), val = tensor(-0x1p+0)]; tensor var_1816 = mul(x = x2_31, y = const_199_promoted)[name = tensor("op_1816")]; tensor var_1818_interleave_0 = const()[name = tensor("op_1818_interleave_0"), val = tensor(false)]; tensor var_1818 = concat(axis = var_24, interleave = var_1818_interleave_0, values = (var_1816, x1_31))[name = tensor("op_1818")]; tensor var_1819 = mul(x = var_1818, y = sin_7_palettized)[name = tensor("op_1819")]; tensor hidden_states_101 = add(x = var_1805, y = var_1819)[name = tensor("hidden_states_101")]; tensor var_1828_axes_0 = const()[name = tensor("op_1828_axes_0"), val = tensor([2])]; tensor var_1828 = expand_dims(axes = var_1828_axes_0, x = hidden_states_101)[name = tensor("op_1828")]; tensor hidden_states_103_reps_0 = const()[name = tensor("hidden_states_103_reps_0"), val = tensor([1, 1, 2, 1, 1])]; tensor hidden_states_103 = tile(reps = hidden_states_103_reps_0, x = var_1828)[name = tensor("hidden_states_103")]; tensor var_1836 = const()[name = tensor("op_1836"), val = tensor([1, 8, 256, 256])]; tensor key_states_15 = reshape(shape = var_1836, x = hidden_states_103)[name = tensor("key_states_15")]; tensor var_1845_axes_0 = const()[name = tensor("op_1845_axes_0"), val = tensor([2])]; tensor hidden_states_105 = transpose(perm = hidden_states_105_perm_0, x = var_1757)[name = tensor("transpose_105")]; tensor var_1845 = expand_dims(axes = var_1845_axes_0, x = hidden_states_105)[name = tensor("op_1845")]; tensor hidden_states_107_reps_0 = const()[name = tensor("hidden_states_107_reps_0"), val = tensor([1, 1, 2, 1, 1])]; tensor hidden_states_107 = tile(reps = hidden_states_107_reps_0, x = var_1845)[name = tensor("hidden_states_107")]; tensor var_1853 = const()[name = tensor("op_1853"), val = tensor([1, 8, 256, 256])]; tensor value_states_15 = reshape(shape = var_1853, x = hidden_states_107)[name = tensor("value_states_15")]; tensor var_1856_transpose_x_1 = const()[name = tensor("op_1856_transpose_x_1"), val = tensor(false)]; tensor var_1856_transpose_y_1 = const()[name = tensor("op_1856_transpose_y_1"), val = tensor(true)]; tensor var_1856 = matmul(transpose_x = var_1856_transpose_x_1, transpose_y = var_1856_transpose_y_1, x = query_15, y = key_states_15)[name = tensor("op_1856")]; tensor var_1857_to_fp16 = const()[name = tensor("op_1857_to_fp16"), val = tensor(0x1p-4)]; tensor attn_weights_29_cast_fp16 = mul(x = var_1856, y = var_1857_to_fp16)[name = tensor("attn_weights_29_cast_fp16")]; tensor input_85_cast_fp16 = add(x = attn_weights_29_cast_fp16, y = attention_mask_to_fp16_palettized)[name = tensor("input_85_cast_fp16")]; tensor var_1865_cast_fp16 = softmax(axis = var_24, x = input_85_cast_fp16)[name = tensor("op_1865_cast_fp16")]; tensor attn_output_29_transpose_x_0 = const()[name = tensor("attn_output_29_transpose_x_0"), val = tensor(false)]; tensor attn_output_29_transpose_y_0 = const()[name = tensor("attn_output_29_transpose_y_0"), val = tensor(false)]; tensor attn_output_29 = matmul(transpose_x = attn_output_29_transpose_x_0, transpose_y = attn_output_29_transpose_y_0, x = var_1865_cast_fp16, y = value_states_15)[name = tensor("attn_output_29")]; tensor var_1869_perm_0 = const()[name = tensor("op_1869_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1871 = const()[name = tensor("op_1871"), val = tensor([1, 256, -1])]; tensor var_1869 = transpose(perm = var_1869_perm_0, x = attn_output_29)[name = tensor("transpose_104")]; tensor var_1872 = reshape(shape = var_1871, x = var_1869)[name = tensor("op_1872")]; tensor x_179 = linear(bias = linear_3_bias_0, weight = wrapped_model_language_model_layers_7_self_attn_o_proj_weight_palettized, x = var_1872)[name = tensor("linear_52")]; tensor var_22_promoted_45_to_fp16 = const()[name = tensor("op_22_promoted_45_to_fp16"), val = tensor(0x1p+1)]; tensor var_1878_cast_fp16 = pow(x = x_179, y = var_22_promoted_45_to_fp16)[name = tensor("op_1878_cast_fp16")]; tensor var_1880_axes_0 = const()[name = tensor("op_1880_axes_0"), val = tensor([-1])]; tensor var_1880_keep_dims_0 = const()[name = tensor("op_1880_keep_dims_0"), val = tensor(true)]; tensor var_1880_cast_fp16 = reduce_mean(axes = var_1880_axes_0, keep_dims = var_1880_keep_dims_0, x = var_1878_cast_fp16)[name = tensor("op_1880_cast_fp16")]; tensor var_1881_to_fp16 = const()[name = tensor("op_1881_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_1882_cast_fp16 = add(x = var_1880_cast_fp16, y = var_1881_to_fp16)[name = tensor("op_1882_cast_fp16")]; tensor var_1883_epsilon_0 = const()[name = tensor("op_1883_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_1883_cast_fp16 = rsqrt(epsilon = var_1883_epsilon_0, x = var_1882_cast_fp16)[name = tensor("op_1883_cast_fp16")]; tensor output_181_cast_fp16 = mul(x = x_179, y = var_1883_cast_fp16)[name = tensor("output_181_cast_fp16")]; tensor var_1887_to_fp16 = const()[name = tensor("op_1887_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940349824)))]; tensor output_183_cast_fp16 = mul(x = output_181_cast_fp16, y = var_1887_to_fp16)[name = tensor("output_183_cast_fp16")]; tensor x_183 = add(x = x_167, y = output_183_cast_fp16)[name = tensor("x_183")]; tensor var_22_promoted_46_to_fp16 = const()[name = tensor("op_22_promoted_46_to_fp16"), val = tensor(0x1p+1)]; tensor var_1893_cast_fp16 = pow(x = x_183, y = var_22_promoted_46_to_fp16)[name = tensor("op_1893_cast_fp16")]; tensor var_1895_axes_0 = const()[name = tensor("op_1895_axes_0"), val = tensor([-1])]; tensor var_1895_keep_dims_0 = const()[name = tensor("op_1895_keep_dims_0"), val = tensor(true)]; tensor var_1895_cast_fp16 = reduce_mean(axes = var_1895_axes_0, keep_dims = var_1895_keep_dims_0, x = var_1893_cast_fp16)[name = tensor("op_1895_cast_fp16")]; tensor var_1896_to_fp16 = const()[name = tensor("op_1896_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_1897_cast_fp16 = add(x = var_1895_cast_fp16, y = var_1896_to_fp16)[name = tensor("op_1897_cast_fp16")]; tensor var_1898_epsilon_0 = const()[name = tensor("op_1898_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_1898_cast_fp16 = rsqrt(epsilon = var_1898_epsilon_0, x = var_1897_cast_fp16)[name = tensor("op_1898_cast_fp16")]; tensor output_185_cast_fp16 = mul(x = x_183, y = var_1898_cast_fp16)[name = tensor("output_185_cast_fp16")]; tensor var_1902_to_fp16 = const()[name = tensor("op_1902_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940355008)))]; tensor output_187_cast_fp16 = mul(x = output_185_cast_fp16, y = var_1902_to_fp16)[name = tensor("output_187_cast_fp16")]; tensor input_93 = linear(bias = linear_4_bias_0, weight = wrapped_model_language_model_layers_7_mlp_gate_proj_weight_palettized, x = output_187_cast_fp16)[name = tensor("linear_53")]; tensor var_1910_mode_0 = const()[name = tensor("op_1910_mode_0"), val = tensor("TANH_APPROXIMATION")]; tensor var_1910 = gelu(mode = var_1910_mode_0, x = input_93)[name = tensor("op_1910")]; tensor var_1912 = linear(bias = linear_4_bias_0, weight = wrapped_model_language_model_layers_7_mlp_up_proj_weight_palettized, x = output_187_cast_fp16)[name = tensor("linear_54")]; tensor input_95 = mul(x = var_1910, y = var_1912)[name = tensor("input_95")]; tensor x_187 = linear(bias = linear_3_bias_0, weight = wrapped_model_language_model_layers_7_mlp_down_proj_weight_palettized, x = input_95)[name = tensor("linear_55")]; tensor var_22_promoted_47_to_fp16 = const()[name = tensor("op_22_promoted_47_to_fp16"), val = tensor(0x1p+1)]; tensor var_1918_cast_fp16 = pow(x = x_187, y = var_22_promoted_47_to_fp16)[name = tensor("op_1918_cast_fp16")]; tensor var_1920_axes_0 = const()[name = tensor("op_1920_axes_0"), val = tensor([-1])]; tensor var_1920_keep_dims_0 = const()[name = tensor("op_1920_keep_dims_0"), val = tensor(true)]; tensor var_1920_cast_fp16 = reduce_mean(axes = var_1920_axes_0, keep_dims = var_1920_keep_dims_0, x = var_1918_cast_fp16)[name = tensor("op_1920_cast_fp16")]; tensor var_1921_to_fp16 = const()[name = tensor("op_1921_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_1922_cast_fp16 = add(x = var_1920_cast_fp16, y = var_1921_to_fp16)[name = tensor("op_1922_cast_fp16")]; tensor var_1923_epsilon_0 = const()[name = tensor("op_1923_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_1923_cast_fp16 = rsqrt(epsilon = var_1923_epsilon_0, x = var_1922_cast_fp16)[name = tensor("op_1923_cast_fp16")]; tensor output_189_cast_fp16 = mul(x = x_187, y = var_1923_cast_fp16)[name = tensor("output_189_cast_fp16")]; tensor var_1927_to_fp16 = const()[name = tensor("op_1927_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940360192)))]; tensor output_191_cast_fp16 = mul(x = output_189_cast_fp16, y = var_1927_to_fp16)[name = tensor("output_191_cast_fp16")]; tensor x_191 = add(x = x_183, y = output_191_cast_fp16)[name = tensor("x_191")]; tensor var_22_promoted_48_to_fp16 = const()[name = tensor("op_22_promoted_48_to_fp16"), val = tensor(0x1p+1)]; tensor var_1939_cast_fp16 = pow(x = x_191, y = var_22_promoted_48_to_fp16)[name = tensor("op_1939_cast_fp16")]; tensor var_1941_axes_0 = const()[name = tensor("op_1941_axes_0"), val = tensor([-1])]; tensor var_1941_keep_dims_0 = const()[name = tensor("op_1941_keep_dims_0"), val = tensor(true)]; tensor var_1941_cast_fp16 = reduce_mean(axes = var_1941_axes_0, keep_dims = var_1941_keep_dims_0, x = var_1939_cast_fp16)[name = tensor("op_1941_cast_fp16")]; tensor var_1942_to_fp16 = const()[name = tensor("op_1942_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_1943_cast_fp16 = add(x = var_1941_cast_fp16, y = var_1942_to_fp16)[name = tensor("op_1943_cast_fp16")]; tensor var_1944_epsilon_0 = const()[name = tensor("op_1944_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_1944_cast_fp16 = rsqrt(epsilon = var_1944_epsilon_0, x = var_1943_cast_fp16)[name = tensor("op_1944_cast_fp16")]; tensor output_193_cast_fp16 = mul(x = x_191, y = var_1944_cast_fp16)[name = tensor("output_193_cast_fp16")]; tensor var_1948_to_fp16 = const()[name = tensor("op_1948_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940365376)))]; tensor output_195_cast_fp16 = mul(x = output_193_cast_fp16, y = var_1948_to_fp16)[name = tensor("output_195_cast_fp16")]; tensor var_1960 = linear(bias = linear_0_bias_0, weight = wrapped_model_language_model_layers_8_self_attn_q_proj_weight_palettized, x = output_195_cast_fp16)[name = tensor("linear_56")]; tensor var_1961 = const()[name = tensor("op_1961"), val = tensor([1, 256, -1, 256])]; tensor var_1962 = reshape(shape = var_1961, x = var_1960)[name = tensor("op_1962")]; tensor x_195_perm_0 = const()[name = tensor("x_195_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1965 = linear(bias = linear_1_bias_0, weight = wrapped_model_language_model_layers_8_self_attn_k_proj_weight_palettized, x = output_195_cast_fp16)[name = tensor("linear_57")]; tensor var_1966 = const()[name = tensor("op_1966"), val = tensor([1, 256, -1, 256])]; tensor var_1967 = reshape(shape = var_1966, x = var_1965)[name = tensor("op_1967")]; tensor x_199_perm_0 = const()[name = tensor("x_199_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1970 = linear(bias = linear_1_bias_0, weight = wrapped_model_language_model_layers_8_self_attn_v_proj_weight_palettized, x = output_195_cast_fp16)[name = tensor("linear_58")]; tensor var_1971 = const()[name = tensor("op_1971"), val = tensor([1, 256, -1, 256])]; tensor var_1972 = reshape(shape = var_1971, x = var_1970)[name = tensor("op_1972")]; tensor hidden_states_119_perm_0 = const()[name = tensor("hidden_states_119_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_22_promoted_49_to_fp16 = const()[name = tensor("op_22_promoted_49_to_fp16"), val = tensor(0x1p+1)]; tensor x_195 = transpose(perm = x_195_perm_0, x = var_1962)[name = tensor("transpose_103")]; tensor var_1976_cast_fp16 = pow(x = x_195, y = var_22_promoted_49_to_fp16)[name = tensor("op_1976_cast_fp16")]; tensor var_1978_axes_0 = const()[name = tensor("op_1978_axes_0"), val = tensor([-1])]; tensor var_1978_keep_dims_0 = const()[name = tensor("op_1978_keep_dims_0"), val = tensor(true)]; tensor var_1978_cast_fp16 = reduce_mean(axes = var_1978_axes_0, keep_dims = var_1978_keep_dims_0, x = var_1976_cast_fp16)[name = tensor("op_1978_cast_fp16")]; tensor var_1979_to_fp16 = const()[name = tensor("op_1979_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_1980_cast_fp16 = add(x = var_1978_cast_fp16, y = var_1979_to_fp16)[name = tensor("op_1980_cast_fp16")]; tensor var_1981_epsilon_0 = const()[name = tensor("op_1981_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_1981_cast_fp16 = rsqrt(epsilon = var_1981_epsilon_0, x = var_1980_cast_fp16)[name = tensor("op_1981_cast_fp16")]; tensor output_197_cast_fp16 = mul(x = x_195, y = var_1981_cast_fp16)[name = tensor("output_197_cast_fp16")]; tensor var_1985_to_fp16 = const()[name = tensor("op_1985_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940370560)))]; tensor output_199_cast_fp16 = mul(x = output_197_cast_fp16, y = var_1985_to_fp16)[name = tensor("output_199_cast_fp16")]; tensor var_22_promoted_50_to_fp16 = const()[name = tensor("op_22_promoted_50_to_fp16"), val = tensor(0x1p+1)]; tensor x_199 = transpose(perm = x_199_perm_0, x = var_1967)[name = tensor("transpose_102")]; tensor var_1990_cast_fp16 = pow(x = x_199, y = var_22_promoted_50_to_fp16)[name = tensor("op_1990_cast_fp16")]; tensor var_1992_axes_0 = const()[name = tensor("op_1992_axes_0"), val = tensor([-1])]; tensor var_1992_keep_dims_0 = const()[name = tensor("op_1992_keep_dims_0"), val = tensor(true)]; tensor var_1992_cast_fp16 = reduce_mean(axes = var_1992_axes_0, keep_dims = var_1992_keep_dims_0, x = var_1990_cast_fp16)[name = tensor("op_1992_cast_fp16")]; tensor var_1993_to_fp16 = const()[name = tensor("op_1993_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_1994_cast_fp16 = add(x = var_1992_cast_fp16, y = var_1993_to_fp16)[name = tensor("op_1994_cast_fp16")]; tensor var_1995_epsilon_0 = const()[name = tensor("op_1995_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_1995_cast_fp16 = rsqrt(epsilon = var_1995_epsilon_0, x = var_1994_cast_fp16)[name = tensor("op_1995_cast_fp16")]; tensor output_201_cast_fp16 = mul(x = x_199, y = var_1995_cast_fp16)[name = tensor("output_201_cast_fp16")]; tensor var_1999_to_fp16 = const()[name = tensor("op_1999_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940371136)))]; tensor output_203_cast_fp16 = mul(x = output_201_cast_fp16, y = var_1999_to_fp16)[name = tensor("output_203_cast_fp16")]; tensor var_2004 = mul(x = output_199_cast_fp16, y = cos_7_palettized)[name = tensor("op_2004")]; tensor x1_33_begin_0 = const()[name = tensor("x1_33_begin_0"), val = tensor([0, 0, 0, 0])]; tensor x1_33_end_0 = const()[name = tensor("x1_33_end_0"), val = tensor([1, 8, 256, 128])]; tensor x1_33_end_mask_0 = const()[name = tensor("x1_33_end_mask_0"), val = tensor([true, true, true, false])]; tensor x1_33 = slice_by_index(begin = x1_33_begin_0, end = x1_33_end_0, end_mask = x1_33_end_mask_0, x = output_199_cast_fp16)[name = tensor("x1_33")]; tensor x2_33_begin_0 = const()[name = tensor("x2_33_begin_0"), val = tensor([0, 0, 0, 128])]; tensor x2_33_end_0 = const()[name = tensor("x2_33_end_0"), val = tensor([1, 8, 256, 256])]; tensor x2_33_end_mask_0 = const()[name = tensor("x2_33_end_mask_0"), val = tensor([true, true, true, true])]; tensor x2_33 = slice_by_index(begin = x2_33_begin_0, end = x2_33_end_0, end_mask = x2_33_end_mask_0, x = output_199_cast_fp16)[name = tensor("x2_33")]; tensor const_219_promoted = const()[name = tensor("const_219_promoted"), val = tensor(-0x1p+0)]; tensor var_2015 = mul(x = x2_33, y = const_219_promoted)[name = tensor("op_2015")]; tensor var_2017_interleave_0 = const()[name = tensor("op_2017_interleave_0"), val = tensor(false)]; tensor var_2017 = concat(axis = var_24, interleave = var_2017_interleave_0, values = (var_2015, x1_33))[name = tensor("op_2017")]; tensor var_2018 = mul(x = var_2017, y = sin_7_palettized)[name = tensor("op_2018")]; tensor query_17 = add(x = var_2004, y = var_2018)[name = tensor("query_17")]; tensor var_2020 = mul(x = output_203_cast_fp16, y = cos_7_palettized)[name = tensor("op_2020")]; tensor x1_35_begin_0 = const()[name = tensor("x1_35_begin_0"), val = tensor([0, 0, 0, 0])]; tensor x1_35_end_0 = const()[name = tensor("x1_35_end_0"), val = tensor([1, 4, 256, 128])]; tensor x1_35_end_mask_0 = const()[name = tensor("x1_35_end_mask_0"), val = tensor([true, true, true, false])]; tensor x1_35 = slice_by_index(begin = x1_35_begin_0, end = x1_35_end_0, end_mask = x1_35_end_mask_0, x = output_203_cast_fp16)[name = tensor("x1_35")]; tensor x2_35_begin_0 = const()[name = tensor("x2_35_begin_0"), val = tensor([0, 0, 0, 128])]; tensor x2_35_end_0 = const()[name = tensor("x2_35_end_0"), val = tensor([1, 4, 256, 256])]; tensor x2_35_end_mask_0 = const()[name = tensor("x2_35_end_mask_0"), val = tensor([true, true, true, true])]; tensor x2_35 = slice_by_index(begin = x2_35_begin_0, end = x2_35_end_0, end_mask = x2_35_end_mask_0, x = output_203_cast_fp16)[name = tensor("x2_35")]; tensor const_222_promoted = const()[name = tensor("const_222_promoted"), val = tensor(-0x1p+0)]; tensor var_2031 = mul(x = x2_35, y = const_222_promoted)[name = tensor("op_2031")]; tensor var_2033_interleave_0 = const()[name = tensor("op_2033_interleave_0"), val = tensor(false)]; tensor var_2033 = concat(axis = var_24, interleave = var_2033_interleave_0, values = (var_2031, x1_35))[name = tensor("op_2033")]; tensor var_2034 = mul(x = var_2033, y = sin_7_palettized)[name = tensor("op_2034")]; tensor hidden_states_115 = add(x = var_2020, y = var_2034)[name = tensor("hidden_states_115")]; tensor var_2043_axes_0 = const()[name = tensor("op_2043_axes_0"), val = tensor([2])]; tensor var_2043 = expand_dims(axes = var_2043_axes_0, x = hidden_states_115)[name = tensor("op_2043")]; tensor hidden_states_117_reps_0 = const()[name = tensor("hidden_states_117_reps_0"), val = tensor([1, 1, 2, 1, 1])]; tensor hidden_states_117 = tile(reps = hidden_states_117_reps_0, x = var_2043)[name = tensor("hidden_states_117")]; tensor var_2051 = const()[name = tensor("op_2051"), val = tensor([1, 8, 256, 256])]; tensor key_states_17 = reshape(shape = var_2051, x = hidden_states_117)[name = tensor("key_states_17")]; tensor var_2060_axes_0 = const()[name = tensor("op_2060_axes_0"), val = tensor([2])]; tensor hidden_states_119 = transpose(perm = hidden_states_119_perm_0, x = var_1972)[name = tensor("transpose_101")]; tensor var_2060 = expand_dims(axes = var_2060_axes_0, x = hidden_states_119)[name = tensor("op_2060")]; tensor hidden_states_121_reps_0 = const()[name = tensor("hidden_states_121_reps_0"), val = tensor([1, 1, 2, 1, 1])]; tensor hidden_states_121 = tile(reps = hidden_states_121_reps_0, x = var_2060)[name = tensor("hidden_states_121")]; tensor var_2068 = const()[name = tensor("op_2068"), val = tensor([1, 8, 256, 256])]; tensor value_states_17 = reshape(shape = var_2068, x = hidden_states_121)[name = tensor("value_states_17")]; tensor var_2071_transpose_x_1 = const()[name = tensor("op_2071_transpose_x_1"), val = tensor(false)]; tensor var_2071_transpose_y_1 = const()[name = tensor("op_2071_transpose_y_1"), val = tensor(true)]; tensor var_2071 = matmul(transpose_x = var_2071_transpose_x_1, transpose_y = var_2071_transpose_y_1, x = query_17, y = key_states_17)[name = tensor("op_2071")]; tensor var_2072_to_fp16 = const()[name = tensor("op_2072_to_fp16"), val = tensor(0x1p-4)]; tensor attn_weights_33_cast_fp16 = mul(x = var_2071, y = var_2072_to_fp16)[name = tensor("attn_weights_33_cast_fp16")]; tensor input_97_cast_fp16 = add(x = attn_weights_33_cast_fp16, y = attention_mask_to_fp16_palettized)[name = tensor("input_97_cast_fp16")]; tensor var_2080_cast_fp16 = softmax(axis = var_24, x = input_97_cast_fp16)[name = tensor("op_2080_cast_fp16")]; tensor attn_output_33_transpose_x_0 = const()[name = tensor("attn_output_33_transpose_x_0"), val = tensor(false)]; tensor attn_output_33_transpose_y_0 = const()[name = tensor("attn_output_33_transpose_y_0"), val = tensor(false)]; tensor attn_output_33 = matmul(transpose_x = attn_output_33_transpose_x_0, transpose_y = attn_output_33_transpose_y_0, x = var_2080_cast_fp16, y = value_states_17)[name = tensor("attn_output_33")]; tensor var_2084_perm_0 = const()[name = tensor("op_2084_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_2086 = const()[name = tensor("op_2086"), val = tensor([1, 256, -1])]; tensor var_2084 = transpose(perm = var_2084_perm_0, x = attn_output_33)[name = tensor("transpose_100")]; tensor var_2087 = reshape(shape = var_2086, x = var_2084)[name = tensor("op_2087")]; tensor x_203 = linear(bias = linear_3_bias_0, weight = wrapped_model_language_model_layers_8_self_attn_o_proj_weight_palettized, x = var_2087)[name = tensor("linear_59")]; tensor var_22_promoted_51_to_fp16 = const()[name = tensor("op_22_promoted_51_to_fp16"), val = tensor(0x1p+1)]; tensor var_2093_cast_fp16 = pow(x = x_203, y = var_22_promoted_51_to_fp16)[name = tensor("op_2093_cast_fp16")]; tensor var_2095_axes_0 = const()[name = tensor("op_2095_axes_0"), val = tensor([-1])]; tensor var_2095_keep_dims_0 = const()[name = tensor("op_2095_keep_dims_0"), val = tensor(true)]; tensor var_2095_cast_fp16 = reduce_mean(axes = var_2095_axes_0, keep_dims = var_2095_keep_dims_0, x = var_2093_cast_fp16)[name = tensor("op_2095_cast_fp16")]; tensor var_2096_to_fp16 = const()[name = tensor("op_2096_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_2097_cast_fp16 = add(x = var_2095_cast_fp16, y = var_2096_to_fp16)[name = tensor("op_2097_cast_fp16")]; tensor var_2098_epsilon_0 = const()[name = tensor("op_2098_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_2098_cast_fp16 = rsqrt(epsilon = var_2098_epsilon_0, x = var_2097_cast_fp16)[name = tensor("op_2098_cast_fp16")]; tensor output_205_cast_fp16 = mul(x = x_203, y = var_2098_cast_fp16)[name = tensor("output_205_cast_fp16")]; tensor var_2102_to_fp16 = const()[name = tensor("op_2102_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940371712)))]; tensor output_207_cast_fp16 = mul(x = output_205_cast_fp16, y = var_2102_to_fp16)[name = tensor("output_207_cast_fp16")]; tensor x_207 = add(x = x_191, y = output_207_cast_fp16)[name = tensor("x_207")]; tensor var_22_promoted_52_to_fp16 = const()[name = tensor("op_22_promoted_52_to_fp16"), val = tensor(0x1p+1)]; tensor var_2108_cast_fp16 = pow(x = x_207, y = var_22_promoted_52_to_fp16)[name = tensor("op_2108_cast_fp16")]; tensor var_2110_axes_0 = const()[name = tensor("op_2110_axes_0"), val = tensor([-1])]; tensor var_2110_keep_dims_0 = const()[name = tensor("op_2110_keep_dims_0"), val = tensor(true)]; tensor var_2110_cast_fp16 = reduce_mean(axes = var_2110_axes_0, keep_dims = var_2110_keep_dims_0, x = var_2108_cast_fp16)[name = tensor("op_2110_cast_fp16")]; tensor var_2111_to_fp16 = const()[name = tensor("op_2111_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_2112_cast_fp16 = add(x = var_2110_cast_fp16, y = var_2111_to_fp16)[name = tensor("op_2112_cast_fp16")]; tensor var_2113_epsilon_0 = const()[name = tensor("op_2113_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_2113_cast_fp16 = rsqrt(epsilon = var_2113_epsilon_0, x = var_2112_cast_fp16)[name = tensor("op_2113_cast_fp16")]; tensor output_209_cast_fp16 = mul(x = x_207, y = var_2113_cast_fp16)[name = tensor("output_209_cast_fp16")]; tensor var_2117_to_fp16 = const()[name = tensor("op_2117_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940376896)))]; tensor output_211_cast_fp16 = mul(x = output_209_cast_fp16, y = var_2117_to_fp16)[name = tensor("output_211_cast_fp16")]; tensor input_105 = linear(bias = linear_4_bias_0, weight = wrapped_model_language_model_layers_8_mlp_gate_proj_weight_palettized, x = output_211_cast_fp16)[name = tensor("linear_60")]; tensor var_2125_mode_0 = const()[name = tensor("op_2125_mode_0"), val = tensor("TANH_APPROXIMATION")]; tensor var_2125 = gelu(mode = var_2125_mode_0, x = input_105)[name = tensor("op_2125")]; tensor var_2127 = linear(bias = linear_4_bias_0, weight = wrapped_model_language_model_layers_8_mlp_up_proj_weight_palettized, x = output_211_cast_fp16)[name = tensor("linear_61")]; tensor input_107 = mul(x = var_2125, y = var_2127)[name = tensor("input_107")]; tensor x_211 = linear(bias = linear_3_bias_0, weight = wrapped_model_language_model_layers_8_mlp_down_proj_weight_palettized, x = input_107)[name = tensor("linear_62")]; tensor var_22_promoted_53_to_fp16 = const()[name = tensor("op_22_promoted_53_to_fp16"), val = tensor(0x1p+1)]; tensor var_2133_cast_fp16 = pow(x = x_211, y = var_22_promoted_53_to_fp16)[name = tensor("op_2133_cast_fp16")]; tensor var_2135_axes_0 = const()[name = tensor("op_2135_axes_0"), val = tensor([-1])]; tensor var_2135_keep_dims_0 = const()[name = tensor("op_2135_keep_dims_0"), val = tensor(true)]; tensor var_2135_cast_fp16 = reduce_mean(axes = var_2135_axes_0, keep_dims = var_2135_keep_dims_0, x = var_2133_cast_fp16)[name = tensor("op_2135_cast_fp16")]; tensor var_2136_to_fp16 = const()[name = tensor("op_2136_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_2137_cast_fp16 = add(x = var_2135_cast_fp16, y = var_2136_to_fp16)[name = tensor("op_2137_cast_fp16")]; tensor var_2138_epsilon_0 = const()[name = tensor("op_2138_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_2138_cast_fp16 = rsqrt(epsilon = var_2138_epsilon_0, x = var_2137_cast_fp16)[name = tensor("op_2138_cast_fp16")]; tensor output_213_cast_fp16 = mul(x = x_211, y = var_2138_cast_fp16)[name = tensor("output_213_cast_fp16")]; tensor var_2142_to_fp16 = const()[name = tensor("op_2142_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940382080)))]; tensor output_215_cast_fp16 = mul(x = output_213_cast_fp16, y = var_2142_to_fp16)[name = tensor("output_215_cast_fp16")]; tensor x_215 = add(x = x_207, y = output_215_cast_fp16)[name = tensor("x_215")]; tensor var_22_promoted_54_to_fp16 = const()[name = tensor("op_22_promoted_54_to_fp16"), val = tensor(0x1p+1)]; tensor var_2154_cast_fp16 = pow(x = x_215, y = var_22_promoted_54_to_fp16)[name = tensor("op_2154_cast_fp16")]; tensor var_2156_axes_0 = const()[name = tensor("op_2156_axes_0"), val = tensor([-1])]; tensor var_2156_keep_dims_0 = const()[name = tensor("op_2156_keep_dims_0"), val = tensor(true)]; tensor var_2156_cast_fp16 = reduce_mean(axes = var_2156_axes_0, keep_dims = var_2156_keep_dims_0, x = var_2154_cast_fp16)[name = tensor("op_2156_cast_fp16")]; tensor var_2157_to_fp16 = const()[name = tensor("op_2157_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_2158_cast_fp16 = add(x = var_2156_cast_fp16, y = var_2157_to_fp16)[name = tensor("op_2158_cast_fp16")]; tensor var_2159_epsilon_0 = const()[name = tensor("op_2159_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_2159_cast_fp16 = rsqrt(epsilon = var_2159_epsilon_0, x = var_2158_cast_fp16)[name = tensor("op_2159_cast_fp16")]; tensor output_217_cast_fp16 = mul(x = x_215, y = var_2159_cast_fp16)[name = tensor("output_217_cast_fp16")]; tensor var_2163_to_fp16 = const()[name = tensor("op_2163_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940387264)))]; tensor output_219_cast_fp16 = mul(x = output_217_cast_fp16, y = var_2163_to_fp16)[name = tensor("output_219_cast_fp16")]; tensor var_2175 = linear(bias = linear_0_bias_0, weight = wrapped_model_language_model_layers_9_self_attn_q_proj_weight_palettized, x = output_219_cast_fp16)[name = tensor("linear_63")]; tensor var_2176 = const()[name = tensor("op_2176"), val = tensor([1, 256, -1, 256])]; tensor var_2177 = reshape(shape = var_2176, x = var_2175)[name = tensor("op_2177")]; tensor x_219_perm_0 = const()[name = tensor("x_219_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_2180 = linear(bias = linear_1_bias_0, weight = wrapped_model_language_model_layers_9_self_attn_k_proj_weight_palettized, x = output_219_cast_fp16)[name = tensor("linear_64")]; tensor var_2181 = const()[name = tensor("op_2181"), val = tensor([1, 256, -1, 256])]; tensor var_2182 = reshape(shape = var_2181, x = var_2180)[name = tensor("op_2182")]; tensor x_223_perm_0 = const()[name = tensor("x_223_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_2185 = linear(bias = linear_1_bias_0, weight = wrapped_model_language_model_layers_9_self_attn_v_proj_weight_palettized, x = output_219_cast_fp16)[name = tensor("linear_65")]; tensor var_2186 = const()[name = tensor("op_2186"), val = tensor([1, 256, -1, 256])]; tensor var_2187 = reshape(shape = var_2186, x = var_2185)[name = tensor("op_2187")]; tensor hidden_states_133_perm_0 = const()[name = tensor("hidden_states_133_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_22_promoted_55_to_fp16 = const()[name = tensor("op_22_promoted_55_to_fp16"), val = tensor(0x1p+1)]; tensor x_219 = transpose(perm = x_219_perm_0, x = var_2177)[name = tensor("transpose_99")]; tensor var_2191_cast_fp16 = pow(x = x_219, y = var_22_promoted_55_to_fp16)[name = tensor("op_2191_cast_fp16")]; tensor var_2193_axes_0 = const()[name = tensor("op_2193_axes_0"), val = tensor([-1])]; tensor var_2193_keep_dims_0 = const()[name = tensor("op_2193_keep_dims_0"), val = tensor(true)]; tensor var_2193_cast_fp16 = reduce_mean(axes = var_2193_axes_0, keep_dims = var_2193_keep_dims_0, x = var_2191_cast_fp16)[name = tensor("op_2193_cast_fp16")]; tensor var_2194_to_fp16 = const()[name = tensor("op_2194_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_2195_cast_fp16 = add(x = var_2193_cast_fp16, y = var_2194_to_fp16)[name = tensor("op_2195_cast_fp16")]; tensor var_2196_epsilon_0 = const()[name = tensor("op_2196_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_2196_cast_fp16 = rsqrt(epsilon = var_2196_epsilon_0, x = var_2195_cast_fp16)[name = tensor("op_2196_cast_fp16")]; tensor output_221_cast_fp16 = mul(x = x_219, y = var_2196_cast_fp16)[name = tensor("output_221_cast_fp16")]; tensor var_2200_to_fp16 = const()[name = tensor("op_2200_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940392448)))]; tensor output_223_cast_fp16 = mul(x = output_221_cast_fp16, y = var_2200_to_fp16)[name = tensor("output_223_cast_fp16")]; tensor var_22_promoted_56_to_fp16 = const()[name = tensor("op_22_promoted_56_to_fp16"), val = tensor(0x1p+1)]; tensor x_223 = transpose(perm = x_223_perm_0, x = var_2182)[name = tensor("transpose_98")]; tensor var_2205_cast_fp16 = pow(x = x_223, y = var_22_promoted_56_to_fp16)[name = tensor("op_2205_cast_fp16")]; tensor var_2207_axes_0 = const()[name = tensor("op_2207_axes_0"), val = tensor([-1])]; tensor var_2207_keep_dims_0 = const()[name = tensor("op_2207_keep_dims_0"), val = tensor(true)]; tensor var_2207_cast_fp16 = reduce_mean(axes = var_2207_axes_0, keep_dims = var_2207_keep_dims_0, x = var_2205_cast_fp16)[name = tensor("op_2207_cast_fp16")]; tensor var_2208_to_fp16 = const()[name = tensor("op_2208_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_2209_cast_fp16 = add(x = var_2207_cast_fp16, y = var_2208_to_fp16)[name = tensor("op_2209_cast_fp16")]; tensor var_2210_epsilon_0 = const()[name = tensor("op_2210_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_2210_cast_fp16 = rsqrt(epsilon = var_2210_epsilon_0, x = var_2209_cast_fp16)[name = tensor("op_2210_cast_fp16")]; tensor output_225_cast_fp16 = mul(x = x_223, y = var_2210_cast_fp16)[name = tensor("output_225_cast_fp16")]; tensor var_2214_to_fp16 = const()[name = tensor("op_2214_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940393024)))]; tensor output_227_cast_fp16 = mul(x = output_225_cast_fp16, y = var_2214_to_fp16)[name = tensor("output_227_cast_fp16")]; tensor var_2219 = mul(x = output_223_cast_fp16, y = cos_7_palettized)[name = tensor("op_2219")]; tensor x1_37_begin_0 = const()[name = tensor("x1_37_begin_0"), val = tensor([0, 0, 0, 0])]; tensor x1_37_end_0 = const()[name = tensor("x1_37_end_0"), val = tensor([1, 8, 256, 128])]; tensor x1_37_end_mask_0 = const()[name = tensor("x1_37_end_mask_0"), val = tensor([true, true, true, false])]; tensor x1_37 = slice_by_index(begin = x1_37_begin_0, end = x1_37_end_0, end_mask = x1_37_end_mask_0, x = output_223_cast_fp16)[name = tensor("x1_37")]; tensor x2_37_begin_0 = const()[name = tensor("x2_37_begin_0"), val = tensor([0, 0, 0, 128])]; tensor x2_37_end_0 = const()[name = tensor("x2_37_end_0"), val = tensor([1, 8, 256, 256])]; tensor x2_37_end_mask_0 = const()[name = tensor("x2_37_end_mask_0"), val = tensor([true, true, true, true])]; tensor x2_37 = slice_by_index(begin = x2_37_begin_0, end = x2_37_end_0, end_mask = x2_37_end_mask_0, x = output_223_cast_fp16)[name = tensor("x2_37")]; tensor const_242_promoted = const()[name = tensor("const_242_promoted"), val = tensor(-0x1p+0)]; tensor var_2230 = mul(x = x2_37, y = const_242_promoted)[name = tensor("op_2230")]; tensor var_2232_interleave_0 = const()[name = tensor("op_2232_interleave_0"), val = tensor(false)]; tensor var_2232 = concat(axis = var_24, interleave = var_2232_interleave_0, values = (var_2230, x1_37))[name = tensor("op_2232")]; tensor var_2233 = mul(x = var_2232, y = sin_7_palettized)[name = tensor("op_2233")]; tensor query_19 = add(x = var_2219, y = var_2233)[name = tensor("query_19")]; tensor var_2235 = mul(x = output_227_cast_fp16, y = cos_7_palettized)[name = tensor("op_2235")]; tensor x1_39_begin_0 = const()[name = tensor("x1_39_begin_0"), val = tensor([0, 0, 0, 0])]; tensor x1_39_end_0 = const()[name = tensor("x1_39_end_0"), val = tensor([1, 4, 256, 128])]; tensor x1_39_end_mask_0 = const()[name = tensor("x1_39_end_mask_0"), val = tensor([true, true, true, false])]; tensor x1_39 = slice_by_index(begin = x1_39_begin_0, end = x1_39_end_0, end_mask = x1_39_end_mask_0, x = output_227_cast_fp16)[name = tensor("x1_39")]; tensor x2_39_begin_0 = const()[name = tensor("x2_39_begin_0"), val = tensor([0, 0, 0, 128])]; tensor x2_39_end_0 = const()[name = tensor("x2_39_end_0"), val = tensor([1, 4, 256, 256])]; tensor x2_39_end_mask_0 = const()[name = tensor("x2_39_end_mask_0"), val = tensor([true, true, true, true])]; tensor x2_39 = slice_by_index(begin = x2_39_begin_0, end = x2_39_end_0, end_mask = x2_39_end_mask_0, x = output_227_cast_fp16)[name = tensor("x2_39")]; tensor const_245_promoted = const()[name = tensor("const_245_promoted"), val = tensor(-0x1p+0)]; tensor var_2246 = mul(x = x2_39, y = const_245_promoted)[name = tensor("op_2246")]; tensor var_2248_interleave_0 = const()[name = tensor("op_2248_interleave_0"), val = tensor(false)]; tensor var_2248 = concat(axis = var_24, interleave = var_2248_interleave_0, values = (var_2246, x1_39))[name = tensor("op_2248")]; tensor var_2249 = mul(x = var_2248, y = sin_7_palettized)[name = tensor("op_2249")]; tensor hidden_states_129 = add(x = var_2235, y = var_2249)[name = tensor("hidden_states_129")]; tensor var_2258_axes_0 = const()[name = tensor("op_2258_axes_0"), val = tensor([2])]; tensor var_2258 = expand_dims(axes = var_2258_axes_0, x = hidden_states_129)[name = tensor("op_2258")]; tensor hidden_states_131_reps_0 = const()[name = tensor("hidden_states_131_reps_0"), val = tensor([1, 1, 2, 1, 1])]; tensor hidden_states_131 = tile(reps = hidden_states_131_reps_0, x = var_2258)[name = tensor("hidden_states_131")]; tensor var_2266 = const()[name = tensor("op_2266"), val = tensor([1, 8, 256, 256])]; tensor key_states_19 = reshape(shape = var_2266, x = hidden_states_131)[name = tensor("key_states_19")]; tensor var_2275_axes_0 = const()[name = tensor("op_2275_axes_0"), val = tensor([2])]; tensor hidden_states_133 = transpose(perm = hidden_states_133_perm_0, x = var_2187)[name = tensor("transpose_97")]; tensor var_2275 = expand_dims(axes = var_2275_axes_0, x = hidden_states_133)[name = tensor("op_2275")]; tensor hidden_states_135_reps_0 = const()[name = tensor("hidden_states_135_reps_0"), val = tensor([1, 1, 2, 1, 1])]; tensor hidden_states_135 = tile(reps = hidden_states_135_reps_0, x = var_2275)[name = tensor("hidden_states_135")]; tensor var_2283 = const()[name = tensor("op_2283"), val = tensor([1, 8, 256, 256])]; tensor value_states_19 = reshape(shape = var_2283, x = hidden_states_135)[name = tensor("value_states_19")]; tensor var_2286_transpose_x_1 = const()[name = tensor("op_2286_transpose_x_1"), val = tensor(false)]; tensor var_2286_transpose_y_1 = const()[name = tensor("op_2286_transpose_y_1"), val = tensor(true)]; tensor var_2286 = matmul(transpose_x = var_2286_transpose_x_1, transpose_y = var_2286_transpose_y_1, x = query_19, y = key_states_19)[name = tensor("op_2286")]; tensor var_2287_to_fp16 = const()[name = tensor("op_2287_to_fp16"), val = tensor(0x1p-4)]; tensor attn_weights_37_cast_fp16 = mul(x = var_2286, y = var_2287_to_fp16)[name = tensor("attn_weights_37_cast_fp16")]; tensor input_109_cast_fp16 = add(x = attn_weights_37_cast_fp16, y = attention_mask_to_fp16_palettized)[name = tensor("input_109_cast_fp16")]; tensor var_2295_cast_fp16 = softmax(axis = var_24, x = input_109_cast_fp16)[name = tensor("op_2295_cast_fp16")]; tensor attn_output_37_transpose_x_0 = const()[name = tensor("attn_output_37_transpose_x_0"), val = tensor(false)]; tensor attn_output_37_transpose_y_0 = const()[name = tensor("attn_output_37_transpose_y_0"), val = tensor(false)]; tensor attn_output_37 = matmul(transpose_x = attn_output_37_transpose_x_0, transpose_y = attn_output_37_transpose_y_0, x = var_2295_cast_fp16, y = value_states_19)[name = tensor("attn_output_37")]; tensor var_2299_perm_0 = const()[name = tensor("op_2299_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_2301 = const()[name = tensor("op_2301"), val = tensor([1, 256, -1])]; tensor var_2299 = transpose(perm = var_2299_perm_0, x = attn_output_37)[name = tensor("transpose_96")]; tensor var_2302 = reshape(shape = var_2301, x = var_2299)[name = tensor("op_2302")]; tensor x_227 = linear(bias = linear_3_bias_0, weight = wrapped_model_language_model_layers_9_self_attn_o_proj_weight_palettized, x = var_2302)[name = tensor("linear_66")]; tensor var_22_promoted_57_to_fp16 = const()[name = tensor("op_22_promoted_57_to_fp16"), val = tensor(0x1p+1)]; tensor var_2308_cast_fp16 = pow(x = x_227, y = var_22_promoted_57_to_fp16)[name = tensor("op_2308_cast_fp16")]; tensor var_2310_axes_0 = const()[name = tensor("op_2310_axes_0"), val = tensor([-1])]; tensor var_2310_keep_dims_0 = const()[name = tensor("op_2310_keep_dims_0"), val = tensor(true)]; tensor var_2310_cast_fp16 = reduce_mean(axes = var_2310_axes_0, keep_dims = var_2310_keep_dims_0, x = var_2308_cast_fp16)[name = tensor("op_2310_cast_fp16")]; tensor var_2311_to_fp16 = const()[name = tensor("op_2311_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_2312_cast_fp16 = add(x = var_2310_cast_fp16, y = var_2311_to_fp16)[name = tensor("op_2312_cast_fp16")]; tensor var_2313_epsilon_0 = const()[name = tensor("op_2313_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_2313_cast_fp16 = rsqrt(epsilon = var_2313_epsilon_0, x = var_2312_cast_fp16)[name = tensor("op_2313_cast_fp16")]; tensor output_229_cast_fp16 = mul(x = x_227, y = var_2313_cast_fp16)[name = tensor("output_229_cast_fp16")]; tensor var_2317_to_fp16 = const()[name = tensor("op_2317_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940393600)))]; tensor output_231_cast_fp16 = mul(x = output_229_cast_fp16, y = var_2317_to_fp16)[name = tensor("output_231_cast_fp16")]; tensor x_231 = add(x = x_215, y = output_231_cast_fp16)[name = tensor("x_231")]; tensor var_22_promoted_58_to_fp16 = const()[name = tensor("op_22_promoted_58_to_fp16"), val = tensor(0x1p+1)]; tensor var_2323_cast_fp16 = pow(x = x_231, y = var_22_promoted_58_to_fp16)[name = tensor("op_2323_cast_fp16")]; tensor var_2325_axes_0 = const()[name = tensor("op_2325_axes_0"), val = tensor([-1])]; tensor var_2325_keep_dims_0 = const()[name = tensor("op_2325_keep_dims_0"), val = tensor(true)]; tensor var_2325_cast_fp16 = reduce_mean(axes = var_2325_axes_0, keep_dims = var_2325_keep_dims_0, x = var_2323_cast_fp16)[name = tensor("op_2325_cast_fp16")]; tensor var_2326_to_fp16 = const()[name = tensor("op_2326_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_2327_cast_fp16 = add(x = var_2325_cast_fp16, y = var_2326_to_fp16)[name = tensor("op_2327_cast_fp16")]; tensor var_2328_epsilon_0 = const()[name = tensor("op_2328_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_2328_cast_fp16 = rsqrt(epsilon = var_2328_epsilon_0, x = var_2327_cast_fp16)[name = tensor("op_2328_cast_fp16")]; tensor output_233_cast_fp16 = mul(x = x_231, y = var_2328_cast_fp16)[name = tensor("output_233_cast_fp16")]; tensor var_2332_to_fp16 = const()[name = tensor("op_2332_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940398784)))]; tensor output_235_cast_fp16 = mul(x = output_233_cast_fp16, y = var_2332_to_fp16)[name = tensor("output_235_cast_fp16")]; tensor input_117 = linear(bias = linear_4_bias_0, weight = wrapped_model_language_model_layers_9_mlp_gate_proj_weight_palettized, x = output_235_cast_fp16)[name = tensor("linear_67")]; tensor var_2340_mode_0 = const()[name = tensor("op_2340_mode_0"), val = tensor("TANH_APPROXIMATION")]; tensor var_2340 = gelu(mode = var_2340_mode_0, x = input_117)[name = tensor("op_2340")]; tensor var_2342 = linear(bias = linear_4_bias_0, weight = wrapped_model_language_model_layers_9_mlp_up_proj_weight_palettized, x = output_235_cast_fp16)[name = tensor("linear_68")]; tensor input_119 = mul(x = var_2340, y = var_2342)[name = tensor("input_119")]; tensor x_235 = linear(bias = linear_3_bias_0, weight = wrapped_model_language_model_layers_9_mlp_down_proj_weight_palettized, x = input_119)[name = tensor("linear_69")]; tensor var_22_promoted_59_to_fp16 = const()[name = tensor("op_22_promoted_59_to_fp16"), val = tensor(0x1p+1)]; tensor var_2348_cast_fp16 = pow(x = x_235, y = var_22_promoted_59_to_fp16)[name = tensor("op_2348_cast_fp16")]; tensor var_2350_axes_0 = const()[name = tensor("op_2350_axes_0"), val = tensor([-1])]; tensor var_2350_keep_dims_0 = const()[name = tensor("op_2350_keep_dims_0"), val = tensor(true)]; tensor var_2350_cast_fp16 = reduce_mean(axes = var_2350_axes_0, keep_dims = var_2350_keep_dims_0, x = var_2348_cast_fp16)[name = tensor("op_2350_cast_fp16")]; tensor var_2351_to_fp16 = const()[name = tensor("op_2351_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_2352_cast_fp16 = add(x = var_2350_cast_fp16, y = var_2351_to_fp16)[name = tensor("op_2352_cast_fp16")]; tensor var_2353_epsilon_0 = const()[name = tensor("op_2353_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_2353_cast_fp16 = rsqrt(epsilon = var_2353_epsilon_0, x = var_2352_cast_fp16)[name = tensor("op_2353_cast_fp16")]; tensor output_237_cast_fp16 = mul(x = x_235, y = var_2353_cast_fp16)[name = tensor("output_237_cast_fp16")]; tensor var_2357_to_fp16 = const()[name = tensor("op_2357_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940403968)))]; tensor output_239_cast_fp16 = mul(x = output_237_cast_fp16, y = var_2357_to_fp16)[name = tensor("output_239_cast_fp16")]; tensor x_239 = add(x = x_231, y = output_239_cast_fp16)[name = tensor("x_239")]; tensor var_22_promoted_60_to_fp16 = const()[name = tensor("op_22_promoted_60_to_fp16"), val = tensor(0x1p+1)]; tensor var_2369_cast_fp16 = pow(x = x_239, y = var_22_promoted_60_to_fp16)[name = tensor("op_2369_cast_fp16")]; tensor var_2371_axes_0 = const()[name = tensor("op_2371_axes_0"), val = tensor([-1])]; tensor var_2371_keep_dims_0 = const()[name = tensor("op_2371_keep_dims_0"), val = tensor(true)]; tensor var_2371_cast_fp16 = reduce_mean(axes = var_2371_axes_0, keep_dims = var_2371_keep_dims_0, x = var_2369_cast_fp16)[name = tensor("op_2371_cast_fp16")]; tensor var_2372_to_fp16 = const()[name = tensor("op_2372_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_2373_cast_fp16 = add(x = var_2371_cast_fp16, y = var_2372_to_fp16)[name = tensor("op_2373_cast_fp16")]; tensor var_2374_epsilon_0 = const()[name = tensor("op_2374_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_2374_cast_fp16 = rsqrt(epsilon = var_2374_epsilon_0, x = var_2373_cast_fp16)[name = tensor("op_2374_cast_fp16")]; tensor output_241_cast_fp16 = mul(x = x_239, y = var_2374_cast_fp16)[name = tensor("output_241_cast_fp16")]; tensor var_2378_to_fp16 = const()[name = tensor("op_2378_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940409152)))]; tensor output_243_cast_fp16 = mul(x = output_241_cast_fp16, y = var_2378_to_fp16)[name = tensor("output_243_cast_fp16")]; tensor var_2390 = linear(bias = linear_0_bias_0, weight = wrapped_model_language_model_layers_10_self_attn_q_proj_weight_palettized, x = output_243_cast_fp16)[name = tensor("linear_70")]; tensor var_2391 = const()[name = tensor("op_2391"), val = tensor([1, 256, -1, 256])]; tensor var_2392 = reshape(shape = var_2391, x = var_2390)[name = tensor("op_2392")]; tensor x_243_perm_0 = const()[name = tensor("x_243_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_2395 = linear(bias = linear_1_bias_0, weight = wrapped_model_language_model_layers_10_self_attn_k_proj_weight_palettized, x = output_243_cast_fp16)[name = tensor("linear_71")]; tensor var_2396 = const()[name = tensor("op_2396"), val = tensor([1, 256, -1, 256])]; tensor var_2397 = reshape(shape = var_2396, x = var_2395)[name = tensor("op_2397")]; tensor x_247_perm_0 = const()[name = tensor("x_247_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_2400 = linear(bias = linear_1_bias_0, weight = wrapped_model_language_model_layers_10_self_attn_v_proj_weight_palettized, x = output_243_cast_fp16)[name = tensor("linear_72")]; tensor var_2401 = const()[name = tensor("op_2401"), val = tensor([1, 256, -1, 256])]; tensor var_2402 = reshape(shape = var_2401, x = var_2400)[name = tensor("op_2402")]; tensor hidden_states_147_perm_0 = const()[name = tensor("hidden_states_147_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_22_promoted_61_to_fp16 = const()[name = tensor("op_22_promoted_61_to_fp16"), val = tensor(0x1p+1)]; tensor x_243 = transpose(perm = x_243_perm_0, x = var_2392)[name = tensor("transpose_95")]; tensor var_2406_cast_fp16 = pow(x = x_243, y = var_22_promoted_61_to_fp16)[name = tensor("op_2406_cast_fp16")]; tensor var_2408_axes_0 = const()[name = tensor("op_2408_axes_0"), val = tensor([-1])]; tensor var_2408_keep_dims_0 = const()[name = tensor("op_2408_keep_dims_0"), val = tensor(true)]; tensor var_2408_cast_fp16 = reduce_mean(axes = var_2408_axes_0, keep_dims = var_2408_keep_dims_0, x = var_2406_cast_fp16)[name = tensor("op_2408_cast_fp16")]; tensor var_2409_to_fp16 = const()[name = tensor("op_2409_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_2410_cast_fp16 = add(x = var_2408_cast_fp16, y = var_2409_to_fp16)[name = tensor("op_2410_cast_fp16")]; tensor var_2411_epsilon_0 = const()[name = tensor("op_2411_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_2411_cast_fp16 = rsqrt(epsilon = var_2411_epsilon_0, x = var_2410_cast_fp16)[name = tensor("op_2411_cast_fp16")]; tensor output_245_cast_fp16 = mul(x = x_243, y = var_2411_cast_fp16)[name = tensor("output_245_cast_fp16")]; tensor var_2415_to_fp16 = const()[name = tensor("op_2415_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940414336)))]; tensor output_247_cast_fp16 = mul(x = output_245_cast_fp16, y = var_2415_to_fp16)[name = tensor("output_247_cast_fp16")]; tensor var_22_promoted_62_to_fp16 = const()[name = tensor("op_22_promoted_62_to_fp16"), val = tensor(0x1p+1)]; tensor x_247 = transpose(perm = x_247_perm_0, x = var_2397)[name = tensor("transpose_94")]; tensor var_2420_cast_fp16 = pow(x = x_247, y = var_22_promoted_62_to_fp16)[name = tensor("op_2420_cast_fp16")]; tensor var_2422_axes_0 = const()[name = tensor("op_2422_axes_0"), val = tensor([-1])]; tensor var_2422_keep_dims_0 = const()[name = tensor("op_2422_keep_dims_0"), val = tensor(true)]; tensor var_2422_cast_fp16 = reduce_mean(axes = var_2422_axes_0, keep_dims = var_2422_keep_dims_0, x = var_2420_cast_fp16)[name = tensor("op_2422_cast_fp16")]; tensor var_2423_to_fp16 = const()[name = tensor("op_2423_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_2424_cast_fp16 = add(x = var_2422_cast_fp16, y = var_2423_to_fp16)[name = tensor("op_2424_cast_fp16")]; tensor var_2425_epsilon_0 = const()[name = tensor("op_2425_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_2425_cast_fp16 = rsqrt(epsilon = var_2425_epsilon_0, x = var_2424_cast_fp16)[name = tensor("op_2425_cast_fp16")]; tensor output_249_cast_fp16 = mul(x = x_247, y = var_2425_cast_fp16)[name = tensor("output_249_cast_fp16")]; tensor var_2429_to_fp16 = const()[name = tensor("op_2429_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940414912)))]; tensor output_251_cast_fp16 = mul(x = output_249_cast_fp16, y = var_2429_to_fp16)[name = tensor("output_251_cast_fp16")]; tensor var_2434 = mul(x = output_247_cast_fp16, y = cos_7_palettized)[name = tensor("op_2434")]; tensor x1_41_begin_0 = const()[name = tensor("x1_41_begin_0"), val = tensor([0, 0, 0, 0])]; tensor x1_41_end_0 = const()[name = tensor("x1_41_end_0"), val = tensor([1, 8, 256, 128])]; tensor x1_41_end_mask_0 = const()[name = tensor("x1_41_end_mask_0"), val = tensor([true, true, true, false])]; tensor x1_41 = slice_by_index(begin = x1_41_begin_0, end = x1_41_end_0, end_mask = x1_41_end_mask_0, x = output_247_cast_fp16)[name = tensor("x1_41")]; tensor x2_41_begin_0 = const()[name = tensor("x2_41_begin_0"), val = tensor([0, 0, 0, 128])]; tensor x2_41_end_0 = const()[name = tensor("x2_41_end_0"), val = tensor([1, 8, 256, 256])]; tensor x2_41_end_mask_0 = const()[name = tensor("x2_41_end_mask_0"), val = tensor([true, true, true, true])]; tensor x2_41 = slice_by_index(begin = x2_41_begin_0, end = x2_41_end_0, end_mask = x2_41_end_mask_0, x = output_247_cast_fp16)[name = tensor("x2_41")]; tensor const_265_promoted = const()[name = tensor("const_265_promoted"), val = tensor(-0x1p+0)]; tensor var_2445 = mul(x = x2_41, y = const_265_promoted)[name = tensor("op_2445")]; tensor var_2447_interleave_0 = const()[name = tensor("op_2447_interleave_0"), val = tensor(false)]; tensor var_2447 = concat(axis = var_24, interleave = var_2447_interleave_0, values = (var_2445, x1_41))[name = tensor("op_2447")]; tensor var_2448 = mul(x = var_2447, y = sin_7_palettized)[name = tensor("op_2448")]; tensor query_21 = add(x = var_2434, y = var_2448)[name = tensor("query_21")]; tensor var_2450 = mul(x = output_251_cast_fp16, y = cos_7_palettized)[name = tensor("op_2450")]; tensor x1_43_begin_0 = const()[name = tensor("x1_43_begin_0"), val = tensor([0, 0, 0, 0])]; tensor x1_43_end_0 = const()[name = tensor("x1_43_end_0"), val = tensor([1, 4, 256, 128])]; tensor x1_43_end_mask_0 = const()[name = tensor("x1_43_end_mask_0"), val = tensor([true, true, true, false])]; tensor x1_43 = slice_by_index(begin = x1_43_begin_0, end = x1_43_end_0, end_mask = x1_43_end_mask_0, x = output_251_cast_fp16)[name = tensor("x1_43")]; tensor x2_43_begin_0 = const()[name = tensor("x2_43_begin_0"), val = tensor([0, 0, 0, 128])]; tensor x2_43_end_0 = const()[name = tensor("x2_43_end_0"), val = tensor([1, 4, 256, 256])]; tensor x2_43_end_mask_0 = const()[name = tensor("x2_43_end_mask_0"), val = tensor([true, true, true, true])]; tensor x2_43 = slice_by_index(begin = x2_43_begin_0, end = x2_43_end_0, end_mask = x2_43_end_mask_0, x = output_251_cast_fp16)[name = tensor("x2_43")]; tensor const_268_promoted = const()[name = tensor("const_268_promoted"), val = tensor(-0x1p+0)]; tensor var_2461 = mul(x = x2_43, y = const_268_promoted)[name = tensor("op_2461")]; tensor var_2463_interleave_0 = const()[name = tensor("op_2463_interleave_0"), val = tensor(false)]; tensor var_2463 = concat(axis = var_24, interleave = var_2463_interleave_0, values = (var_2461, x1_43))[name = tensor("op_2463")]; tensor var_2464 = mul(x = var_2463, y = sin_7_palettized)[name = tensor("op_2464")]; tensor hidden_states_143 = add(x = var_2450, y = var_2464)[name = tensor("hidden_states_143")]; tensor var_2473_axes_0 = const()[name = tensor("op_2473_axes_0"), val = tensor([2])]; tensor var_2473 = expand_dims(axes = var_2473_axes_0, x = hidden_states_143)[name = tensor("op_2473")]; tensor hidden_states_145_reps_0 = const()[name = tensor("hidden_states_145_reps_0"), val = tensor([1, 1, 2, 1, 1])]; tensor hidden_states_145 = tile(reps = hidden_states_145_reps_0, x = var_2473)[name = tensor("hidden_states_145")]; tensor var_2481 = const()[name = tensor("op_2481"), val = tensor([1, 8, 256, 256])]; tensor key_states_21 = reshape(shape = var_2481, x = hidden_states_145)[name = tensor("key_states_21")]; tensor var_2490_axes_0 = const()[name = tensor("op_2490_axes_0"), val = tensor([2])]; tensor hidden_states_147 = transpose(perm = hidden_states_147_perm_0, x = var_2402)[name = tensor("transpose_93")]; tensor var_2490 = expand_dims(axes = var_2490_axes_0, x = hidden_states_147)[name = tensor("op_2490")]; tensor hidden_states_149_reps_0 = const()[name = tensor("hidden_states_149_reps_0"), val = tensor([1, 1, 2, 1, 1])]; tensor hidden_states_149 = tile(reps = hidden_states_149_reps_0, x = var_2490)[name = tensor("hidden_states_149")]; tensor var_2498 = const()[name = tensor("op_2498"), val = tensor([1, 8, 256, 256])]; tensor value_states_21 = reshape(shape = var_2498, x = hidden_states_149)[name = tensor("value_states_21")]; tensor var_2501_transpose_x_1 = const()[name = tensor("op_2501_transpose_x_1"), val = tensor(false)]; tensor var_2501_transpose_y_1 = const()[name = tensor("op_2501_transpose_y_1"), val = tensor(true)]; tensor var_2501 = matmul(transpose_x = var_2501_transpose_x_1, transpose_y = var_2501_transpose_y_1, x = query_21, y = key_states_21)[name = tensor("op_2501")]; tensor var_2502_to_fp16 = const()[name = tensor("op_2502_to_fp16"), val = tensor(0x1p-4)]; tensor attn_weights_41_cast_fp16 = mul(x = var_2501, y = var_2502_to_fp16)[name = tensor("attn_weights_41_cast_fp16")]; tensor input_121_cast_fp16 = add(x = attn_weights_41_cast_fp16, y = attention_mask_to_fp16_palettized)[name = tensor("input_121_cast_fp16")]; tensor var_2510_cast_fp16 = softmax(axis = var_24, x = input_121_cast_fp16)[name = tensor("op_2510_cast_fp16")]; tensor attn_output_41_transpose_x_0 = const()[name = tensor("attn_output_41_transpose_x_0"), val = tensor(false)]; tensor attn_output_41_transpose_y_0 = const()[name = tensor("attn_output_41_transpose_y_0"), val = tensor(false)]; tensor attn_output_41 = matmul(transpose_x = attn_output_41_transpose_x_0, transpose_y = attn_output_41_transpose_y_0, x = var_2510_cast_fp16, y = value_states_21)[name = tensor("attn_output_41")]; tensor var_2514_perm_0 = const()[name = tensor("op_2514_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_2516 = const()[name = tensor("op_2516"), val = tensor([1, 256, -1])]; tensor var_2514 = transpose(perm = var_2514_perm_0, x = attn_output_41)[name = tensor("transpose_92")]; tensor var_2517 = reshape(shape = var_2516, x = var_2514)[name = tensor("op_2517")]; tensor x_251 = linear(bias = linear_3_bias_0, weight = wrapped_model_language_model_layers_10_self_attn_o_proj_weight_palettized, x = var_2517)[name = tensor("linear_73")]; tensor var_22_promoted_63_to_fp16 = const()[name = tensor("op_22_promoted_63_to_fp16"), val = tensor(0x1p+1)]; tensor var_2523_cast_fp16 = pow(x = x_251, y = var_22_promoted_63_to_fp16)[name = tensor("op_2523_cast_fp16")]; tensor var_2525_axes_0 = const()[name = tensor("op_2525_axes_0"), val = tensor([-1])]; tensor var_2525_keep_dims_0 = const()[name = tensor("op_2525_keep_dims_0"), val = tensor(true)]; tensor var_2525_cast_fp16 = reduce_mean(axes = var_2525_axes_0, keep_dims = var_2525_keep_dims_0, x = var_2523_cast_fp16)[name = tensor("op_2525_cast_fp16")]; tensor var_2526_to_fp16 = const()[name = tensor("op_2526_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_2527_cast_fp16 = add(x = var_2525_cast_fp16, y = var_2526_to_fp16)[name = tensor("op_2527_cast_fp16")]; tensor var_2528_epsilon_0 = const()[name = tensor("op_2528_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_2528_cast_fp16 = rsqrt(epsilon = var_2528_epsilon_0, x = var_2527_cast_fp16)[name = tensor("op_2528_cast_fp16")]; tensor output_253_cast_fp16 = mul(x = x_251, y = var_2528_cast_fp16)[name = tensor("output_253_cast_fp16")]; tensor var_2532_to_fp16 = const()[name = tensor("op_2532_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940415488)))]; tensor output_255_cast_fp16 = mul(x = output_253_cast_fp16, y = var_2532_to_fp16)[name = tensor("output_255_cast_fp16")]; tensor x_255 = add(x = x_239, y = output_255_cast_fp16)[name = tensor("x_255")]; tensor var_22_promoted_64_to_fp16 = const()[name = tensor("op_22_promoted_64_to_fp16"), val = tensor(0x1p+1)]; tensor var_2538_cast_fp16 = pow(x = x_255, y = var_22_promoted_64_to_fp16)[name = tensor("op_2538_cast_fp16")]; tensor var_2540_axes_0 = const()[name = tensor("op_2540_axes_0"), val = tensor([-1])]; tensor var_2540_keep_dims_0 = const()[name = tensor("op_2540_keep_dims_0"), val = tensor(true)]; tensor var_2540_cast_fp16 = reduce_mean(axes = var_2540_axes_0, keep_dims = var_2540_keep_dims_0, x = var_2538_cast_fp16)[name = tensor("op_2540_cast_fp16")]; tensor var_2541_to_fp16 = const()[name = tensor("op_2541_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_2542_cast_fp16 = add(x = var_2540_cast_fp16, y = var_2541_to_fp16)[name = tensor("op_2542_cast_fp16")]; tensor var_2543_epsilon_0 = const()[name = tensor("op_2543_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_2543_cast_fp16 = rsqrt(epsilon = var_2543_epsilon_0, x = var_2542_cast_fp16)[name = tensor("op_2543_cast_fp16")]; tensor output_257_cast_fp16 = mul(x = x_255, y = var_2543_cast_fp16)[name = tensor("output_257_cast_fp16")]; tensor var_2547_to_fp16 = const()[name = tensor("op_2547_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940420672)))]; tensor output_259_cast_fp16 = mul(x = output_257_cast_fp16, y = var_2547_to_fp16)[name = tensor("output_259_cast_fp16")]; tensor input_129 = linear(bias = linear_4_bias_0, weight = wrapped_model_language_model_layers_10_mlp_gate_proj_weight_palettized, x = output_259_cast_fp16)[name = tensor("linear_74")]; tensor var_2555_mode_0 = const()[name = tensor("op_2555_mode_0"), val = tensor("TANH_APPROXIMATION")]; tensor var_2555 = gelu(mode = var_2555_mode_0, x = input_129)[name = tensor("op_2555")]; tensor var_2557 = linear(bias = linear_4_bias_0, weight = wrapped_model_language_model_layers_10_mlp_up_proj_weight_palettized, x = output_259_cast_fp16)[name = tensor("linear_75")]; tensor input_131 = mul(x = var_2555, y = var_2557)[name = tensor("input_131")]; tensor x_259 = linear(bias = linear_3_bias_0, weight = wrapped_model_language_model_layers_10_mlp_down_proj_weight_palettized, x = input_131)[name = tensor("linear_76")]; tensor var_22_promoted_65_to_fp16 = const()[name = tensor("op_22_promoted_65_to_fp16"), val = tensor(0x1p+1)]; tensor var_2563_cast_fp16 = pow(x = x_259, y = var_22_promoted_65_to_fp16)[name = tensor("op_2563_cast_fp16")]; tensor var_2565_axes_0 = const()[name = tensor("op_2565_axes_0"), val = tensor([-1])]; tensor var_2565_keep_dims_0 = const()[name = tensor("op_2565_keep_dims_0"), val = tensor(true)]; tensor var_2565_cast_fp16 = reduce_mean(axes = var_2565_axes_0, keep_dims = var_2565_keep_dims_0, x = var_2563_cast_fp16)[name = tensor("op_2565_cast_fp16")]; tensor var_2566_to_fp16 = const()[name = tensor("op_2566_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_2567_cast_fp16 = add(x = var_2565_cast_fp16, y = var_2566_to_fp16)[name = tensor("op_2567_cast_fp16")]; tensor var_2568_epsilon_0 = const()[name = tensor("op_2568_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_2568_cast_fp16 = rsqrt(epsilon = var_2568_epsilon_0, x = var_2567_cast_fp16)[name = tensor("op_2568_cast_fp16")]; tensor output_261_cast_fp16 = mul(x = x_259, y = var_2568_cast_fp16)[name = tensor("output_261_cast_fp16")]; tensor var_2572_to_fp16 = const()[name = tensor("op_2572_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940425856)))]; tensor output_263_cast_fp16 = mul(x = output_261_cast_fp16, y = var_2572_to_fp16)[name = tensor("output_263_cast_fp16")]; tensor x_263 = add(x = x_255, y = output_263_cast_fp16)[name = tensor("x_263")]; tensor var_22_promoted_66_to_fp16 = const()[name = tensor("op_22_promoted_66_to_fp16"), val = tensor(0x1p+1)]; tensor var_2584_cast_fp16 = pow(x = x_263, y = var_22_promoted_66_to_fp16)[name = tensor("op_2584_cast_fp16")]; tensor var_2586_axes_0 = const()[name = tensor("op_2586_axes_0"), val = tensor([-1])]; tensor var_2586_keep_dims_0 = const()[name = tensor("op_2586_keep_dims_0"), val = tensor(true)]; tensor var_2586_cast_fp16 = reduce_mean(axes = var_2586_axes_0, keep_dims = var_2586_keep_dims_0, x = var_2584_cast_fp16)[name = tensor("op_2586_cast_fp16")]; tensor var_2587_to_fp16 = const()[name = tensor("op_2587_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_2588_cast_fp16 = add(x = var_2586_cast_fp16, y = var_2587_to_fp16)[name = tensor("op_2588_cast_fp16")]; tensor var_2589_epsilon_0 = const()[name = tensor("op_2589_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_2589_cast_fp16 = rsqrt(epsilon = var_2589_epsilon_0, x = var_2588_cast_fp16)[name = tensor("op_2589_cast_fp16")]; tensor output_265_cast_fp16 = mul(x = x_263, y = var_2589_cast_fp16)[name = tensor("output_265_cast_fp16")]; tensor var_2593_to_fp16 = const()[name = tensor("op_2593_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940431040)))]; tensor output_267_cast_fp16 = mul(x = output_265_cast_fp16, y = var_2593_to_fp16)[name = tensor("output_267_cast_fp16")]; tensor var_2605 = linear(bias = linear_0_bias_0, weight = wrapped_model_language_model_layers_11_self_attn_q_proj_weight_palettized, x = output_267_cast_fp16)[name = tensor("linear_77")]; tensor var_2606 = const()[name = tensor("op_2606"), val = tensor([1, 256, -1, 256])]; tensor var_2607 = reshape(shape = var_2606, x = var_2605)[name = tensor("op_2607")]; tensor x_267_perm_0 = const()[name = tensor("x_267_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_2610 = linear(bias = linear_1_bias_0, weight = wrapped_model_language_model_layers_11_self_attn_k_proj_weight_palettized, x = output_267_cast_fp16)[name = tensor("linear_78")]; tensor var_2611 = const()[name = tensor("op_2611"), val = tensor([1, 256, -1, 256])]; tensor var_2612 = reshape(shape = var_2611, x = var_2610)[name = tensor("op_2612")]; tensor x_271_perm_0 = const()[name = tensor("x_271_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_2615 = linear(bias = linear_1_bias_0, weight = wrapped_model_language_model_layers_11_self_attn_v_proj_weight_palettized, x = output_267_cast_fp16)[name = tensor("linear_79")]; tensor var_2616 = const()[name = tensor("op_2616"), val = tensor([1, 256, -1, 256])]; tensor var_2617 = reshape(shape = var_2616, x = var_2615)[name = tensor("op_2617")]; tensor hidden_states_161_perm_0 = const()[name = tensor("hidden_states_161_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_22_promoted_67_to_fp16 = const()[name = tensor("op_22_promoted_67_to_fp16"), val = tensor(0x1p+1)]; tensor x_267 = transpose(perm = x_267_perm_0, x = var_2607)[name = tensor("transpose_91")]; tensor var_2621_cast_fp16 = pow(x = x_267, y = var_22_promoted_67_to_fp16)[name = tensor("op_2621_cast_fp16")]; tensor var_2623_axes_0 = const()[name = tensor("op_2623_axes_0"), val = tensor([-1])]; tensor var_2623_keep_dims_0 = const()[name = tensor("op_2623_keep_dims_0"), val = tensor(true)]; tensor var_2623_cast_fp16 = reduce_mean(axes = var_2623_axes_0, keep_dims = var_2623_keep_dims_0, x = var_2621_cast_fp16)[name = tensor("op_2623_cast_fp16")]; tensor var_2624_to_fp16 = const()[name = tensor("op_2624_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_2625_cast_fp16 = add(x = var_2623_cast_fp16, y = var_2624_to_fp16)[name = tensor("op_2625_cast_fp16")]; tensor var_2626_epsilon_0 = const()[name = tensor("op_2626_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_2626_cast_fp16 = rsqrt(epsilon = var_2626_epsilon_0, x = var_2625_cast_fp16)[name = tensor("op_2626_cast_fp16")]; tensor output_269_cast_fp16 = mul(x = x_267, y = var_2626_cast_fp16)[name = tensor("output_269_cast_fp16")]; tensor var_2630_to_fp16 = const()[name = tensor("op_2630_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940436224)))]; tensor output_271_cast_fp16 = mul(x = output_269_cast_fp16, y = var_2630_to_fp16)[name = tensor("output_271_cast_fp16")]; tensor var_22_promoted_68_to_fp16 = const()[name = tensor("op_22_promoted_68_to_fp16"), val = tensor(0x1p+1)]; tensor x_271 = transpose(perm = x_271_perm_0, x = var_2612)[name = tensor("transpose_90")]; tensor var_2635_cast_fp16 = pow(x = x_271, y = var_22_promoted_68_to_fp16)[name = tensor("op_2635_cast_fp16")]; tensor var_2637_axes_0 = const()[name = tensor("op_2637_axes_0"), val = tensor([-1])]; tensor var_2637_keep_dims_0 = const()[name = tensor("op_2637_keep_dims_0"), val = tensor(true)]; tensor var_2637_cast_fp16 = reduce_mean(axes = var_2637_axes_0, keep_dims = var_2637_keep_dims_0, x = var_2635_cast_fp16)[name = tensor("op_2637_cast_fp16")]; tensor var_2638_to_fp16 = const()[name = tensor("op_2638_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_2639_cast_fp16 = add(x = var_2637_cast_fp16, y = var_2638_to_fp16)[name = tensor("op_2639_cast_fp16")]; tensor var_2640_epsilon_0 = const()[name = tensor("op_2640_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_2640_cast_fp16 = rsqrt(epsilon = var_2640_epsilon_0, x = var_2639_cast_fp16)[name = tensor("op_2640_cast_fp16")]; tensor output_273_cast_fp16 = mul(x = x_271, y = var_2640_cast_fp16)[name = tensor("output_273_cast_fp16")]; tensor var_2644_to_fp16 = const()[name = tensor("op_2644_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940436800)))]; tensor output_275_cast_fp16 = mul(x = output_273_cast_fp16, y = var_2644_to_fp16)[name = tensor("output_275_cast_fp16")]; tensor var_2649 = mul(x = output_271_cast_fp16, y = cos_19_palettized)[name = tensor("op_2649")]; tensor x1_45_begin_0 = const()[name = tensor("x1_45_begin_0"), val = tensor([0, 0, 0, 0])]; tensor x1_45_end_0 = const()[name = tensor("x1_45_end_0"), val = tensor([1, 8, 256, 128])]; tensor x1_45_end_mask_0 = const()[name = tensor("x1_45_end_mask_0"), val = tensor([true, true, true, false])]; tensor x1_45 = slice_by_index(begin = x1_45_begin_0, end = x1_45_end_0, end_mask = x1_45_end_mask_0, x = output_271_cast_fp16)[name = tensor("x1_45")]; tensor x2_45_begin_0 = const()[name = tensor("x2_45_begin_0"), val = tensor([0, 0, 0, 128])]; tensor x2_45_end_0 = const()[name = tensor("x2_45_end_0"), val = tensor([1, 8, 256, 256])]; tensor x2_45_end_mask_0 = const()[name = tensor("x2_45_end_mask_0"), val = tensor([true, true, true, true])]; tensor x2_45 = slice_by_index(begin = x2_45_begin_0, end = x2_45_end_0, end_mask = x2_45_end_mask_0, x = output_271_cast_fp16)[name = tensor("x2_45")]; tensor const_288_promoted = const()[name = tensor("const_288_promoted"), val = tensor(-0x1p+0)]; tensor var_2660 = mul(x = x2_45, y = const_288_promoted)[name = tensor("op_2660")]; tensor var_2662_interleave_0 = const()[name = tensor("op_2662_interleave_0"), val = tensor(false)]; tensor var_2662 = concat(axis = var_24, interleave = var_2662_interleave_0, values = (var_2660, x1_45))[name = tensor("op_2662")]; tensor var_2663 = mul(x = var_2662, y = sin_19_palettized)[name = tensor("op_2663")]; tensor query_23 = add(x = var_2649, y = var_2663)[name = tensor("query_23")]; tensor var_2665 = mul(x = output_275_cast_fp16, y = cos_19_palettized)[name = tensor("op_2665")]; tensor x1_47_begin_0 = const()[name = tensor("x1_47_begin_0"), val = tensor([0, 0, 0, 0])]; tensor x1_47_end_0 = const()[name = tensor("x1_47_end_0"), val = tensor([1, 4, 256, 128])]; tensor x1_47_end_mask_0 = const()[name = tensor("x1_47_end_mask_0"), val = tensor([true, true, true, false])]; tensor x1_47 = slice_by_index(begin = x1_47_begin_0, end = x1_47_end_0, end_mask = x1_47_end_mask_0, x = output_275_cast_fp16)[name = tensor("x1_47")]; tensor x2_47_begin_0 = const()[name = tensor("x2_47_begin_0"), val = tensor([0, 0, 0, 128])]; tensor x2_47_end_0 = const()[name = tensor("x2_47_end_0"), val = tensor([1, 4, 256, 256])]; tensor x2_47_end_mask_0 = const()[name = tensor("x2_47_end_mask_0"), val = tensor([true, true, true, true])]; tensor x2_47 = slice_by_index(begin = x2_47_begin_0, end = x2_47_end_0, end_mask = x2_47_end_mask_0, x = output_275_cast_fp16)[name = tensor("x2_47")]; tensor const_291_promoted = const()[name = tensor("const_291_promoted"), val = tensor(-0x1p+0)]; tensor var_2676 = mul(x = x2_47, y = const_291_promoted)[name = tensor("op_2676")]; tensor var_2678_interleave_0 = const()[name = tensor("op_2678_interleave_0"), val = tensor(false)]; tensor var_2678 = concat(axis = var_24, interleave = var_2678_interleave_0, values = (var_2676, x1_47))[name = tensor("op_2678")]; tensor var_2679 = mul(x = var_2678, y = sin_19_palettized)[name = tensor("op_2679")]; tensor hidden_states_157 = add(x = var_2665, y = var_2679)[name = tensor("hidden_states_157")]; tensor var_2688_axes_0 = const()[name = tensor("op_2688_axes_0"), val = tensor([2])]; tensor var_2688 = expand_dims(axes = var_2688_axes_0, x = hidden_states_157)[name = tensor("op_2688")]; tensor hidden_states_159_reps_0 = const()[name = tensor("hidden_states_159_reps_0"), val = tensor([1, 1, 2, 1, 1])]; tensor hidden_states_159 = tile(reps = hidden_states_159_reps_0, x = var_2688)[name = tensor("hidden_states_159")]; tensor var_2696 = const()[name = tensor("op_2696"), val = tensor([1, 8, 256, 256])]; tensor key_states_23 = reshape(shape = var_2696, x = hidden_states_159)[name = tensor("key_states_23")]; tensor var_2705_axes_0 = const()[name = tensor("op_2705_axes_0"), val = tensor([2])]; tensor hidden_states_161 = transpose(perm = hidden_states_161_perm_0, x = var_2617)[name = tensor("transpose_89")]; tensor var_2705 = expand_dims(axes = var_2705_axes_0, x = hidden_states_161)[name = tensor("op_2705")]; tensor hidden_states_163_reps_0 = const()[name = tensor("hidden_states_163_reps_0"), val = tensor([1, 1, 2, 1, 1])]; tensor hidden_states_163 = tile(reps = hidden_states_163_reps_0, x = var_2705)[name = tensor("hidden_states_163")]; tensor var_2713 = const()[name = tensor("op_2713"), val = tensor([1, 8, 256, 256])]; tensor value_states_23 = reshape(shape = var_2713, x = hidden_states_163)[name = tensor("value_states_23")]; tensor var_2716_transpose_x_1 = const()[name = tensor("op_2716_transpose_x_1"), val = tensor(false)]; tensor var_2716_transpose_y_1 = const()[name = tensor("op_2716_transpose_y_1"), val = tensor(true)]; tensor var_2716 = matmul(transpose_x = var_2716_transpose_x_1, transpose_y = var_2716_transpose_y_1, x = query_23, y = key_states_23)[name = tensor("op_2716")]; tensor var_2717_to_fp16 = const()[name = tensor("op_2717_to_fp16"), val = tensor(0x1p-4)]; tensor attn_weights_45_cast_fp16 = mul(x = var_2716, y = var_2717_to_fp16)[name = tensor("attn_weights_45_cast_fp16")]; tensor input_133_cast_fp16 = add(x = attn_weights_45_cast_fp16, y = attention_mask_to_fp16_palettized)[name = tensor("input_133_cast_fp16")]; tensor var_2725_cast_fp16 = softmax(axis = var_24, x = input_133_cast_fp16)[name = tensor("op_2725_cast_fp16")]; tensor attn_output_45_transpose_x_0 = const()[name = tensor("attn_output_45_transpose_x_0"), val = tensor(false)]; tensor attn_output_45_transpose_y_0 = const()[name = tensor("attn_output_45_transpose_y_0"), val = tensor(false)]; tensor attn_output_45 = matmul(transpose_x = attn_output_45_transpose_x_0, transpose_y = attn_output_45_transpose_y_0, x = var_2725_cast_fp16, y = value_states_23)[name = tensor("attn_output_45")]; tensor var_2729_perm_0 = const()[name = tensor("op_2729_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_2731 = const()[name = tensor("op_2731"), val = tensor([1, 256, -1])]; tensor var_2729 = transpose(perm = var_2729_perm_0, x = attn_output_45)[name = tensor("transpose_88")]; tensor var_2732 = reshape(shape = var_2731, x = var_2729)[name = tensor("op_2732")]; tensor x_275 = linear(bias = linear_3_bias_0, weight = wrapped_model_language_model_layers_11_self_attn_o_proj_weight_palettized, x = var_2732)[name = tensor("linear_80")]; tensor var_22_promoted_69_to_fp16 = const()[name = tensor("op_22_promoted_69_to_fp16"), val = tensor(0x1p+1)]; tensor var_2738_cast_fp16 = pow(x = x_275, y = var_22_promoted_69_to_fp16)[name = tensor("op_2738_cast_fp16")]; tensor var_2740_axes_0 = const()[name = tensor("op_2740_axes_0"), val = tensor([-1])]; tensor var_2740_keep_dims_0 = const()[name = tensor("op_2740_keep_dims_0"), val = tensor(true)]; tensor var_2740_cast_fp16 = reduce_mean(axes = var_2740_axes_0, keep_dims = var_2740_keep_dims_0, x = var_2738_cast_fp16)[name = tensor("op_2740_cast_fp16")]; tensor var_2741_to_fp16 = const()[name = tensor("op_2741_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_2742_cast_fp16 = add(x = var_2740_cast_fp16, y = var_2741_to_fp16)[name = tensor("op_2742_cast_fp16")]; tensor var_2743_epsilon_0 = const()[name = tensor("op_2743_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_2743_cast_fp16 = rsqrt(epsilon = var_2743_epsilon_0, x = var_2742_cast_fp16)[name = tensor("op_2743_cast_fp16")]; tensor output_277_cast_fp16 = mul(x = x_275, y = var_2743_cast_fp16)[name = tensor("output_277_cast_fp16")]; tensor var_2747_to_fp16 = const()[name = tensor("op_2747_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940437376)))]; tensor output_279_cast_fp16 = mul(x = output_277_cast_fp16, y = var_2747_to_fp16)[name = tensor("output_279_cast_fp16")]; tensor x_279 = add(x = x_263, y = output_279_cast_fp16)[name = tensor("x_279")]; tensor var_22_promoted_70_to_fp16 = const()[name = tensor("op_22_promoted_70_to_fp16"), val = tensor(0x1p+1)]; tensor var_2753_cast_fp16 = pow(x = x_279, y = var_22_promoted_70_to_fp16)[name = tensor("op_2753_cast_fp16")]; tensor var_2755_axes_0 = const()[name = tensor("op_2755_axes_0"), val = tensor([-1])]; tensor var_2755_keep_dims_0 = const()[name = tensor("op_2755_keep_dims_0"), val = tensor(true)]; tensor var_2755_cast_fp16 = reduce_mean(axes = var_2755_axes_0, keep_dims = var_2755_keep_dims_0, x = var_2753_cast_fp16)[name = tensor("op_2755_cast_fp16")]; tensor var_2756_to_fp16 = const()[name = tensor("op_2756_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_2757_cast_fp16 = add(x = var_2755_cast_fp16, y = var_2756_to_fp16)[name = tensor("op_2757_cast_fp16")]; tensor var_2758_epsilon_0 = const()[name = tensor("op_2758_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_2758_cast_fp16 = rsqrt(epsilon = var_2758_epsilon_0, x = var_2757_cast_fp16)[name = tensor("op_2758_cast_fp16")]; tensor output_281_cast_fp16 = mul(x = x_279, y = var_2758_cast_fp16)[name = tensor("output_281_cast_fp16")]; tensor var_2762_to_fp16 = const()[name = tensor("op_2762_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940442560)))]; tensor output_283_cast_fp16 = mul(x = output_281_cast_fp16, y = var_2762_to_fp16)[name = tensor("output_283_cast_fp16")]; tensor input_141 = linear(bias = linear_4_bias_0, weight = wrapped_model_language_model_layers_11_mlp_gate_proj_weight_palettized, x = output_283_cast_fp16)[name = tensor("linear_81")]; tensor var_2770_mode_0 = const()[name = tensor("op_2770_mode_0"), val = tensor("TANH_APPROXIMATION")]; tensor var_2770 = gelu(mode = var_2770_mode_0, x = input_141)[name = tensor("op_2770")]; tensor var_2772 = linear(bias = linear_4_bias_0, weight = wrapped_model_language_model_layers_11_mlp_up_proj_weight_palettized, x = output_283_cast_fp16)[name = tensor("linear_82")]; tensor input_143 = mul(x = var_2770, y = var_2772)[name = tensor("input_143")]; tensor x_283 = linear(bias = linear_3_bias_0, weight = wrapped_model_language_model_layers_11_mlp_down_proj_weight_palettized, x = input_143)[name = tensor("linear_83")]; tensor var_22_promoted_71_to_fp16 = const()[name = tensor("op_22_promoted_71_to_fp16"), val = tensor(0x1p+1)]; tensor var_2778_cast_fp16 = pow(x = x_283, y = var_22_promoted_71_to_fp16)[name = tensor("op_2778_cast_fp16")]; tensor var_2780_axes_0 = const()[name = tensor("op_2780_axes_0"), val = tensor([-1])]; tensor var_2780_keep_dims_0 = const()[name = tensor("op_2780_keep_dims_0"), val = tensor(true)]; tensor var_2780_cast_fp16 = reduce_mean(axes = var_2780_axes_0, keep_dims = var_2780_keep_dims_0, x = var_2778_cast_fp16)[name = tensor("op_2780_cast_fp16")]; tensor var_2781_to_fp16 = const()[name = tensor("op_2781_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_2782_cast_fp16 = add(x = var_2780_cast_fp16, y = var_2781_to_fp16)[name = tensor("op_2782_cast_fp16")]; tensor var_2783_epsilon_0 = const()[name = tensor("op_2783_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_2783_cast_fp16 = rsqrt(epsilon = var_2783_epsilon_0, x = var_2782_cast_fp16)[name = tensor("op_2783_cast_fp16")]; tensor output_285_cast_fp16 = mul(x = x_283, y = var_2783_cast_fp16)[name = tensor("output_285_cast_fp16")]; tensor var_2787_to_fp16 = const()[name = tensor("op_2787_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940447744)))]; tensor output_287_cast_fp16 = mul(x = output_285_cast_fp16, y = var_2787_to_fp16)[name = tensor("output_287_cast_fp16")]; tensor x_287 = add(x = x_279, y = output_287_cast_fp16)[name = tensor("x_287")]; tensor var_22_promoted_72_to_fp16 = const()[name = tensor("op_22_promoted_72_to_fp16"), val = tensor(0x1p+1)]; tensor var_2799_cast_fp16 = pow(x = x_287, y = var_22_promoted_72_to_fp16)[name = tensor("op_2799_cast_fp16")]; tensor var_2801_axes_0 = const()[name = tensor("op_2801_axes_0"), val = tensor([-1])]; tensor var_2801_keep_dims_0 = const()[name = tensor("op_2801_keep_dims_0"), val = tensor(true)]; tensor var_2801_cast_fp16 = reduce_mean(axes = var_2801_axes_0, keep_dims = var_2801_keep_dims_0, x = var_2799_cast_fp16)[name = tensor("op_2801_cast_fp16")]; tensor var_2802_to_fp16 = const()[name = tensor("op_2802_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_2803_cast_fp16 = add(x = var_2801_cast_fp16, y = var_2802_to_fp16)[name = tensor("op_2803_cast_fp16")]; tensor var_2804_epsilon_0 = const()[name = tensor("op_2804_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_2804_cast_fp16 = rsqrt(epsilon = var_2804_epsilon_0, x = var_2803_cast_fp16)[name = tensor("op_2804_cast_fp16")]; tensor output_289_cast_fp16 = mul(x = x_287, y = var_2804_cast_fp16)[name = tensor("output_289_cast_fp16")]; tensor var_2808_to_fp16 = const()[name = tensor("op_2808_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940452928)))]; tensor output_291_cast_fp16 = mul(x = output_289_cast_fp16, y = var_2808_to_fp16)[name = tensor("output_291_cast_fp16")]; tensor var_2820 = linear(bias = linear_0_bias_0, weight = wrapped_model_language_model_layers_12_self_attn_q_proj_weight_palettized, x = output_291_cast_fp16)[name = tensor("linear_84")]; tensor var_2821 = const()[name = tensor("op_2821"), val = tensor([1, 256, -1, 256])]; tensor var_2822 = reshape(shape = var_2821, x = var_2820)[name = tensor("op_2822")]; tensor x_291_perm_0 = const()[name = tensor("x_291_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_2825 = linear(bias = linear_1_bias_0, weight = wrapped_model_language_model_layers_12_self_attn_k_proj_weight_palettized, x = output_291_cast_fp16)[name = tensor("linear_85")]; tensor var_2826 = const()[name = tensor("op_2826"), val = tensor([1, 256, -1, 256])]; tensor var_2827 = reshape(shape = var_2826, x = var_2825)[name = tensor("op_2827")]; tensor x_295_perm_0 = const()[name = tensor("x_295_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_2830 = linear(bias = linear_1_bias_0, weight = wrapped_model_language_model_layers_12_self_attn_v_proj_weight_palettized, x = output_291_cast_fp16)[name = tensor("linear_86")]; tensor var_2831 = const()[name = tensor("op_2831"), val = tensor([1, 256, -1, 256])]; tensor var_2832 = reshape(shape = var_2831, x = var_2830)[name = tensor("op_2832")]; tensor hidden_states_175_perm_0 = const()[name = tensor("hidden_states_175_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_22_promoted_73_to_fp16 = const()[name = tensor("op_22_promoted_73_to_fp16"), val = tensor(0x1p+1)]; tensor x_291 = transpose(perm = x_291_perm_0, x = var_2822)[name = tensor("transpose_87")]; tensor var_2836_cast_fp16 = pow(x = x_291, y = var_22_promoted_73_to_fp16)[name = tensor("op_2836_cast_fp16")]; tensor var_2838_axes_0 = const()[name = tensor("op_2838_axes_0"), val = tensor([-1])]; tensor var_2838_keep_dims_0 = const()[name = tensor("op_2838_keep_dims_0"), val = tensor(true)]; tensor var_2838_cast_fp16 = reduce_mean(axes = var_2838_axes_0, keep_dims = var_2838_keep_dims_0, x = var_2836_cast_fp16)[name = tensor("op_2838_cast_fp16")]; tensor var_2839_to_fp16 = const()[name = tensor("op_2839_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_2840_cast_fp16 = add(x = var_2838_cast_fp16, y = var_2839_to_fp16)[name = tensor("op_2840_cast_fp16")]; tensor var_2841_epsilon_0 = const()[name = tensor("op_2841_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_2841_cast_fp16 = rsqrt(epsilon = var_2841_epsilon_0, x = var_2840_cast_fp16)[name = tensor("op_2841_cast_fp16")]; tensor output_293_cast_fp16 = mul(x = x_291, y = var_2841_cast_fp16)[name = tensor("output_293_cast_fp16")]; tensor var_2845_to_fp16 = const()[name = tensor("op_2845_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940458112)))]; tensor output_295_cast_fp16 = mul(x = output_293_cast_fp16, y = var_2845_to_fp16)[name = tensor("output_295_cast_fp16")]; tensor var_22_promoted_74_to_fp16 = const()[name = tensor("op_22_promoted_74_to_fp16"), val = tensor(0x1p+1)]; tensor x_295 = transpose(perm = x_295_perm_0, x = var_2827)[name = tensor("transpose_86")]; tensor var_2850_cast_fp16 = pow(x = x_295, y = var_22_promoted_74_to_fp16)[name = tensor("op_2850_cast_fp16")]; tensor var_2852_axes_0 = const()[name = tensor("op_2852_axes_0"), val = tensor([-1])]; tensor var_2852_keep_dims_0 = const()[name = tensor("op_2852_keep_dims_0"), val = tensor(true)]; tensor var_2852_cast_fp16 = reduce_mean(axes = var_2852_axes_0, keep_dims = var_2852_keep_dims_0, x = var_2850_cast_fp16)[name = tensor("op_2852_cast_fp16")]; tensor var_2853_to_fp16 = const()[name = tensor("op_2853_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_2854_cast_fp16 = add(x = var_2852_cast_fp16, y = var_2853_to_fp16)[name = tensor("op_2854_cast_fp16")]; tensor var_2855_epsilon_0 = const()[name = tensor("op_2855_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_2855_cast_fp16 = rsqrt(epsilon = var_2855_epsilon_0, x = var_2854_cast_fp16)[name = tensor("op_2855_cast_fp16")]; tensor output_297_cast_fp16 = mul(x = x_295, y = var_2855_cast_fp16)[name = tensor("output_297_cast_fp16")]; tensor var_2859_to_fp16 = const()[name = tensor("op_2859_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940458688)))]; tensor output_299_cast_fp16 = mul(x = output_297_cast_fp16, y = var_2859_to_fp16)[name = tensor("output_299_cast_fp16")]; tensor var_2864 = mul(x = output_295_cast_fp16, y = cos_7_palettized)[name = tensor("op_2864")]; tensor x1_49_begin_0 = const()[name = tensor("x1_49_begin_0"), val = tensor([0, 0, 0, 0])]; tensor x1_49_end_0 = const()[name = tensor("x1_49_end_0"), val = tensor([1, 8, 256, 128])]; tensor x1_49_end_mask_0 = const()[name = tensor("x1_49_end_mask_0"), val = tensor([true, true, true, false])]; tensor x1_49 = slice_by_index(begin = x1_49_begin_0, end = x1_49_end_0, end_mask = x1_49_end_mask_0, x = output_295_cast_fp16)[name = tensor("x1_49")]; tensor x2_49_begin_0 = const()[name = tensor("x2_49_begin_0"), val = tensor([0, 0, 0, 128])]; tensor x2_49_end_0 = const()[name = tensor("x2_49_end_0"), val = tensor([1, 8, 256, 256])]; tensor x2_49_end_mask_0 = const()[name = tensor("x2_49_end_mask_0"), val = tensor([true, true, true, true])]; tensor x2_49 = slice_by_index(begin = x2_49_begin_0, end = x2_49_end_0, end_mask = x2_49_end_mask_0, x = output_295_cast_fp16)[name = tensor("x2_49")]; tensor const_311_promoted = const()[name = tensor("const_311_promoted"), val = tensor(-0x1p+0)]; tensor var_2875 = mul(x = x2_49, y = const_311_promoted)[name = tensor("op_2875")]; tensor var_2877_interleave_0 = const()[name = tensor("op_2877_interleave_0"), val = tensor(false)]; tensor var_2877 = concat(axis = var_24, interleave = var_2877_interleave_0, values = (var_2875, x1_49))[name = tensor("op_2877")]; tensor var_2878 = mul(x = var_2877, y = sin_7_palettized)[name = tensor("op_2878")]; tensor query_25 = add(x = var_2864, y = var_2878)[name = tensor("query_25")]; tensor var_2880 = mul(x = output_299_cast_fp16, y = cos_7_palettized)[name = tensor("op_2880")]; tensor x1_51_begin_0 = const()[name = tensor("x1_51_begin_0"), val = tensor([0, 0, 0, 0])]; tensor x1_51_end_0 = const()[name = tensor("x1_51_end_0"), val = tensor([1, 4, 256, 128])]; tensor x1_51_end_mask_0 = const()[name = tensor("x1_51_end_mask_0"), val = tensor([true, true, true, false])]; tensor x1_51 = slice_by_index(begin = x1_51_begin_0, end = x1_51_end_0, end_mask = x1_51_end_mask_0, x = output_299_cast_fp16)[name = tensor("x1_51")]; tensor x2_51_begin_0 = const()[name = tensor("x2_51_begin_0"), val = tensor([0, 0, 0, 128])]; tensor x2_51_end_0 = const()[name = tensor("x2_51_end_0"), val = tensor([1, 4, 256, 256])]; tensor x2_51_end_mask_0 = const()[name = tensor("x2_51_end_mask_0"), val = tensor([true, true, true, true])]; tensor x2_51 = slice_by_index(begin = x2_51_begin_0, end = x2_51_end_0, end_mask = x2_51_end_mask_0, x = output_299_cast_fp16)[name = tensor("x2_51")]; tensor const_314_promoted = const()[name = tensor("const_314_promoted"), val = tensor(-0x1p+0)]; tensor var_2891 = mul(x = x2_51, y = const_314_promoted)[name = tensor("op_2891")]; tensor var_2893_interleave_0 = const()[name = tensor("op_2893_interleave_0"), val = tensor(false)]; tensor var_2893 = concat(axis = var_24, interleave = var_2893_interleave_0, values = (var_2891, x1_51))[name = tensor("op_2893")]; tensor var_2894 = mul(x = var_2893, y = sin_7_palettized)[name = tensor("op_2894")]; tensor hidden_states_171 = add(x = var_2880, y = var_2894)[name = tensor("hidden_states_171")]; tensor var_2903_axes_0 = const()[name = tensor("op_2903_axes_0"), val = tensor([2])]; tensor var_2903 = expand_dims(axes = var_2903_axes_0, x = hidden_states_171)[name = tensor("op_2903")]; tensor hidden_states_173_reps_0 = const()[name = tensor("hidden_states_173_reps_0"), val = tensor([1, 1, 2, 1, 1])]; tensor hidden_states_173 = tile(reps = hidden_states_173_reps_0, x = var_2903)[name = tensor("hidden_states_173")]; tensor var_2911 = const()[name = tensor("op_2911"), val = tensor([1, 8, 256, 256])]; tensor key_states_25 = reshape(shape = var_2911, x = hidden_states_173)[name = tensor("key_states_25")]; tensor var_2920_axes_0 = const()[name = tensor("op_2920_axes_0"), val = tensor([2])]; tensor hidden_states_175 = transpose(perm = hidden_states_175_perm_0, x = var_2832)[name = tensor("transpose_85")]; tensor var_2920 = expand_dims(axes = var_2920_axes_0, x = hidden_states_175)[name = tensor("op_2920")]; tensor hidden_states_177_reps_0 = const()[name = tensor("hidden_states_177_reps_0"), val = tensor([1, 1, 2, 1, 1])]; tensor hidden_states_177 = tile(reps = hidden_states_177_reps_0, x = var_2920)[name = tensor("hidden_states_177")]; tensor var_2928 = const()[name = tensor("op_2928"), val = tensor([1, 8, 256, 256])]; tensor value_states_25 = reshape(shape = var_2928, x = hidden_states_177)[name = tensor("value_states_25")]; tensor var_2931_transpose_x_1 = const()[name = tensor("op_2931_transpose_x_1"), val = tensor(false)]; tensor var_2931_transpose_y_1 = const()[name = tensor("op_2931_transpose_y_1"), val = tensor(true)]; tensor var_2931 = matmul(transpose_x = var_2931_transpose_x_1, transpose_y = var_2931_transpose_y_1, x = query_25, y = key_states_25)[name = tensor("op_2931")]; tensor var_2932_to_fp16 = const()[name = tensor("op_2932_to_fp16"), val = tensor(0x1p-4)]; tensor attn_weights_49_cast_fp16 = mul(x = var_2931, y = var_2932_to_fp16)[name = tensor("attn_weights_49_cast_fp16")]; tensor input_145_cast_fp16 = add(x = attn_weights_49_cast_fp16, y = attention_mask_to_fp16_palettized)[name = tensor("input_145_cast_fp16")]; tensor var_2940_cast_fp16 = softmax(axis = var_24, x = input_145_cast_fp16)[name = tensor("op_2940_cast_fp16")]; tensor attn_output_49_transpose_x_0 = const()[name = tensor("attn_output_49_transpose_x_0"), val = tensor(false)]; tensor attn_output_49_transpose_y_0 = const()[name = tensor("attn_output_49_transpose_y_0"), val = tensor(false)]; tensor attn_output_49 = matmul(transpose_x = attn_output_49_transpose_x_0, transpose_y = attn_output_49_transpose_y_0, x = var_2940_cast_fp16, y = value_states_25)[name = tensor("attn_output_49")]; tensor var_2944_perm_0 = const()[name = tensor("op_2944_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_2946 = const()[name = tensor("op_2946"), val = tensor([1, 256, -1])]; tensor var_2944 = transpose(perm = var_2944_perm_0, x = attn_output_49)[name = tensor("transpose_84")]; tensor var_2947 = reshape(shape = var_2946, x = var_2944)[name = tensor("op_2947")]; tensor x_299 = linear(bias = linear_3_bias_0, weight = wrapped_model_language_model_layers_12_self_attn_o_proj_weight_palettized, x = var_2947)[name = tensor("linear_87")]; tensor var_22_promoted_75_to_fp16 = const()[name = tensor("op_22_promoted_75_to_fp16"), val = tensor(0x1p+1)]; tensor var_2953_cast_fp16 = pow(x = x_299, y = var_22_promoted_75_to_fp16)[name = tensor("op_2953_cast_fp16")]; tensor var_2955_axes_0 = const()[name = tensor("op_2955_axes_0"), val = tensor([-1])]; tensor var_2955_keep_dims_0 = const()[name = tensor("op_2955_keep_dims_0"), val = tensor(true)]; tensor var_2955_cast_fp16 = reduce_mean(axes = var_2955_axes_0, keep_dims = var_2955_keep_dims_0, x = var_2953_cast_fp16)[name = tensor("op_2955_cast_fp16")]; tensor var_2956_to_fp16 = const()[name = tensor("op_2956_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_2957_cast_fp16 = add(x = var_2955_cast_fp16, y = var_2956_to_fp16)[name = tensor("op_2957_cast_fp16")]; tensor var_2958_epsilon_0 = const()[name = tensor("op_2958_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_2958_cast_fp16 = rsqrt(epsilon = var_2958_epsilon_0, x = var_2957_cast_fp16)[name = tensor("op_2958_cast_fp16")]; tensor output_301_cast_fp16 = mul(x = x_299, y = var_2958_cast_fp16)[name = tensor("output_301_cast_fp16")]; tensor var_2962_to_fp16 = const()[name = tensor("op_2962_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940459264)))]; tensor output_303_cast_fp16 = mul(x = output_301_cast_fp16, y = var_2962_to_fp16)[name = tensor("output_303_cast_fp16")]; tensor x_303 = add(x = x_287, y = output_303_cast_fp16)[name = tensor("x_303")]; tensor var_22_promoted_76_to_fp16 = const()[name = tensor("op_22_promoted_76_to_fp16"), val = tensor(0x1p+1)]; tensor var_2968_cast_fp16 = pow(x = x_303, y = var_22_promoted_76_to_fp16)[name = tensor("op_2968_cast_fp16")]; tensor var_2970_axes_0 = const()[name = tensor("op_2970_axes_0"), val = tensor([-1])]; tensor var_2970_keep_dims_0 = const()[name = tensor("op_2970_keep_dims_0"), val = tensor(true)]; tensor var_2970_cast_fp16 = reduce_mean(axes = var_2970_axes_0, keep_dims = var_2970_keep_dims_0, x = var_2968_cast_fp16)[name = tensor("op_2970_cast_fp16")]; tensor var_2971_to_fp16 = const()[name = tensor("op_2971_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_2972_cast_fp16 = add(x = var_2970_cast_fp16, y = var_2971_to_fp16)[name = tensor("op_2972_cast_fp16")]; tensor var_2973_epsilon_0 = const()[name = tensor("op_2973_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_2973_cast_fp16 = rsqrt(epsilon = var_2973_epsilon_0, x = var_2972_cast_fp16)[name = tensor("op_2973_cast_fp16")]; tensor output_305_cast_fp16 = mul(x = x_303, y = var_2973_cast_fp16)[name = tensor("output_305_cast_fp16")]; tensor var_2977_to_fp16 = const()[name = tensor("op_2977_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940464448)))]; tensor output_307_cast_fp16 = mul(x = output_305_cast_fp16, y = var_2977_to_fp16)[name = tensor("output_307_cast_fp16")]; tensor input_153 = linear(bias = linear_4_bias_0, weight = wrapped_model_language_model_layers_12_mlp_gate_proj_weight_palettized, x = output_307_cast_fp16)[name = tensor("linear_88")]; tensor var_2985_mode_0 = const()[name = tensor("op_2985_mode_0"), val = tensor("TANH_APPROXIMATION")]; tensor var_2985 = gelu(mode = var_2985_mode_0, x = input_153)[name = tensor("op_2985")]; tensor var_2987 = linear(bias = linear_4_bias_0, weight = wrapped_model_language_model_layers_12_mlp_up_proj_weight_palettized, x = output_307_cast_fp16)[name = tensor("linear_89")]; tensor input_155 = mul(x = var_2985, y = var_2987)[name = tensor("input_155")]; tensor x_307 = linear(bias = linear_3_bias_0, weight = wrapped_model_language_model_layers_12_mlp_down_proj_weight_palettized, x = input_155)[name = tensor("linear_90")]; tensor var_22_promoted_77_to_fp16 = const()[name = tensor("op_22_promoted_77_to_fp16"), val = tensor(0x1p+1)]; tensor var_2993_cast_fp16 = pow(x = x_307, y = var_22_promoted_77_to_fp16)[name = tensor("op_2993_cast_fp16")]; tensor var_2995_axes_0 = const()[name = tensor("op_2995_axes_0"), val = tensor([-1])]; tensor var_2995_keep_dims_0 = const()[name = tensor("op_2995_keep_dims_0"), val = tensor(true)]; tensor var_2995_cast_fp16 = reduce_mean(axes = var_2995_axes_0, keep_dims = var_2995_keep_dims_0, x = var_2993_cast_fp16)[name = tensor("op_2995_cast_fp16")]; tensor var_2996_to_fp16 = const()[name = tensor("op_2996_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_2997_cast_fp16 = add(x = var_2995_cast_fp16, y = var_2996_to_fp16)[name = tensor("op_2997_cast_fp16")]; tensor var_2998_epsilon_0 = const()[name = tensor("op_2998_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_2998_cast_fp16 = rsqrt(epsilon = var_2998_epsilon_0, x = var_2997_cast_fp16)[name = tensor("op_2998_cast_fp16")]; tensor output_309_cast_fp16 = mul(x = x_307, y = var_2998_cast_fp16)[name = tensor("output_309_cast_fp16")]; tensor var_3002_to_fp16 = const()[name = tensor("op_3002_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940469632)))]; tensor output_311_cast_fp16 = mul(x = output_309_cast_fp16, y = var_3002_to_fp16)[name = tensor("output_311_cast_fp16")]; tensor x_311 = add(x = x_303, y = output_311_cast_fp16)[name = tensor("x_311")]; tensor var_22_promoted_78_to_fp16 = const()[name = tensor("op_22_promoted_78_to_fp16"), val = tensor(0x1p+1)]; tensor var_3014_cast_fp16 = pow(x = x_311, y = var_22_promoted_78_to_fp16)[name = tensor("op_3014_cast_fp16")]; tensor var_3016_axes_0 = const()[name = tensor("op_3016_axes_0"), val = tensor([-1])]; tensor var_3016_keep_dims_0 = const()[name = tensor("op_3016_keep_dims_0"), val = tensor(true)]; tensor var_3016_cast_fp16 = reduce_mean(axes = var_3016_axes_0, keep_dims = var_3016_keep_dims_0, x = var_3014_cast_fp16)[name = tensor("op_3016_cast_fp16")]; tensor var_3017_to_fp16 = const()[name = tensor("op_3017_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_3018_cast_fp16 = add(x = var_3016_cast_fp16, y = var_3017_to_fp16)[name = tensor("op_3018_cast_fp16")]; tensor var_3019_epsilon_0 = const()[name = tensor("op_3019_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_3019_cast_fp16 = rsqrt(epsilon = var_3019_epsilon_0, x = var_3018_cast_fp16)[name = tensor("op_3019_cast_fp16")]; tensor output_313_cast_fp16 = mul(x = x_311, y = var_3019_cast_fp16)[name = tensor("output_313_cast_fp16")]; tensor var_3023_to_fp16 = const()[name = tensor("op_3023_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940474816)))]; tensor output_315_cast_fp16 = mul(x = output_313_cast_fp16, y = var_3023_to_fp16)[name = tensor("output_315_cast_fp16")]; tensor var_3035 = linear(bias = linear_0_bias_0, weight = wrapped_model_language_model_layers_13_self_attn_q_proj_weight_palettized, x = output_315_cast_fp16)[name = tensor("linear_91")]; tensor var_3036 = const()[name = tensor("op_3036"), val = tensor([1, 256, -1, 256])]; tensor var_3037 = reshape(shape = var_3036, x = var_3035)[name = tensor("op_3037")]; tensor x_315_perm_0 = const()[name = tensor("x_315_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_3040 = linear(bias = linear_1_bias_0, weight = wrapped_model_language_model_layers_13_self_attn_k_proj_weight_palettized, x = output_315_cast_fp16)[name = tensor("linear_92")]; tensor var_3041 = const()[name = tensor("op_3041"), val = tensor([1, 256, -1, 256])]; tensor var_3042 = reshape(shape = var_3041, x = var_3040)[name = tensor("op_3042")]; tensor x_319_perm_0 = const()[name = tensor("x_319_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_3045 = linear(bias = linear_1_bias_0, weight = wrapped_model_language_model_layers_13_self_attn_v_proj_weight_palettized, x = output_315_cast_fp16)[name = tensor("linear_93")]; tensor var_3046 = const()[name = tensor("op_3046"), val = tensor([1, 256, -1, 256])]; tensor var_3047 = reshape(shape = var_3046, x = var_3045)[name = tensor("op_3047")]; tensor hidden_states_189_perm_0 = const()[name = tensor("hidden_states_189_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_22_promoted_79_to_fp16 = const()[name = tensor("op_22_promoted_79_to_fp16"), val = tensor(0x1p+1)]; tensor x_315 = transpose(perm = x_315_perm_0, x = var_3037)[name = tensor("transpose_83")]; tensor var_3051_cast_fp16 = pow(x = x_315, y = var_22_promoted_79_to_fp16)[name = tensor("op_3051_cast_fp16")]; tensor var_3053_axes_0 = const()[name = tensor("op_3053_axes_0"), val = tensor([-1])]; tensor var_3053_keep_dims_0 = const()[name = tensor("op_3053_keep_dims_0"), val = tensor(true)]; tensor var_3053_cast_fp16 = reduce_mean(axes = var_3053_axes_0, keep_dims = var_3053_keep_dims_0, x = var_3051_cast_fp16)[name = tensor("op_3053_cast_fp16")]; tensor var_3054_to_fp16 = const()[name = tensor("op_3054_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_3055_cast_fp16 = add(x = var_3053_cast_fp16, y = var_3054_to_fp16)[name = tensor("op_3055_cast_fp16")]; tensor var_3056_epsilon_0 = const()[name = tensor("op_3056_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_3056_cast_fp16 = rsqrt(epsilon = var_3056_epsilon_0, x = var_3055_cast_fp16)[name = tensor("op_3056_cast_fp16")]; tensor output_317_cast_fp16 = mul(x = x_315, y = var_3056_cast_fp16)[name = tensor("output_317_cast_fp16")]; tensor var_3060_to_fp16 = const()[name = tensor("op_3060_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940480000)))]; tensor output_319_cast_fp16 = mul(x = output_317_cast_fp16, y = var_3060_to_fp16)[name = tensor("output_319_cast_fp16")]; tensor var_22_promoted_80_to_fp16 = const()[name = tensor("op_22_promoted_80_to_fp16"), val = tensor(0x1p+1)]; tensor x_319 = transpose(perm = x_319_perm_0, x = var_3042)[name = tensor("transpose_82")]; tensor var_3065_cast_fp16 = pow(x = x_319, y = var_22_promoted_80_to_fp16)[name = tensor("op_3065_cast_fp16")]; tensor var_3067_axes_0 = const()[name = tensor("op_3067_axes_0"), val = tensor([-1])]; tensor var_3067_keep_dims_0 = const()[name = tensor("op_3067_keep_dims_0"), val = tensor(true)]; tensor var_3067_cast_fp16 = reduce_mean(axes = var_3067_axes_0, keep_dims = var_3067_keep_dims_0, x = var_3065_cast_fp16)[name = tensor("op_3067_cast_fp16")]; tensor var_3068_to_fp16 = const()[name = tensor("op_3068_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_3069_cast_fp16 = add(x = var_3067_cast_fp16, y = var_3068_to_fp16)[name = tensor("op_3069_cast_fp16")]; tensor var_3070_epsilon_0 = const()[name = tensor("op_3070_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_3070_cast_fp16 = rsqrt(epsilon = var_3070_epsilon_0, x = var_3069_cast_fp16)[name = tensor("op_3070_cast_fp16")]; tensor output_321_cast_fp16 = mul(x = x_319, y = var_3070_cast_fp16)[name = tensor("output_321_cast_fp16")]; tensor var_3074_to_fp16 = const()[name = tensor("op_3074_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940480576)))]; tensor output_323_cast_fp16 = mul(x = output_321_cast_fp16, y = var_3074_to_fp16)[name = tensor("output_323_cast_fp16")]; tensor var_3079 = mul(x = output_319_cast_fp16, y = cos_7_palettized)[name = tensor("op_3079")]; tensor x1_53_begin_0 = const()[name = tensor("x1_53_begin_0"), val = tensor([0, 0, 0, 0])]; tensor x1_53_end_0 = const()[name = tensor("x1_53_end_0"), val = tensor([1, 8, 256, 128])]; tensor x1_53_end_mask_0 = const()[name = tensor("x1_53_end_mask_0"), val = tensor([true, true, true, false])]; tensor x1_53 = slice_by_index(begin = x1_53_begin_0, end = x1_53_end_0, end_mask = x1_53_end_mask_0, x = output_319_cast_fp16)[name = tensor("x1_53")]; tensor x2_53_begin_0 = const()[name = tensor("x2_53_begin_0"), val = tensor([0, 0, 0, 128])]; tensor x2_53_end_0 = const()[name = tensor("x2_53_end_0"), val = tensor([1, 8, 256, 256])]; tensor x2_53_end_mask_0 = const()[name = tensor("x2_53_end_mask_0"), val = tensor([true, true, true, true])]; tensor x2_53 = slice_by_index(begin = x2_53_begin_0, end = x2_53_end_0, end_mask = x2_53_end_mask_0, x = output_319_cast_fp16)[name = tensor("x2_53")]; tensor const_334_promoted = const()[name = tensor("const_334_promoted"), val = tensor(-0x1p+0)]; tensor var_3090 = mul(x = x2_53, y = const_334_promoted)[name = tensor("op_3090")]; tensor var_3092_interleave_0 = const()[name = tensor("op_3092_interleave_0"), val = tensor(false)]; tensor var_3092 = concat(axis = var_24, interleave = var_3092_interleave_0, values = (var_3090, x1_53))[name = tensor("op_3092")]; tensor var_3093 = mul(x = var_3092, y = sin_7_palettized)[name = tensor("op_3093")]; tensor query_27 = add(x = var_3079, y = var_3093)[name = tensor("query_27")]; tensor var_3095 = mul(x = output_323_cast_fp16, y = cos_7_palettized)[name = tensor("op_3095")]; tensor x1_55_begin_0 = const()[name = tensor("x1_55_begin_0"), val = tensor([0, 0, 0, 0])]; tensor x1_55_end_0 = const()[name = tensor("x1_55_end_0"), val = tensor([1, 4, 256, 128])]; tensor x1_55_end_mask_0 = const()[name = tensor("x1_55_end_mask_0"), val = tensor([true, true, true, false])]; tensor x1_55 = slice_by_index(begin = x1_55_begin_0, end = x1_55_end_0, end_mask = x1_55_end_mask_0, x = output_323_cast_fp16)[name = tensor("x1_55")]; tensor x2_55_begin_0 = const()[name = tensor("x2_55_begin_0"), val = tensor([0, 0, 0, 128])]; tensor x2_55_end_0 = const()[name = tensor("x2_55_end_0"), val = tensor([1, 4, 256, 256])]; tensor x2_55_end_mask_0 = const()[name = tensor("x2_55_end_mask_0"), val = tensor([true, true, true, true])]; tensor x2_55 = slice_by_index(begin = x2_55_begin_0, end = x2_55_end_0, end_mask = x2_55_end_mask_0, x = output_323_cast_fp16)[name = tensor("x2_55")]; tensor const_337_promoted = const()[name = tensor("const_337_promoted"), val = tensor(-0x1p+0)]; tensor var_3106 = mul(x = x2_55, y = const_337_promoted)[name = tensor("op_3106")]; tensor var_3108_interleave_0 = const()[name = tensor("op_3108_interleave_0"), val = tensor(false)]; tensor var_3108 = concat(axis = var_24, interleave = var_3108_interleave_0, values = (var_3106, x1_55))[name = tensor("op_3108")]; tensor var_3109 = mul(x = var_3108, y = sin_7_palettized)[name = tensor("op_3109")]; tensor hidden_states_185 = add(x = var_3095, y = var_3109)[name = tensor("hidden_states_185")]; tensor var_3118_axes_0 = const()[name = tensor("op_3118_axes_0"), val = tensor([2])]; tensor var_3118 = expand_dims(axes = var_3118_axes_0, x = hidden_states_185)[name = tensor("op_3118")]; tensor hidden_states_187_reps_0 = const()[name = tensor("hidden_states_187_reps_0"), val = tensor([1, 1, 2, 1, 1])]; tensor hidden_states_187 = tile(reps = hidden_states_187_reps_0, x = var_3118)[name = tensor("hidden_states_187")]; tensor var_3126 = const()[name = tensor("op_3126"), val = tensor([1, 8, 256, 256])]; tensor key_states_27 = reshape(shape = var_3126, x = hidden_states_187)[name = tensor("key_states_27")]; tensor var_3135_axes_0 = const()[name = tensor("op_3135_axes_0"), val = tensor([2])]; tensor hidden_states_189 = transpose(perm = hidden_states_189_perm_0, x = var_3047)[name = tensor("transpose_81")]; tensor var_3135 = expand_dims(axes = var_3135_axes_0, x = hidden_states_189)[name = tensor("op_3135")]; tensor hidden_states_191_reps_0 = const()[name = tensor("hidden_states_191_reps_0"), val = tensor([1, 1, 2, 1, 1])]; tensor hidden_states_191 = tile(reps = hidden_states_191_reps_0, x = var_3135)[name = tensor("hidden_states_191")]; tensor var_3143 = const()[name = tensor("op_3143"), val = tensor([1, 8, 256, 256])]; tensor value_states_27 = reshape(shape = var_3143, x = hidden_states_191)[name = tensor("value_states_27")]; tensor var_3146_transpose_x_1 = const()[name = tensor("op_3146_transpose_x_1"), val = tensor(false)]; tensor var_3146_transpose_y_1 = const()[name = tensor("op_3146_transpose_y_1"), val = tensor(true)]; tensor var_3146 = matmul(transpose_x = var_3146_transpose_x_1, transpose_y = var_3146_transpose_y_1, x = query_27, y = key_states_27)[name = tensor("op_3146")]; tensor var_3147_to_fp16 = const()[name = tensor("op_3147_to_fp16"), val = tensor(0x1p-4)]; tensor attn_weights_53_cast_fp16 = mul(x = var_3146, y = var_3147_to_fp16)[name = tensor("attn_weights_53_cast_fp16")]; tensor input_157_cast_fp16 = add(x = attn_weights_53_cast_fp16, y = attention_mask_to_fp16_palettized)[name = tensor("input_157_cast_fp16")]; tensor var_3155_cast_fp16 = softmax(axis = var_24, x = input_157_cast_fp16)[name = tensor("op_3155_cast_fp16")]; tensor attn_output_53_transpose_x_0 = const()[name = tensor("attn_output_53_transpose_x_0"), val = tensor(false)]; tensor attn_output_53_transpose_y_0 = const()[name = tensor("attn_output_53_transpose_y_0"), val = tensor(false)]; tensor attn_output_53 = matmul(transpose_x = attn_output_53_transpose_x_0, transpose_y = attn_output_53_transpose_y_0, x = var_3155_cast_fp16, y = value_states_27)[name = tensor("attn_output_53")]; tensor var_3159_perm_0 = const()[name = tensor("op_3159_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_3161 = const()[name = tensor("op_3161"), val = tensor([1, 256, -1])]; tensor var_3159 = transpose(perm = var_3159_perm_0, x = attn_output_53)[name = tensor("transpose_80")]; tensor var_3162 = reshape(shape = var_3161, x = var_3159)[name = tensor("op_3162")]; tensor x_323 = linear(bias = linear_3_bias_0, weight = wrapped_model_language_model_layers_13_self_attn_o_proj_weight_palettized, x = var_3162)[name = tensor("linear_94")]; tensor var_22_promoted_81_to_fp16 = const()[name = tensor("op_22_promoted_81_to_fp16"), val = tensor(0x1p+1)]; tensor var_3168_cast_fp16 = pow(x = x_323, y = var_22_promoted_81_to_fp16)[name = tensor("op_3168_cast_fp16")]; tensor var_3170_axes_0 = const()[name = tensor("op_3170_axes_0"), val = tensor([-1])]; tensor var_3170_keep_dims_0 = const()[name = tensor("op_3170_keep_dims_0"), val = tensor(true)]; tensor var_3170_cast_fp16 = reduce_mean(axes = var_3170_axes_0, keep_dims = var_3170_keep_dims_0, x = var_3168_cast_fp16)[name = tensor("op_3170_cast_fp16")]; tensor var_3171_to_fp16 = const()[name = tensor("op_3171_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_3172_cast_fp16 = add(x = var_3170_cast_fp16, y = var_3171_to_fp16)[name = tensor("op_3172_cast_fp16")]; tensor var_3173_epsilon_0 = const()[name = tensor("op_3173_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_3173_cast_fp16 = rsqrt(epsilon = var_3173_epsilon_0, x = var_3172_cast_fp16)[name = tensor("op_3173_cast_fp16")]; tensor output_325_cast_fp16 = mul(x = x_323, y = var_3173_cast_fp16)[name = tensor("output_325_cast_fp16")]; tensor var_3177_to_fp16 = const()[name = tensor("op_3177_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940481152)))]; tensor output_327_cast_fp16 = mul(x = output_325_cast_fp16, y = var_3177_to_fp16)[name = tensor("output_327_cast_fp16")]; tensor x_327 = add(x = x_311, y = output_327_cast_fp16)[name = tensor("x_327")]; tensor var_22_promoted_82_to_fp16 = const()[name = tensor("op_22_promoted_82_to_fp16"), val = tensor(0x1p+1)]; tensor var_3183_cast_fp16 = pow(x = x_327, y = var_22_promoted_82_to_fp16)[name = tensor("op_3183_cast_fp16")]; tensor var_3185_axes_0 = const()[name = tensor("op_3185_axes_0"), val = tensor([-1])]; tensor var_3185_keep_dims_0 = const()[name = tensor("op_3185_keep_dims_0"), val = tensor(true)]; tensor var_3185_cast_fp16 = reduce_mean(axes = var_3185_axes_0, keep_dims = var_3185_keep_dims_0, x = var_3183_cast_fp16)[name = tensor("op_3185_cast_fp16")]; tensor var_3186_to_fp16 = const()[name = tensor("op_3186_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_3187_cast_fp16 = add(x = var_3185_cast_fp16, y = var_3186_to_fp16)[name = tensor("op_3187_cast_fp16")]; tensor var_3188_epsilon_0 = const()[name = tensor("op_3188_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_3188_cast_fp16 = rsqrt(epsilon = var_3188_epsilon_0, x = var_3187_cast_fp16)[name = tensor("op_3188_cast_fp16")]; tensor output_329_cast_fp16 = mul(x = x_327, y = var_3188_cast_fp16)[name = tensor("output_329_cast_fp16")]; tensor var_3192_to_fp16 = const()[name = tensor("op_3192_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940486336)))]; tensor output_331_cast_fp16 = mul(x = output_329_cast_fp16, y = var_3192_to_fp16)[name = tensor("output_331_cast_fp16")]; tensor input_165 = linear(bias = linear_4_bias_0, weight = wrapped_model_language_model_layers_13_mlp_gate_proj_weight_palettized, x = output_331_cast_fp16)[name = tensor("linear_95")]; tensor var_3200_mode_0 = const()[name = tensor("op_3200_mode_0"), val = tensor("TANH_APPROXIMATION")]; tensor var_3200 = gelu(mode = var_3200_mode_0, x = input_165)[name = tensor("op_3200")]; tensor var_3202 = linear(bias = linear_4_bias_0, weight = wrapped_model_language_model_layers_13_mlp_up_proj_weight_palettized, x = output_331_cast_fp16)[name = tensor("linear_96")]; tensor input_167 = mul(x = var_3200, y = var_3202)[name = tensor("input_167")]; tensor x_331 = linear(bias = linear_3_bias_0, weight = wrapped_model_language_model_layers_13_mlp_down_proj_weight_palettized, x = input_167)[name = tensor("linear_97")]; tensor var_22_promoted_83_to_fp16 = const()[name = tensor("op_22_promoted_83_to_fp16"), val = tensor(0x1p+1)]; tensor var_3208_cast_fp16 = pow(x = x_331, y = var_22_promoted_83_to_fp16)[name = tensor("op_3208_cast_fp16")]; tensor var_3210_axes_0 = const()[name = tensor("op_3210_axes_0"), val = tensor([-1])]; tensor var_3210_keep_dims_0 = const()[name = tensor("op_3210_keep_dims_0"), val = tensor(true)]; tensor var_3210_cast_fp16 = reduce_mean(axes = var_3210_axes_0, keep_dims = var_3210_keep_dims_0, x = var_3208_cast_fp16)[name = tensor("op_3210_cast_fp16")]; tensor var_3211_to_fp16 = const()[name = tensor("op_3211_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_3212_cast_fp16 = add(x = var_3210_cast_fp16, y = var_3211_to_fp16)[name = tensor("op_3212_cast_fp16")]; tensor var_3213_epsilon_0 = const()[name = tensor("op_3213_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_3213_cast_fp16 = rsqrt(epsilon = var_3213_epsilon_0, x = var_3212_cast_fp16)[name = tensor("op_3213_cast_fp16")]; tensor output_333_cast_fp16 = mul(x = x_331, y = var_3213_cast_fp16)[name = tensor("output_333_cast_fp16")]; tensor var_3217_to_fp16 = const()[name = tensor("op_3217_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940491520)))]; tensor output_335_cast_fp16 = mul(x = output_333_cast_fp16, y = var_3217_to_fp16)[name = tensor("output_335_cast_fp16")]; tensor x_335 = add(x = x_327, y = output_335_cast_fp16)[name = tensor("x_335")]; tensor var_22_promoted_84_to_fp16 = const()[name = tensor("op_22_promoted_84_to_fp16"), val = tensor(0x1p+1)]; tensor var_3229_cast_fp16 = pow(x = x_335, y = var_22_promoted_84_to_fp16)[name = tensor("op_3229_cast_fp16")]; tensor var_3231_axes_0 = const()[name = tensor("op_3231_axes_0"), val = tensor([-1])]; tensor var_3231_keep_dims_0 = const()[name = tensor("op_3231_keep_dims_0"), val = tensor(true)]; tensor var_3231_cast_fp16 = reduce_mean(axes = var_3231_axes_0, keep_dims = var_3231_keep_dims_0, x = var_3229_cast_fp16)[name = tensor("op_3231_cast_fp16")]; tensor var_3232_to_fp16 = const()[name = tensor("op_3232_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_3233_cast_fp16 = add(x = var_3231_cast_fp16, y = var_3232_to_fp16)[name = tensor("op_3233_cast_fp16")]; tensor var_3234_epsilon_0 = const()[name = tensor("op_3234_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_3234_cast_fp16 = rsqrt(epsilon = var_3234_epsilon_0, x = var_3233_cast_fp16)[name = tensor("op_3234_cast_fp16")]; tensor output_337_cast_fp16 = mul(x = x_335, y = var_3234_cast_fp16)[name = tensor("output_337_cast_fp16")]; tensor var_3238_to_fp16 = const()[name = tensor("op_3238_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940496704)))]; tensor output_339_cast_fp16 = mul(x = output_337_cast_fp16, y = var_3238_to_fp16)[name = tensor("output_339_cast_fp16")]; tensor var_3250 = linear(bias = linear_0_bias_0, weight = wrapped_model_language_model_layers_14_self_attn_q_proj_weight_palettized, x = output_339_cast_fp16)[name = tensor("linear_98")]; tensor var_3251 = const()[name = tensor("op_3251"), val = tensor([1, 256, -1, 256])]; tensor var_3252 = reshape(shape = var_3251, x = var_3250)[name = tensor("op_3252")]; tensor x_339_perm_0 = const()[name = tensor("x_339_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_3255 = linear(bias = linear_1_bias_0, weight = wrapped_model_language_model_layers_14_self_attn_k_proj_weight_palettized, x = output_339_cast_fp16)[name = tensor("linear_99")]; tensor var_3256 = const()[name = tensor("op_3256"), val = tensor([1, 256, -1, 256])]; tensor var_3257 = reshape(shape = var_3256, x = var_3255)[name = tensor("op_3257")]; tensor x_343_perm_0 = const()[name = tensor("x_343_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_3260 = linear(bias = linear_1_bias_0, weight = wrapped_model_language_model_layers_14_self_attn_v_proj_weight_palettized, x = output_339_cast_fp16)[name = tensor("linear_100")]; tensor var_3261 = const()[name = tensor("op_3261"), val = tensor([1, 256, -1, 256])]; tensor var_3262 = reshape(shape = var_3261, x = var_3260)[name = tensor("op_3262")]; tensor hidden_states_203_perm_0 = const()[name = tensor("hidden_states_203_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_22_promoted_85_to_fp16 = const()[name = tensor("op_22_promoted_85_to_fp16"), val = tensor(0x1p+1)]; tensor x_339 = transpose(perm = x_339_perm_0, x = var_3252)[name = tensor("transpose_79")]; tensor var_3266_cast_fp16 = pow(x = x_339, y = var_22_promoted_85_to_fp16)[name = tensor("op_3266_cast_fp16")]; tensor var_3268_axes_0 = const()[name = tensor("op_3268_axes_0"), val = tensor([-1])]; tensor var_3268_keep_dims_0 = const()[name = tensor("op_3268_keep_dims_0"), val = tensor(true)]; tensor var_3268_cast_fp16 = reduce_mean(axes = var_3268_axes_0, keep_dims = var_3268_keep_dims_0, x = var_3266_cast_fp16)[name = tensor("op_3268_cast_fp16")]; tensor var_3269_to_fp16 = const()[name = tensor("op_3269_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_3270_cast_fp16 = add(x = var_3268_cast_fp16, y = var_3269_to_fp16)[name = tensor("op_3270_cast_fp16")]; tensor var_3271_epsilon_0 = const()[name = tensor("op_3271_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_3271_cast_fp16 = rsqrt(epsilon = var_3271_epsilon_0, x = var_3270_cast_fp16)[name = tensor("op_3271_cast_fp16")]; tensor output_341_cast_fp16 = mul(x = x_339, y = var_3271_cast_fp16)[name = tensor("output_341_cast_fp16")]; tensor var_3275_to_fp16 = const()[name = tensor("op_3275_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940501888)))]; tensor output_343_cast_fp16 = mul(x = output_341_cast_fp16, y = var_3275_to_fp16)[name = tensor("output_343_cast_fp16")]; tensor var_22_promoted_86_to_fp16 = const()[name = tensor("op_22_promoted_86_to_fp16"), val = tensor(0x1p+1)]; tensor x_343 = transpose(perm = x_343_perm_0, x = var_3257)[name = tensor("transpose_78")]; tensor var_3280_cast_fp16 = pow(x = x_343, y = var_22_promoted_86_to_fp16)[name = tensor("op_3280_cast_fp16")]; tensor var_3282_axes_0 = const()[name = tensor("op_3282_axes_0"), val = tensor([-1])]; tensor var_3282_keep_dims_0 = const()[name = tensor("op_3282_keep_dims_0"), val = tensor(true)]; tensor var_3282_cast_fp16 = reduce_mean(axes = var_3282_axes_0, keep_dims = var_3282_keep_dims_0, x = var_3280_cast_fp16)[name = tensor("op_3282_cast_fp16")]; tensor var_3283_to_fp16 = const()[name = tensor("op_3283_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_3284_cast_fp16 = add(x = var_3282_cast_fp16, y = var_3283_to_fp16)[name = tensor("op_3284_cast_fp16")]; tensor var_3285_epsilon_0 = const()[name = tensor("op_3285_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_3285_cast_fp16 = rsqrt(epsilon = var_3285_epsilon_0, x = var_3284_cast_fp16)[name = tensor("op_3285_cast_fp16")]; tensor output_345_cast_fp16 = mul(x = x_343, y = var_3285_cast_fp16)[name = tensor("output_345_cast_fp16")]; tensor var_3289_to_fp16 = const()[name = tensor("op_3289_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940502464)))]; tensor output_347_cast_fp16 = mul(x = output_345_cast_fp16, y = var_3289_to_fp16)[name = tensor("output_347_cast_fp16")]; tensor var_3294 = mul(x = output_343_cast_fp16, y = cos_7_palettized)[name = tensor("op_3294")]; tensor x1_57_begin_0 = const()[name = tensor("x1_57_begin_0"), val = tensor([0, 0, 0, 0])]; tensor x1_57_end_0 = const()[name = tensor("x1_57_end_0"), val = tensor([1, 8, 256, 128])]; tensor x1_57_end_mask_0 = const()[name = tensor("x1_57_end_mask_0"), val = tensor([true, true, true, false])]; tensor x1_57 = slice_by_index(begin = x1_57_begin_0, end = x1_57_end_0, end_mask = x1_57_end_mask_0, x = output_343_cast_fp16)[name = tensor("x1_57")]; tensor x2_57_begin_0 = const()[name = tensor("x2_57_begin_0"), val = tensor([0, 0, 0, 128])]; tensor x2_57_end_0 = const()[name = tensor("x2_57_end_0"), val = tensor([1, 8, 256, 256])]; tensor x2_57_end_mask_0 = const()[name = tensor("x2_57_end_mask_0"), val = tensor([true, true, true, true])]; tensor x2_57 = slice_by_index(begin = x2_57_begin_0, end = x2_57_end_0, end_mask = x2_57_end_mask_0, x = output_343_cast_fp16)[name = tensor("x2_57")]; tensor const_357_promoted = const()[name = tensor("const_357_promoted"), val = tensor(-0x1p+0)]; tensor var_3305 = mul(x = x2_57, y = const_357_promoted)[name = tensor("op_3305")]; tensor var_3307_interleave_0 = const()[name = tensor("op_3307_interleave_0"), val = tensor(false)]; tensor var_3307 = concat(axis = var_24, interleave = var_3307_interleave_0, values = (var_3305, x1_57))[name = tensor("op_3307")]; tensor var_3308 = mul(x = var_3307, y = sin_7_palettized)[name = tensor("op_3308")]; tensor query_29 = add(x = var_3294, y = var_3308)[name = tensor("query_29")]; tensor var_3310 = mul(x = output_347_cast_fp16, y = cos_7_palettized)[name = tensor("op_3310")]; tensor x1_59_begin_0 = const()[name = tensor("x1_59_begin_0"), val = tensor([0, 0, 0, 0])]; tensor x1_59_end_0 = const()[name = tensor("x1_59_end_0"), val = tensor([1, 4, 256, 128])]; tensor x1_59_end_mask_0 = const()[name = tensor("x1_59_end_mask_0"), val = tensor([true, true, true, false])]; tensor x1_59 = slice_by_index(begin = x1_59_begin_0, end = x1_59_end_0, end_mask = x1_59_end_mask_0, x = output_347_cast_fp16)[name = tensor("x1_59")]; tensor x2_59_begin_0 = const()[name = tensor("x2_59_begin_0"), val = tensor([0, 0, 0, 128])]; tensor x2_59_end_0 = const()[name = tensor("x2_59_end_0"), val = tensor([1, 4, 256, 256])]; tensor x2_59_end_mask_0 = const()[name = tensor("x2_59_end_mask_0"), val = tensor([true, true, true, true])]; tensor x2_59 = slice_by_index(begin = x2_59_begin_0, end = x2_59_end_0, end_mask = x2_59_end_mask_0, x = output_347_cast_fp16)[name = tensor("x2_59")]; tensor const_360_promoted = const()[name = tensor("const_360_promoted"), val = tensor(-0x1p+0)]; tensor var_3321 = mul(x = x2_59, y = const_360_promoted)[name = tensor("op_3321")]; tensor var_3323_interleave_0 = const()[name = tensor("op_3323_interleave_0"), val = tensor(false)]; tensor var_3323 = concat(axis = var_24, interleave = var_3323_interleave_0, values = (var_3321, x1_59))[name = tensor("op_3323")]; tensor var_3324 = mul(x = var_3323, y = sin_7_palettized)[name = tensor("op_3324")]; tensor hidden_states_199 = add(x = var_3310, y = var_3324)[name = tensor("hidden_states_199")]; tensor var_3333_axes_0 = const()[name = tensor("op_3333_axes_0"), val = tensor([2])]; tensor var_3333 = expand_dims(axes = var_3333_axes_0, x = hidden_states_199)[name = tensor("op_3333")]; tensor hidden_states_201_reps_0 = const()[name = tensor("hidden_states_201_reps_0"), val = tensor([1, 1, 2, 1, 1])]; tensor hidden_states_201 = tile(reps = hidden_states_201_reps_0, x = var_3333)[name = tensor("hidden_states_201")]; tensor var_3341 = const()[name = tensor("op_3341"), val = tensor([1, 8, 256, 256])]; tensor key_states_29 = reshape(shape = var_3341, x = hidden_states_201)[name = tensor("key_states_29")]; tensor var_3350_axes_0 = const()[name = tensor("op_3350_axes_0"), val = tensor([2])]; tensor hidden_states_203 = transpose(perm = hidden_states_203_perm_0, x = var_3262)[name = tensor("transpose_77")]; tensor var_3350 = expand_dims(axes = var_3350_axes_0, x = hidden_states_203)[name = tensor("op_3350")]; tensor hidden_states_205_reps_0 = const()[name = tensor("hidden_states_205_reps_0"), val = tensor([1, 1, 2, 1, 1])]; tensor hidden_states_205 = tile(reps = hidden_states_205_reps_0, x = var_3350)[name = tensor("hidden_states_205")]; tensor var_3358 = const()[name = tensor("op_3358"), val = tensor([1, 8, 256, 256])]; tensor value_states_29 = reshape(shape = var_3358, x = hidden_states_205)[name = tensor("value_states_29")]; tensor var_3361_transpose_x_1 = const()[name = tensor("op_3361_transpose_x_1"), val = tensor(false)]; tensor var_3361_transpose_y_1 = const()[name = tensor("op_3361_transpose_y_1"), val = tensor(true)]; tensor var_3361 = matmul(transpose_x = var_3361_transpose_x_1, transpose_y = var_3361_transpose_y_1, x = query_29, y = key_states_29)[name = tensor("op_3361")]; tensor var_3362_to_fp16 = const()[name = tensor("op_3362_to_fp16"), val = tensor(0x1p-4)]; tensor attn_weights_57_cast_fp16 = mul(x = var_3361, y = var_3362_to_fp16)[name = tensor("attn_weights_57_cast_fp16")]; tensor input_169_cast_fp16 = add(x = attn_weights_57_cast_fp16, y = attention_mask_to_fp16_palettized)[name = tensor("input_169_cast_fp16")]; tensor var_3370_cast_fp16 = softmax(axis = var_24, x = input_169_cast_fp16)[name = tensor("op_3370_cast_fp16")]; tensor attn_output_57_transpose_x_0 = const()[name = tensor("attn_output_57_transpose_x_0"), val = tensor(false)]; tensor attn_output_57_transpose_y_0 = const()[name = tensor("attn_output_57_transpose_y_0"), val = tensor(false)]; tensor attn_output_57 = matmul(transpose_x = attn_output_57_transpose_x_0, transpose_y = attn_output_57_transpose_y_0, x = var_3370_cast_fp16, y = value_states_29)[name = tensor("attn_output_57")]; tensor var_3374_perm_0 = const()[name = tensor("op_3374_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_3376 = const()[name = tensor("op_3376"), val = tensor([1, 256, -1])]; tensor var_3374 = transpose(perm = var_3374_perm_0, x = attn_output_57)[name = tensor("transpose_76")]; tensor var_3377 = reshape(shape = var_3376, x = var_3374)[name = tensor("op_3377")]; tensor x_347 = linear(bias = linear_3_bias_0, weight = wrapped_model_language_model_layers_14_self_attn_o_proj_weight_palettized, x = var_3377)[name = tensor("linear_101")]; tensor var_22_promoted_87_to_fp16 = const()[name = tensor("op_22_promoted_87_to_fp16"), val = tensor(0x1p+1)]; tensor var_3383_cast_fp16 = pow(x = x_347, y = var_22_promoted_87_to_fp16)[name = tensor("op_3383_cast_fp16")]; tensor var_3385_axes_0 = const()[name = tensor("op_3385_axes_0"), val = tensor([-1])]; tensor var_3385_keep_dims_0 = const()[name = tensor("op_3385_keep_dims_0"), val = tensor(true)]; tensor var_3385_cast_fp16 = reduce_mean(axes = var_3385_axes_0, keep_dims = var_3385_keep_dims_0, x = var_3383_cast_fp16)[name = tensor("op_3385_cast_fp16")]; tensor var_3386_to_fp16 = const()[name = tensor("op_3386_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_3387_cast_fp16 = add(x = var_3385_cast_fp16, y = var_3386_to_fp16)[name = tensor("op_3387_cast_fp16")]; tensor var_3388_epsilon_0 = const()[name = tensor("op_3388_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_3388_cast_fp16 = rsqrt(epsilon = var_3388_epsilon_0, x = var_3387_cast_fp16)[name = tensor("op_3388_cast_fp16")]; tensor output_349_cast_fp16 = mul(x = x_347, y = var_3388_cast_fp16)[name = tensor("output_349_cast_fp16")]; tensor var_3392_to_fp16 = const()[name = tensor("op_3392_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940503040)))]; tensor output_351_cast_fp16 = mul(x = output_349_cast_fp16, y = var_3392_to_fp16)[name = tensor("output_351_cast_fp16")]; tensor x_351 = add(x = x_335, y = output_351_cast_fp16)[name = tensor("x_351")]; tensor var_22_promoted_88_to_fp16 = const()[name = tensor("op_22_promoted_88_to_fp16"), val = tensor(0x1p+1)]; tensor var_3398_cast_fp16 = pow(x = x_351, y = var_22_promoted_88_to_fp16)[name = tensor("op_3398_cast_fp16")]; tensor var_3400_axes_0 = const()[name = tensor("op_3400_axes_0"), val = tensor([-1])]; tensor var_3400_keep_dims_0 = const()[name = tensor("op_3400_keep_dims_0"), val = tensor(true)]; tensor var_3400_cast_fp16 = reduce_mean(axes = var_3400_axes_0, keep_dims = var_3400_keep_dims_0, x = var_3398_cast_fp16)[name = tensor("op_3400_cast_fp16")]; tensor var_3401_to_fp16 = const()[name = tensor("op_3401_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_3402_cast_fp16 = add(x = var_3400_cast_fp16, y = var_3401_to_fp16)[name = tensor("op_3402_cast_fp16")]; tensor var_3403_epsilon_0 = const()[name = tensor("op_3403_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_3403_cast_fp16 = rsqrt(epsilon = var_3403_epsilon_0, x = var_3402_cast_fp16)[name = tensor("op_3403_cast_fp16")]; tensor output_353_cast_fp16 = mul(x = x_351, y = var_3403_cast_fp16)[name = tensor("output_353_cast_fp16")]; tensor var_3407_to_fp16 = const()[name = tensor("op_3407_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940508224)))]; tensor output_355_cast_fp16 = mul(x = output_353_cast_fp16, y = var_3407_to_fp16)[name = tensor("output_355_cast_fp16")]; tensor input_177 = linear(bias = linear_4_bias_0, weight = wrapped_model_language_model_layers_14_mlp_gate_proj_weight_palettized, x = output_355_cast_fp16)[name = tensor("linear_102")]; tensor var_3415_mode_0 = const()[name = tensor("op_3415_mode_0"), val = tensor("TANH_APPROXIMATION")]; tensor var_3415 = gelu(mode = var_3415_mode_0, x = input_177)[name = tensor("op_3415")]; tensor var_3417 = linear(bias = linear_4_bias_0, weight = wrapped_model_language_model_layers_14_mlp_up_proj_weight_palettized, x = output_355_cast_fp16)[name = tensor("linear_103")]; tensor input_179 = mul(x = var_3415, y = var_3417)[name = tensor("input_179")]; tensor x_355 = linear(bias = linear_3_bias_0, weight = wrapped_model_language_model_layers_14_mlp_down_proj_weight_palettized, x = input_179)[name = tensor("linear_104")]; tensor var_22_promoted_89_to_fp16 = const()[name = tensor("op_22_promoted_89_to_fp16"), val = tensor(0x1p+1)]; tensor var_3423_cast_fp16 = pow(x = x_355, y = var_22_promoted_89_to_fp16)[name = tensor("op_3423_cast_fp16")]; tensor var_3425_axes_0 = const()[name = tensor("op_3425_axes_0"), val = tensor([-1])]; tensor var_3425_keep_dims_0 = const()[name = tensor("op_3425_keep_dims_0"), val = tensor(true)]; tensor var_3425_cast_fp16 = reduce_mean(axes = var_3425_axes_0, keep_dims = var_3425_keep_dims_0, x = var_3423_cast_fp16)[name = tensor("op_3425_cast_fp16")]; tensor var_3426_to_fp16 = const()[name = tensor("op_3426_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_3427_cast_fp16 = add(x = var_3425_cast_fp16, y = var_3426_to_fp16)[name = tensor("op_3427_cast_fp16")]; tensor var_3428_epsilon_0 = const()[name = tensor("op_3428_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_3428_cast_fp16 = rsqrt(epsilon = var_3428_epsilon_0, x = var_3427_cast_fp16)[name = tensor("op_3428_cast_fp16")]; tensor output_357_cast_fp16 = mul(x = x_355, y = var_3428_cast_fp16)[name = tensor("output_357_cast_fp16")]; tensor var_3432_to_fp16 = const()[name = tensor("op_3432_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940513408)))]; tensor output_359_cast_fp16 = mul(x = output_357_cast_fp16, y = var_3432_to_fp16)[name = tensor("output_359_cast_fp16")]; tensor x_359 = add(x = x_351, y = output_359_cast_fp16)[name = tensor("x_359")]; tensor var_22_promoted_90_to_fp16 = const()[name = tensor("op_22_promoted_90_to_fp16"), val = tensor(0x1p+1)]; tensor var_3444_cast_fp16 = pow(x = x_359, y = var_22_promoted_90_to_fp16)[name = tensor("op_3444_cast_fp16")]; tensor var_3446_axes_0 = const()[name = tensor("op_3446_axes_0"), val = tensor([-1])]; tensor var_3446_keep_dims_0 = const()[name = tensor("op_3446_keep_dims_0"), val = tensor(true)]; tensor var_3446_cast_fp16 = reduce_mean(axes = var_3446_axes_0, keep_dims = var_3446_keep_dims_0, x = var_3444_cast_fp16)[name = tensor("op_3446_cast_fp16")]; tensor var_3447_to_fp16 = const()[name = tensor("op_3447_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_3448_cast_fp16 = add(x = var_3446_cast_fp16, y = var_3447_to_fp16)[name = tensor("op_3448_cast_fp16")]; tensor var_3449_epsilon_0 = const()[name = tensor("op_3449_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_3449_cast_fp16 = rsqrt(epsilon = var_3449_epsilon_0, x = var_3448_cast_fp16)[name = tensor("op_3449_cast_fp16")]; tensor output_361_cast_fp16 = mul(x = x_359, y = var_3449_cast_fp16)[name = tensor("output_361_cast_fp16")]; tensor var_3453_to_fp16 = const()[name = tensor("op_3453_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940518592)))]; tensor output_363_cast_fp16 = mul(x = output_361_cast_fp16, y = var_3453_to_fp16)[name = tensor("output_363_cast_fp16")]; tensor var_3465 = linear(bias = linear_0_bias_0, weight = wrapped_model_language_model_layers_15_self_attn_q_proj_weight_palettized, x = output_363_cast_fp16)[name = tensor("linear_105")]; tensor var_3466 = const()[name = tensor("op_3466"), val = tensor([1, 256, -1, 256])]; tensor var_3467 = reshape(shape = var_3466, x = var_3465)[name = tensor("op_3467")]; tensor x_363_perm_0 = const()[name = tensor("x_363_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_3470 = linear(bias = linear_1_bias_0, weight = wrapped_model_language_model_layers_15_self_attn_k_proj_weight_palettized, x = output_363_cast_fp16)[name = tensor("linear_106")]; tensor var_3471 = const()[name = tensor("op_3471"), val = tensor([1, 256, -1, 256])]; tensor var_3472 = reshape(shape = var_3471, x = var_3470)[name = tensor("op_3472")]; tensor x_367_perm_0 = const()[name = tensor("x_367_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_3475 = linear(bias = linear_1_bias_0, weight = wrapped_model_language_model_layers_15_self_attn_v_proj_weight_palettized, x = output_363_cast_fp16)[name = tensor("linear_107")]; tensor var_3476 = const()[name = tensor("op_3476"), val = tensor([1, 256, -1, 256])]; tensor var_3477 = reshape(shape = var_3476, x = var_3475)[name = tensor("op_3477")]; tensor hidden_states_217_perm_0 = const()[name = tensor("hidden_states_217_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_22_promoted_91_to_fp16 = const()[name = tensor("op_22_promoted_91_to_fp16"), val = tensor(0x1p+1)]; tensor x_363 = transpose(perm = x_363_perm_0, x = var_3467)[name = tensor("transpose_75")]; tensor var_3481_cast_fp16 = pow(x = x_363, y = var_22_promoted_91_to_fp16)[name = tensor("op_3481_cast_fp16")]; tensor var_3483_axes_0 = const()[name = tensor("op_3483_axes_0"), val = tensor([-1])]; tensor var_3483_keep_dims_0 = const()[name = tensor("op_3483_keep_dims_0"), val = tensor(true)]; tensor var_3483_cast_fp16 = reduce_mean(axes = var_3483_axes_0, keep_dims = var_3483_keep_dims_0, x = var_3481_cast_fp16)[name = tensor("op_3483_cast_fp16")]; tensor var_3484_to_fp16 = const()[name = tensor("op_3484_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_3485_cast_fp16 = add(x = var_3483_cast_fp16, y = var_3484_to_fp16)[name = tensor("op_3485_cast_fp16")]; tensor var_3486_epsilon_0 = const()[name = tensor("op_3486_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_3486_cast_fp16 = rsqrt(epsilon = var_3486_epsilon_0, x = var_3485_cast_fp16)[name = tensor("op_3486_cast_fp16")]; tensor output_365_cast_fp16 = mul(x = x_363, y = var_3486_cast_fp16)[name = tensor("output_365_cast_fp16")]; tensor var_3490_to_fp16 = const()[name = tensor("op_3490_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940523776)))]; tensor output_367_cast_fp16 = mul(x = output_365_cast_fp16, y = var_3490_to_fp16)[name = tensor("output_367_cast_fp16")]; tensor var_22_promoted_92_to_fp16 = const()[name = tensor("op_22_promoted_92_to_fp16"), val = tensor(0x1p+1)]; tensor x_367 = transpose(perm = x_367_perm_0, x = var_3472)[name = tensor("transpose_74")]; tensor var_3495_cast_fp16 = pow(x = x_367, y = var_22_promoted_92_to_fp16)[name = tensor("op_3495_cast_fp16")]; tensor var_3497_axes_0 = const()[name = tensor("op_3497_axes_0"), val = tensor([-1])]; tensor var_3497_keep_dims_0 = const()[name = tensor("op_3497_keep_dims_0"), val = tensor(true)]; tensor var_3497_cast_fp16 = reduce_mean(axes = var_3497_axes_0, keep_dims = var_3497_keep_dims_0, x = var_3495_cast_fp16)[name = tensor("op_3497_cast_fp16")]; tensor var_3498_to_fp16 = const()[name = tensor("op_3498_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_3499_cast_fp16 = add(x = var_3497_cast_fp16, y = var_3498_to_fp16)[name = tensor("op_3499_cast_fp16")]; tensor var_3500_epsilon_0 = const()[name = tensor("op_3500_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_3500_cast_fp16 = rsqrt(epsilon = var_3500_epsilon_0, x = var_3499_cast_fp16)[name = tensor("op_3500_cast_fp16")]; tensor output_369_cast_fp16 = mul(x = x_367, y = var_3500_cast_fp16)[name = tensor("output_369_cast_fp16")]; tensor var_3504_to_fp16 = const()[name = tensor("op_3504_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940524352)))]; tensor output_371_cast_fp16 = mul(x = output_369_cast_fp16, y = var_3504_to_fp16)[name = tensor("output_371_cast_fp16")]; tensor var_3509 = mul(x = output_367_cast_fp16, y = cos_7_palettized)[name = tensor("op_3509")]; tensor x1_61_begin_0 = const()[name = tensor("x1_61_begin_0"), val = tensor([0, 0, 0, 0])]; tensor x1_61_end_0 = const()[name = tensor("x1_61_end_0"), val = tensor([1, 8, 256, 128])]; tensor x1_61_end_mask_0 = const()[name = tensor("x1_61_end_mask_0"), val = tensor([true, true, true, false])]; tensor x1_61 = slice_by_index(begin = x1_61_begin_0, end = x1_61_end_0, end_mask = x1_61_end_mask_0, x = output_367_cast_fp16)[name = tensor("x1_61")]; tensor x2_61_begin_0 = const()[name = tensor("x2_61_begin_0"), val = tensor([0, 0, 0, 128])]; tensor x2_61_end_0 = const()[name = tensor("x2_61_end_0"), val = tensor([1, 8, 256, 256])]; tensor x2_61_end_mask_0 = const()[name = tensor("x2_61_end_mask_0"), val = tensor([true, true, true, true])]; tensor x2_61 = slice_by_index(begin = x2_61_begin_0, end = x2_61_end_0, end_mask = x2_61_end_mask_0, x = output_367_cast_fp16)[name = tensor("x2_61")]; tensor const_380_promoted = const()[name = tensor("const_380_promoted"), val = tensor(-0x1p+0)]; tensor var_3520 = mul(x = x2_61, y = const_380_promoted)[name = tensor("op_3520")]; tensor var_3522_interleave_0 = const()[name = tensor("op_3522_interleave_0"), val = tensor(false)]; tensor var_3522 = concat(axis = var_24, interleave = var_3522_interleave_0, values = (var_3520, x1_61))[name = tensor("op_3522")]; tensor var_3523 = mul(x = var_3522, y = sin_7_palettized)[name = tensor("op_3523")]; tensor query_31 = add(x = var_3509, y = var_3523)[name = tensor("query_31")]; tensor var_3525 = mul(x = output_371_cast_fp16, y = cos_7_palettized)[name = tensor("op_3525")]; tensor x1_63_begin_0 = const()[name = tensor("x1_63_begin_0"), val = tensor([0, 0, 0, 0])]; tensor x1_63_end_0 = const()[name = tensor("x1_63_end_0"), val = tensor([1, 4, 256, 128])]; tensor x1_63_end_mask_0 = const()[name = tensor("x1_63_end_mask_0"), val = tensor([true, true, true, false])]; tensor x1_63 = slice_by_index(begin = x1_63_begin_0, end = x1_63_end_0, end_mask = x1_63_end_mask_0, x = output_371_cast_fp16)[name = tensor("x1_63")]; tensor x2_63_begin_0 = const()[name = tensor("x2_63_begin_0"), val = tensor([0, 0, 0, 128])]; tensor x2_63_end_0 = const()[name = tensor("x2_63_end_0"), val = tensor([1, 4, 256, 256])]; tensor x2_63_end_mask_0 = const()[name = tensor("x2_63_end_mask_0"), val = tensor([true, true, true, true])]; tensor x2_63 = slice_by_index(begin = x2_63_begin_0, end = x2_63_end_0, end_mask = x2_63_end_mask_0, x = output_371_cast_fp16)[name = tensor("x2_63")]; tensor const_383_promoted = const()[name = tensor("const_383_promoted"), val = tensor(-0x1p+0)]; tensor var_3536 = mul(x = x2_63, y = const_383_promoted)[name = tensor("op_3536")]; tensor var_3538_interleave_0 = const()[name = tensor("op_3538_interleave_0"), val = tensor(false)]; tensor var_3538 = concat(axis = var_24, interleave = var_3538_interleave_0, values = (var_3536, x1_63))[name = tensor("op_3538")]; tensor var_3539 = mul(x = var_3538, y = sin_7_palettized)[name = tensor("op_3539")]; tensor hidden_states_213 = add(x = var_3525, y = var_3539)[name = tensor("hidden_states_213")]; tensor var_3548_axes_0 = const()[name = tensor("op_3548_axes_0"), val = tensor([2])]; tensor var_3548 = expand_dims(axes = var_3548_axes_0, x = hidden_states_213)[name = tensor("op_3548")]; tensor hidden_states_215_reps_0 = const()[name = tensor("hidden_states_215_reps_0"), val = tensor([1, 1, 2, 1, 1])]; tensor hidden_states_215 = tile(reps = hidden_states_215_reps_0, x = var_3548)[name = tensor("hidden_states_215")]; tensor var_3556 = const()[name = tensor("op_3556"), val = tensor([1, 8, 256, 256])]; tensor key_states_31 = reshape(shape = var_3556, x = hidden_states_215)[name = tensor("key_states_31")]; tensor var_3565_axes_0 = const()[name = tensor("op_3565_axes_0"), val = tensor([2])]; tensor hidden_states_217 = transpose(perm = hidden_states_217_perm_0, x = var_3477)[name = tensor("transpose_73")]; tensor var_3565 = expand_dims(axes = var_3565_axes_0, x = hidden_states_217)[name = tensor("op_3565")]; tensor hidden_states_219_reps_0 = const()[name = tensor("hidden_states_219_reps_0"), val = tensor([1, 1, 2, 1, 1])]; tensor hidden_states_219 = tile(reps = hidden_states_219_reps_0, x = var_3565)[name = tensor("hidden_states_219")]; tensor var_3573 = const()[name = tensor("op_3573"), val = tensor([1, 8, 256, 256])]; tensor value_states_31 = reshape(shape = var_3573, x = hidden_states_219)[name = tensor("value_states_31")]; tensor var_3576_transpose_x_1 = const()[name = tensor("op_3576_transpose_x_1"), val = tensor(false)]; tensor var_3576_transpose_y_1 = const()[name = tensor("op_3576_transpose_y_1"), val = tensor(true)]; tensor var_3576 = matmul(transpose_x = var_3576_transpose_x_1, transpose_y = var_3576_transpose_y_1, x = query_31, y = key_states_31)[name = tensor("op_3576")]; tensor var_3577_to_fp16 = const()[name = tensor("op_3577_to_fp16"), val = tensor(0x1p-4)]; tensor attn_weights_61_cast_fp16 = mul(x = var_3576, y = var_3577_to_fp16)[name = tensor("attn_weights_61_cast_fp16")]; tensor input_181_cast_fp16 = add(x = attn_weights_61_cast_fp16, y = attention_mask_to_fp16_palettized)[name = tensor("input_181_cast_fp16")]; tensor var_3585_cast_fp16 = softmax(axis = var_24, x = input_181_cast_fp16)[name = tensor("op_3585_cast_fp16")]; tensor attn_output_61_transpose_x_0 = const()[name = tensor("attn_output_61_transpose_x_0"), val = tensor(false)]; tensor attn_output_61_transpose_y_0 = const()[name = tensor("attn_output_61_transpose_y_0"), val = tensor(false)]; tensor attn_output_61 = matmul(transpose_x = attn_output_61_transpose_x_0, transpose_y = attn_output_61_transpose_y_0, x = var_3585_cast_fp16, y = value_states_31)[name = tensor("attn_output_61")]; tensor var_3589_perm_0 = const()[name = tensor("op_3589_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_3591 = const()[name = tensor("op_3591"), val = tensor([1, 256, -1])]; tensor var_3589 = transpose(perm = var_3589_perm_0, x = attn_output_61)[name = tensor("transpose_72")]; tensor var_3592 = reshape(shape = var_3591, x = var_3589)[name = tensor("op_3592")]; tensor x_371 = linear(bias = linear_3_bias_0, weight = wrapped_model_language_model_layers_15_self_attn_o_proj_weight_palettized, x = var_3592)[name = tensor("linear_108")]; tensor var_22_promoted_93_to_fp16 = const()[name = tensor("op_22_promoted_93_to_fp16"), val = tensor(0x1p+1)]; tensor var_3598_cast_fp16 = pow(x = x_371, y = var_22_promoted_93_to_fp16)[name = tensor("op_3598_cast_fp16")]; tensor var_3600_axes_0 = const()[name = tensor("op_3600_axes_0"), val = tensor([-1])]; tensor var_3600_keep_dims_0 = const()[name = tensor("op_3600_keep_dims_0"), val = tensor(true)]; tensor var_3600_cast_fp16 = reduce_mean(axes = var_3600_axes_0, keep_dims = var_3600_keep_dims_0, x = var_3598_cast_fp16)[name = tensor("op_3600_cast_fp16")]; tensor var_3601_to_fp16 = const()[name = tensor("op_3601_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_3602_cast_fp16 = add(x = var_3600_cast_fp16, y = var_3601_to_fp16)[name = tensor("op_3602_cast_fp16")]; tensor var_3603_epsilon_0 = const()[name = tensor("op_3603_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_3603_cast_fp16 = rsqrt(epsilon = var_3603_epsilon_0, x = var_3602_cast_fp16)[name = tensor("op_3603_cast_fp16")]; tensor output_373_cast_fp16 = mul(x = x_371, y = var_3603_cast_fp16)[name = tensor("output_373_cast_fp16")]; tensor var_3607_to_fp16 = const()[name = tensor("op_3607_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940524928)))]; tensor output_375_cast_fp16 = mul(x = output_373_cast_fp16, y = var_3607_to_fp16)[name = tensor("output_375_cast_fp16")]; tensor x_375 = add(x = x_359, y = output_375_cast_fp16)[name = tensor("x_375")]; tensor var_22_promoted_94_to_fp16 = const()[name = tensor("op_22_promoted_94_to_fp16"), val = tensor(0x1p+1)]; tensor var_3613_cast_fp16 = pow(x = x_375, y = var_22_promoted_94_to_fp16)[name = tensor("op_3613_cast_fp16")]; tensor var_3615_axes_0 = const()[name = tensor("op_3615_axes_0"), val = tensor([-1])]; tensor var_3615_keep_dims_0 = const()[name = tensor("op_3615_keep_dims_0"), val = tensor(true)]; tensor var_3615_cast_fp16 = reduce_mean(axes = var_3615_axes_0, keep_dims = var_3615_keep_dims_0, x = var_3613_cast_fp16)[name = tensor("op_3615_cast_fp16")]; tensor var_3616_to_fp16 = const()[name = tensor("op_3616_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_3617_cast_fp16 = add(x = var_3615_cast_fp16, y = var_3616_to_fp16)[name = tensor("op_3617_cast_fp16")]; tensor var_3618_epsilon_0 = const()[name = tensor("op_3618_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_3618_cast_fp16 = rsqrt(epsilon = var_3618_epsilon_0, x = var_3617_cast_fp16)[name = tensor("op_3618_cast_fp16")]; tensor output_377_cast_fp16 = mul(x = x_375, y = var_3618_cast_fp16)[name = tensor("output_377_cast_fp16")]; tensor var_3622_to_fp16 = const()[name = tensor("op_3622_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940530112)))]; tensor output_379_cast_fp16 = mul(x = output_377_cast_fp16, y = var_3622_to_fp16)[name = tensor("output_379_cast_fp16")]; tensor input_189 = linear(bias = linear_4_bias_0, weight = wrapped_model_language_model_layers_15_mlp_gate_proj_weight_palettized, x = output_379_cast_fp16)[name = tensor("linear_109")]; tensor var_3630_mode_0 = const()[name = tensor("op_3630_mode_0"), val = tensor("TANH_APPROXIMATION")]; tensor var_3630 = gelu(mode = var_3630_mode_0, x = input_189)[name = tensor("op_3630")]; tensor var_3632 = linear(bias = linear_4_bias_0, weight = wrapped_model_language_model_layers_15_mlp_up_proj_weight_palettized, x = output_379_cast_fp16)[name = tensor("linear_110")]; tensor input_191 = mul(x = var_3630, y = var_3632)[name = tensor("input_191")]; tensor x_379 = linear(bias = linear_3_bias_0, weight = wrapped_model_language_model_layers_15_mlp_down_proj_weight_palettized, x = input_191)[name = tensor("linear_111")]; tensor var_22_promoted_95_to_fp16 = const()[name = tensor("op_22_promoted_95_to_fp16"), val = tensor(0x1p+1)]; tensor var_3638_cast_fp16 = pow(x = x_379, y = var_22_promoted_95_to_fp16)[name = tensor("op_3638_cast_fp16")]; tensor var_3640_axes_0 = const()[name = tensor("op_3640_axes_0"), val = tensor([-1])]; tensor var_3640_keep_dims_0 = const()[name = tensor("op_3640_keep_dims_0"), val = tensor(true)]; tensor var_3640_cast_fp16 = reduce_mean(axes = var_3640_axes_0, keep_dims = var_3640_keep_dims_0, x = var_3638_cast_fp16)[name = tensor("op_3640_cast_fp16")]; tensor var_3641_to_fp16 = const()[name = tensor("op_3641_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_3642_cast_fp16 = add(x = var_3640_cast_fp16, y = var_3641_to_fp16)[name = tensor("op_3642_cast_fp16")]; tensor var_3643_epsilon_0 = const()[name = tensor("op_3643_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_3643_cast_fp16 = rsqrt(epsilon = var_3643_epsilon_0, x = var_3642_cast_fp16)[name = tensor("op_3643_cast_fp16")]; tensor output_381_cast_fp16 = mul(x = x_379, y = var_3643_cast_fp16)[name = tensor("output_381_cast_fp16")]; tensor var_3647_to_fp16 = const()[name = tensor("op_3647_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940535296)))]; tensor output_383_cast_fp16 = mul(x = output_381_cast_fp16, y = var_3647_to_fp16)[name = tensor("output_383_cast_fp16")]; tensor x_383 = add(x = x_375, y = output_383_cast_fp16)[name = tensor("x_383")]; tensor var_22_promoted_96_to_fp16 = const()[name = tensor("op_22_promoted_96_to_fp16"), val = tensor(0x1p+1)]; tensor var_3659_cast_fp16 = pow(x = x_383, y = var_22_promoted_96_to_fp16)[name = tensor("op_3659_cast_fp16")]; tensor var_3661_axes_0 = const()[name = tensor("op_3661_axes_0"), val = tensor([-1])]; tensor var_3661_keep_dims_0 = const()[name = tensor("op_3661_keep_dims_0"), val = tensor(true)]; tensor var_3661_cast_fp16 = reduce_mean(axes = var_3661_axes_0, keep_dims = var_3661_keep_dims_0, x = var_3659_cast_fp16)[name = tensor("op_3661_cast_fp16")]; tensor var_3662_to_fp16 = const()[name = tensor("op_3662_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_3663_cast_fp16 = add(x = var_3661_cast_fp16, y = var_3662_to_fp16)[name = tensor("op_3663_cast_fp16")]; tensor var_3664_epsilon_0 = const()[name = tensor("op_3664_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_3664_cast_fp16 = rsqrt(epsilon = var_3664_epsilon_0, x = var_3663_cast_fp16)[name = tensor("op_3664_cast_fp16")]; tensor output_385_cast_fp16 = mul(x = x_383, y = var_3664_cast_fp16)[name = tensor("output_385_cast_fp16")]; tensor var_3668_to_fp16 = const()[name = tensor("op_3668_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940540480)))]; tensor output_387_cast_fp16 = mul(x = output_385_cast_fp16, y = var_3668_to_fp16)[name = tensor("output_387_cast_fp16")]; tensor var_3680 = linear(bias = linear_0_bias_0, weight = wrapped_model_language_model_layers_16_self_attn_q_proj_weight_palettized, x = output_387_cast_fp16)[name = tensor("linear_112")]; tensor var_3681 = const()[name = tensor("op_3681"), val = tensor([1, 256, -1, 256])]; tensor var_3682 = reshape(shape = var_3681, x = var_3680)[name = tensor("op_3682")]; tensor x_387_perm_0 = const()[name = tensor("x_387_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_3685 = linear(bias = linear_1_bias_0, weight = wrapped_model_language_model_layers_16_self_attn_k_proj_weight_palettized, x = output_387_cast_fp16)[name = tensor("linear_113")]; tensor var_3686 = const()[name = tensor("op_3686"), val = tensor([1, 256, -1, 256])]; tensor var_3687 = reshape(shape = var_3686, x = var_3685)[name = tensor("op_3687")]; tensor x_391_perm_0 = const()[name = tensor("x_391_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_3690 = linear(bias = linear_1_bias_0, weight = wrapped_model_language_model_layers_16_self_attn_v_proj_weight_palettized, x = output_387_cast_fp16)[name = tensor("linear_114")]; tensor var_3691 = const()[name = tensor("op_3691"), val = tensor([1, 256, -1, 256])]; tensor var_3692 = reshape(shape = var_3691, x = var_3690)[name = tensor("op_3692")]; tensor hidden_states_231_perm_0 = const()[name = tensor("hidden_states_231_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_22_promoted_97_to_fp16 = const()[name = tensor("op_22_promoted_97_to_fp16"), val = tensor(0x1p+1)]; tensor x_387 = transpose(perm = x_387_perm_0, x = var_3682)[name = tensor("transpose_71")]; tensor var_3696_cast_fp16 = pow(x = x_387, y = var_22_promoted_97_to_fp16)[name = tensor("op_3696_cast_fp16")]; tensor var_3698_axes_0 = const()[name = tensor("op_3698_axes_0"), val = tensor([-1])]; tensor var_3698_keep_dims_0 = const()[name = tensor("op_3698_keep_dims_0"), val = tensor(true)]; tensor var_3698_cast_fp16 = reduce_mean(axes = var_3698_axes_0, keep_dims = var_3698_keep_dims_0, x = var_3696_cast_fp16)[name = tensor("op_3698_cast_fp16")]; tensor var_3699_to_fp16 = const()[name = tensor("op_3699_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_3700_cast_fp16 = add(x = var_3698_cast_fp16, y = var_3699_to_fp16)[name = tensor("op_3700_cast_fp16")]; tensor var_3701_epsilon_0 = const()[name = tensor("op_3701_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_3701_cast_fp16 = rsqrt(epsilon = var_3701_epsilon_0, x = var_3700_cast_fp16)[name = tensor("op_3701_cast_fp16")]; tensor output_389_cast_fp16 = mul(x = x_387, y = var_3701_cast_fp16)[name = tensor("output_389_cast_fp16")]; tensor var_3705_to_fp16 = const()[name = tensor("op_3705_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940545664)))]; tensor output_391_cast_fp16 = mul(x = output_389_cast_fp16, y = var_3705_to_fp16)[name = tensor("output_391_cast_fp16")]; tensor var_22_promoted_98_to_fp16 = const()[name = tensor("op_22_promoted_98_to_fp16"), val = tensor(0x1p+1)]; tensor x_391 = transpose(perm = x_391_perm_0, x = var_3687)[name = tensor("transpose_70")]; tensor var_3710_cast_fp16 = pow(x = x_391, y = var_22_promoted_98_to_fp16)[name = tensor("op_3710_cast_fp16")]; tensor var_3712_axes_0 = const()[name = tensor("op_3712_axes_0"), val = tensor([-1])]; tensor var_3712_keep_dims_0 = const()[name = tensor("op_3712_keep_dims_0"), val = tensor(true)]; tensor var_3712_cast_fp16 = reduce_mean(axes = var_3712_axes_0, keep_dims = var_3712_keep_dims_0, x = var_3710_cast_fp16)[name = tensor("op_3712_cast_fp16")]; tensor var_3713_to_fp16 = const()[name = tensor("op_3713_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_3714_cast_fp16 = add(x = var_3712_cast_fp16, y = var_3713_to_fp16)[name = tensor("op_3714_cast_fp16")]; tensor var_3715_epsilon_0 = const()[name = tensor("op_3715_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_3715_cast_fp16 = rsqrt(epsilon = var_3715_epsilon_0, x = var_3714_cast_fp16)[name = tensor("op_3715_cast_fp16")]; tensor output_393_cast_fp16 = mul(x = x_391, y = var_3715_cast_fp16)[name = tensor("output_393_cast_fp16")]; tensor var_3719_to_fp16 = const()[name = tensor("op_3719_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940546240)))]; tensor output_395_cast_fp16 = mul(x = output_393_cast_fp16, y = var_3719_to_fp16)[name = tensor("output_395_cast_fp16")]; tensor var_3724 = mul(x = output_391_cast_fp16, y = cos_7_palettized)[name = tensor("op_3724")]; tensor x1_65_begin_0 = const()[name = tensor("x1_65_begin_0"), val = tensor([0, 0, 0, 0])]; tensor x1_65_end_0 = const()[name = tensor("x1_65_end_0"), val = tensor([1, 8, 256, 128])]; tensor x1_65_end_mask_0 = const()[name = tensor("x1_65_end_mask_0"), val = tensor([true, true, true, false])]; tensor x1_65 = slice_by_index(begin = x1_65_begin_0, end = x1_65_end_0, end_mask = x1_65_end_mask_0, x = output_391_cast_fp16)[name = tensor("x1_65")]; tensor x2_65_begin_0 = const()[name = tensor("x2_65_begin_0"), val = tensor([0, 0, 0, 128])]; tensor x2_65_end_0 = const()[name = tensor("x2_65_end_0"), val = tensor([1, 8, 256, 256])]; tensor x2_65_end_mask_0 = const()[name = tensor("x2_65_end_mask_0"), val = tensor([true, true, true, true])]; tensor x2_65 = slice_by_index(begin = x2_65_begin_0, end = x2_65_end_0, end_mask = x2_65_end_mask_0, x = output_391_cast_fp16)[name = tensor("x2_65")]; tensor const_403_promoted = const()[name = tensor("const_403_promoted"), val = tensor(-0x1p+0)]; tensor var_3735 = mul(x = x2_65, y = const_403_promoted)[name = tensor("op_3735")]; tensor var_3737_interleave_0 = const()[name = tensor("op_3737_interleave_0"), val = tensor(false)]; tensor var_3737 = concat(axis = var_24, interleave = var_3737_interleave_0, values = (var_3735, x1_65))[name = tensor("op_3737")]; tensor var_3738 = mul(x = var_3737, y = sin_7_palettized)[name = tensor("op_3738")]; tensor query_33 = add(x = var_3724, y = var_3738)[name = tensor("query_33")]; tensor var_3740 = mul(x = output_395_cast_fp16, y = cos_7_palettized)[name = tensor("op_3740")]; tensor x1_67_begin_0 = const()[name = tensor("x1_67_begin_0"), val = tensor([0, 0, 0, 0])]; tensor x1_67_end_0 = const()[name = tensor("x1_67_end_0"), val = tensor([1, 4, 256, 128])]; tensor x1_67_end_mask_0 = const()[name = tensor("x1_67_end_mask_0"), val = tensor([true, true, true, false])]; tensor x1_67 = slice_by_index(begin = x1_67_begin_0, end = x1_67_end_0, end_mask = x1_67_end_mask_0, x = output_395_cast_fp16)[name = tensor("x1_67")]; tensor x2_67_begin_0 = const()[name = tensor("x2_67_begin_0"), val = tensor([0, 0, 0, 128])]; tensor x2_67_end_0 = const()[name = tensor("x2_67_end_0"), val = tensor([1, 4, 256, 256])]; tensor x2_67_end_mask_0 = const()[name = tensor("x2_67_end_mask_0"), val = tensor([true, true, true, true])]; tensor x2_67 = slice_by_index(begin = x2_67_begin_0, end = x2_67_end_0, end_mask = x2_67_end_mask_0, x = output_395_cast_fp16)[name = tensor("x2_67")]; tensor const_406_promoted = const()[name = tensor("const_406_promoted"), val = tensor(-0x1p+0)]; tensor var_3751 = mul(x = x2_67, y = const_406_promoted)[name = tensor("op_3751")]; tensor var_3753_interleave_0 = const()[name = tensor("op_3753_interleave_0"), val = tensor(false)]; tensor var_3753 = concat(axis = var_24, interleave = var_3753_interleave_0, values = (var_3751, x1_67))[name = tensor("op_3753")]; tensor var_3754 = mul(x = var_3753, y = sin_7_palettized)[name = tensor("op_3754")]; tensor hidden_states_227 = add(x = var_3740, y = var_3754)[name = tensor("hidden_states_227")]; tensor var_3763_axes_0 = const()[name = tensor("op_3763_axes_0"), val = tensor([2])]; tensor var_3763 = expand_dims(axes = var_3763_axes_0, x = hidden_states_227)[name = tensor("op_3763")]; tensor hidden_states_229_reps_0 = const()[name = tensor("hidden_states_229_reps_0"), val = tensor([1, 1, 2, 1, 1])]; tensor hidden_states_229 = tile(reps = hidden_states_229_reps_0, x = var_3763)[name = tensor("hidden_states_229")]; tensor var_3771 = const()[name = tensor("op_3771"), val = tensor([1, 8, 256, 256])]; tensor key_states_33 = reshape(shape = var_3771, x = hidden_states_229)[name = tensor("key_states_33")]; tensor var_3780_axes_0 = const()[name = tensor("op_3780_axes_0"), val = tensor([2])]; tensor hidden_states_231 = transpose(perm = hidden_states_231_perm_0, x = var_3692)[name = tensor("transpose_69")]; tensor var_3780 = expand_dims(axes = var_3780_axes_0, x = hidden_states_231)[name = tensor("op_3780")]; tensor hidden_states_233_reps_0 = const()[name = tensor("hidden_states_233_reps_0"), val = tensor([1, 1, 2, 1, 1])]; tensor hidden_states_233 = tile(reps = hidden_states_233_reps_0, x = var_3780)[name = tensor("hidden_states_233")]; tensor var_3788 = const()[name = tensor("op_3788"), val = tensor([1, 8, 256, 256])]; tensor value_states_33 = reshape(shape = var_3788, x = hidden_states_233)[name = tensor("value_states_33")]; tensor var_3791_transpose_x_1 = const()[name = tensor("op_3791_transpose_x_1"), val = tensor(false)]; tensor var_3791_transpose_y_1 = const()[name = tensor("op_3791_transpose_y_1"), val = tensor(true)]; tensor var_3791 = matmul(transpose_x = var_3791_transpose_x_1, transpose_y = var_3791_transpose_y_1, x = query_33, y = key_states_33)[name = tensor("op_3791")]; tensor var_3792_to_fp16 = const()[name = tensor("op_3792_to_fp16"), val = tensor(0x1p-4)]; tensor attn_weights_65_cast_fp16 = mul(x = var_3791, y = var_3792_to_fp16)[name = tensor("attn_weights_65_cast_fp16")]; tensor input_193_cast_fp16 = add(x = attn_weights_65_cast_fp16, y = attention_mask_to_fp16_palettized)[name = tensor("input_193_cast_fp16")]; tensor var_3800_cast_fp16 = softmax(axis = var_24, x = input_193_cast_fp16)[name = tensor("op_3800_cast_fp16")]; tensor attn_output_65_transpose_x_0 = const()[name = tensor("attn_output_65_transpose_x_0"), val = tensor(false)]; tensor attn_output_65_transpose_y_0 = const()[name = tensor("attn_output_65_transpose_y_0"), val = tensor(false)]; tensor attn_output_65 = matmul(transpose_x = attn_output_65_transpose_x_0, transpose_y = attn_output_65_transpose_y_0, x = var_3800_cast_fp16, y = value_states_33)[name = tensor("attn_output_65")]; tensor var_3804_perm_0 = const()[name = tensor("op_3804_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_3806 = const()[name = tensor("op_3806"), val = tensor([1, 256, -1])]; tensor var_3804 = transpose(perm = var_3804_perm_0, x = attn_output_65)[name = tensor("transpose_68")]; tensor var_3807 = reshape(shape = var_3806, x = var_3804)[name = tensor("op_3807")]; tensor x_395 = linear(bias = linear_3_bias_0, weight = wrapped_model_language_model_layers_16_self_attn_o_proj_weight_palettized, x = var_3807)[name = tensor("linear_115")]; tensor var_22_promoted_99_to_fp16 = const()[name = tensor("op_22_promoted_99_to_fp16"), val = tensor(0x1p+1)]; tensor var_3813_cast_fp16 = pow(x = x_395, y = var_22_promoted_99_to_fp16)[name = tensor("op_3813_cast_fp16")]; tensor var_3815_axes_0 = const()[name = tensor("op_3815_axes_0"), val = tensor([-1])]; tensor var_3815_keep_dims_0 = const()[name = tensor("op_3815_keep_dims_0"), val = tensor(true)]; tensor var_3815_cast_fp16 = reduce_mean(axes = var_3815_axes_0, keep_dims = var_3815_keep_dims_0, x = var_3813_cast_fp16)[name = tensor("op_3815_cast_fp16")]; tensor var_3816_to_fp16 = const()[name = tensor("op_3816_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_3817_cast_fp16 = add(x = var_3815_cast_fp16, y = var_3816_to_fp16)[name = tensor("op_3817_cast_fp16")]; tensor var_3818_epsilon_0 = const()[name = tensor("op_3818_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_3818_cast_fp16 = rsqrt(epsilon = var_3818_epsilon_0, x = var_3817_cast_fp16)[name = tensor("op_3818_cast_fp16")]; tensor output_397_cast_fp16 = mul(x = x_395, y = var_3818_cast_fp16)[name = tensor("output_397_cast_fp16")]; tensor var_3822_to_fp16 = const()[name = tensor("op_3822_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940546816)))]; tensor output_399_cast_fp16 = mul(x = output_397_cast_fp16, y = var_3822_to_fp16)[name = tensor("output_399_cast_fp16")]; tensor x_399 = add(x = x_383, y = output_399_cast_fp16)[name = tensor("x_399")]; tensor var_22_promoted_100_to_fp16 = const()[name = tensor("op_22_promoted_100_to_fp16"), val = tensor(0x1p+1)]; tensor var_3828_cast_fp16 = pow(x = x_399, y = var_22_promoted_100_to_fp16)[name = tensor("op_3828_cast_fp16")]; tensor var_3830_axes_0 = const()[name = tensor("op_3830_axes_0"), val = tensor([-1])]; tensor var_3830_keep_dims_0 = const()[name = tensor("op_3830_keep_dims_0"), val = tensor(true)]; tensor var_3830_cast_fp16 = reduce_mean(axes = var_3830_axes_0, keep_dims = var_3830_keep_dims_0, x = var_3828_cast_fp16)[name = tensor("op_3830_cast_fp16")]; tensor var_3831_to_fp16 = const()[name = tensor("op_3831_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_3832_cast_fp16 = add(x = var_3830_cast_fp16, y = var_3831_to_fp16)[name = tensor("op_3832_cast_fp16")]; tensor var_3833_epsilon_0 = const()[name = tensor("op_3833_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_3833_cast_fp16 = rsqrt(epsilon = var_3833_epsilon_0, x = var_3832_cast_fp16)[name = tensor("op_3833_cast_fp16")]; tensor output_401_cast_fp16 = mul(x = x_399, y = var_3833_cast_fp16)[name = tensor("output_401_cast_fp16")]; tensor var_3837_to_fp16 = const()[name = tensor("op_3837_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940552000)))]; tensor output_403_cast_fp16 = mul(x = output_401_cast_fp16, y = var_3837_to_fp16)[name = tensor("output_403_cast_fp16")]; tensor input_201 = linear(bias = linear_4_bias_0, weight = wrapped_model_language_model_layers_16_mlp_gate_proj_weight_palettized, x = output_403_cast_fp16)[name = tensor("linear_116")]; tensor var_3845_mode_0 = const()[name = tensor("op_3845_mode_0"), val = tensor("TANH_APPROXIMATION")]; tensor var_3845 = gelu(mode = var_3845_mode_0, x = input_201)[name = tensor("op_3845")]; tensor var_3847 = linear(bias = linear_4_bias_0, weight = wrapped_model_language_model_layers_16_mlp_up_proj_weight_palettized, x = output_403_cast_fp16)[name = tensor("linear_117")]; tensor input_203 = mul(x = var_3845, y = var_3847)[name = tensor("input_203")]; tensor x_403 = linear(bias = linear_3_bias_0, weight = wrapped_model_language_model_layers_16_mlp_down_proj_weight_palettized, x = input_203)[name = tensor("linear_118")]; tensor var_22_promoted_101_to_fp16 = const()[name = tensor("op_22_promoted_101_to_fp16"), val = tensor(0x1p+1)]; tensor var_3853_cast_fp16 = pow(x = x_403, y = var_22_promoted_101_to_fp16)[name = tensor("op_3853_cast_fp16")]; tensor var_3855_axes_0 = const()[name = tensor("op_3855_axes_0"), val = tensor([-1])]; tensor var_3855_keep_dims_0 = const()[name = tensor("op_3855_keep_dims_0"), val = tensor(true)]; tensor var_3855_cast_fp16 = reduce_mean(axes = var_3855_axes_0, keep_dims = var_3855_keep_dims_0, x = var_3853_cast_fp16)[name = tensor("op_3855_cast_fp16")]; tensor var_3856_to_fp16 = const()[name = tensor("op_3856_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_3857_cast_fp16 = add(x = var_3855_cast_fp16, y = var_3856_to_fp16)[name = tensor("op_3857_cast_fp16")]; tensor var_3858_epsilon_0 = const()[name = tensor("op_3858_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_3858_cast_fp16 = rsqrt(epsilon = var_3858_epsilon_0, x = var_3857_cast_fp16)[name = tensor("op_3858_cast_fp16")]; tensor output_405_cast_fp16 = mul(x = x_403, y = var_3858_cast_fp16)[name = tensor("output_405_cast_fp16")]; tensor var_3862_to_fp16 = const()[name = tensor("op_3862_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940557184)))]; tensor output_407_cast_fp16 = mul(x = output_405_cast_fp16, y = var_3862_to_fp16)[name = tensor("output_407_cast_fp16")]; tensor x_407 = add(x = x_399, y = output_407_cast_fp16)[name = tensor("x_407")]; tensor var_22_promoted_102_to_fp16 = const()[name = tensor("op_22_promoted_102_to_fp16"), val = tensor(0x1p+1)]; tensor var_3874_cast_fp16 = pow(x = x_407, y = var_22_promoted_102_to_fp16)[name = tensor("op_3874_cast_fp16")]; tensor var_3876_axes_0 = const()[name = tensor("op_3876_axes_0"), val = tensor([-1])]; tensor var_3876_keep_dims_0 = const()[name = tensor("op_3876_keep_dims_0"), val = tensor(true)]; tensor var_3876_cast_fp16 = reduce_mean(axes = var_3876_axes_0, keep_dims = var_3876_keep_dims_0, x = var_3874_cast_fp16)[name = tensor("op_3876_cast_fp16")]; tensor var_3877_to_fp16 = const()[name = tensor("op_3877_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_3878_cast_fp16 = add(x = var_3876_cast_fp16, y = var_3877_to_fp16)[name = tensor("op_3878_cast_fp16")]; tensor var_3879_epsilon_0 = const()[name = tensor("op_3879_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_3879_cast_fp16 = rsqrt(epsilon = var_3879_epsilon_0, x = var_3878_cast_fp16)[name = tensor("op_3879_cast_fp16")]; tensor output_409_cast_fp16 = mul(x = x_407, y = var_3879_cast_fp16)[name = tensor("output_409_cast_fp16")]; tensor var_3883_to_fp16 = const()[name = tensor("op_3883_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940562368)))]; tensor output_411_cast_fp16 = mul(x = output_409_cast_fp16, y = var_3883_to_fp16)[name = tensor("output_411_cast_fp16")]; tensor var_3895 = linear(bias = linear_0_bias_0, weight = wrapped_model_language_model_layers_17_self_attn_q_proj_weight_palettized, x = output_411_cast_fp16)[name = tensor("linear_119")]; tensor var_3896 = const()[name = tensor("op_3896"), val = tensor([1, 256, -1, 256])]; tensor var_3897 = reshape(shape = var_3896, x = var_3895)[name = tensor("op_3897")]; tensor x_411_perm_0 = const()[name = tensor("x_411_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_3900 = linear(bias = linear_1_bias_0, weight = wrapped_model_language_model_layers_17_self_attn_k_proj_weight_palettized, x = output_411_cast_fp16)[name = tensor("linear_120")]; tensor var_3901 = const()[name = tensor("op_3901"), val = tensor([1, 256, -1, 256])]; tensor var_3902 = reshape(shape = var_3901, x = var_3900)[name = tensor("op_3902")]; tensor x_415_perm_0 = const()[name = tensor("x_415_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_3905 = linear(bias = linear_1_bias_0, weight = wrapped_model_language_model_layers_17_self_attn_v_proj_weight_palettized, x = output_411_cast_fp16)[name = tensor("linear_121")]; tensor var_3906 = const()[name = tensor("op_3906"), val = tensor([1, 256, -1, 256])]; tensor var_3907 = reshape(shape = var_3906, x = var_3905)[name = tensor("op_3907")]; tensor hidden_states_245_perm_0 = const()[name = tensor("hidden_states_245_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_22_promoted_103_to_fp16 = const()[name = tensor("op_22_promoted_103_to_fp16"), val = tensor(0x1p+1)]; tensor x_411 = transpose(perm = x_411_perm_0, x = var_3897)[name = tensor("transpose_67")]; tensor var_3911_cast_fp16 = pow(x = x_411, y = var_22_promoted_103_to_fp16)[name = tensor("op_3911_cast_fp16")]; tensor var_3913_axes_0 = const()[name = tensor("op_3913_axes_0"), val = tensor([-1])]; tensor var_3913_keep_dims_0 = const()[name = tensor("op_3913_keep_dims_0"), val = tensor(true)]; tensor var_3913_cast_fp16 = reduce_mean(axes = var_3913_axes_0, keep_dims = var_3913_keep_dims_0, x = var_3911_cast_fp16)[name = tensor("op_3913_cast_fp16")]; tensor var_3914_to_fp16 = const()[name = tensor("op_3914_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_3915_cast_fp16 = add(x = var_3913_cast_fp16, y = var_3914_to_fp16)[name = tensor("op_3915_cast_fp16")]; tensor var_3916_epsilon_0 = const()[name = tensor("op_3916_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_3916_cast_fp16 = rsqrt(epsilon = var_3916_epsilon_0, x = var_3915_cast_fp16)[name = tensor("op_3916_cast_fp16")]; tensor output_413_cast_fp16 = mul(x = x_411, y = var_3916_cast_fp16)[name = tensor("output_413_cast_fp16")]; tensor var_3920_to_fp16 = const()[name = tensor("op_3920_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940567552)))]; tensor output_415_cast_fp16 = mul(x = output_413_cast_fp16, y = var_3920_to_fp16)[name = tensor("output_415_cast_fp16")]; tensor var_22_promoted_104_to_fp16 = const()[name = tensor("op_22_promoted_104_to_fp16"), val = tensor(0x1p+1)]; tensor x_415 = transpose(perm = x_415_perm_0, x = var_3902)[name = tensor("transpose_66")]; tensor var_3925_cast_fp16 = pow(x = x_415, y = var_22_promoted_104_to_fp16)[name = tensor("op_3925_cast_fp16")]; tensor var_3927_axes_0 = const()[name = tensor("op_3927_axes_0"), val = tensor([-1])]; tensor var_3927_keep_dims_0 = const()[name = tensor("op_3927_keep_dims_0"), val = tensor(true)]; tensor var_3927_cast_fp16 = reduce_mean(axes = var_3927_axes_0, keep_dims = var_3927_keep_dims_0, x = var_3925_cast_fp16)[name = tensor("op_3927_cast_fp16")]; tensor var_3928_to_fp16 = const()[name = tensor("op_3928_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_3929_cast_fp16 = add(x = var_3927_cast_fp16, y = var_3928_to_fp16)[name = tensor("op_3929_cast_fp16")]; tensor var_3930_epsilon_0 = const()[name = tensor("op_3930_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_3930_cast_fp16 = rsqrt(epsilon = var_3930_epsilon_0, x = var_3929_cast_fp16)[name = tensor("op_3930_cast_fp16")]; tensor output_417_cast_fp16 = mul(x = x_415, y = var_3930_cast_fp16)[name = tensor("output_417_cast_fp16")]; tensor var_3934_to_fp16 = const()[name = tensor("op_3934_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940568128)))]; tensor output_419_cast_fp16 = mul(x = output_417_cast_fp16, y = var_3934_to_fp16)[name = tensor("output_419_cast_fp16")]; tensor var_3939 = mul(x = output_415_cast_fp16, y = cos_19_palettized)[name = tensor("op_3939")]; tensor x1_69_begin_0 = const()[name = tensor("x1_69_begin_0"), val = tensor([0, 0, 0, 0])]; tensor x1_69_end_0 = const()[name = tensor("x1_69_end_0"), val = tensor([1, 8, 256, 128])]; tensor x1_69_end_mask_0 = const()[name = tensor("x1_69_end_mask_0"), val = tensor([true, true, true, false])]; tensor x1_69 = slice_by_index(begin = x1_69_begin_0, end = x1_69_end_0, end_mask = x1_69_end_mask_0, x = output_415_cast_fp16)[name = tensor("x1_69")]; tensor x2_69_begin_0 = const()[name = tensor("x2_69_begin_0"), val = tensor([0, 0, 0, 128])]; tensor x2_69_end_0 = const()[name = tensor("x2_69_end_0"), val = tensor([1, 8, 256, 256])]; tensor x2_69_end_mask_0 = const()[name = tensor("x2_69_end_mask_0"), val = tensor([true, true, true, true])]; tensor x2_69 = slice_by_index(begin = x2_69_begin_0, end = x2_69_end_0, end_mask = x2_69_end_mask_0, x = output_415_cast_fp16)[name = tensor("x2_69")]; tensor const_426_promoted = const()[name = tensor("const_426_promoted"), val = tensor(-0x1p+0)]; tensor var_3950 = mul(x = x2_69, y = const_426_promoted)[name = tensor("op_3950")]; tensor var_3952_interleave_0 = const()[name = tensor("op_3952_interleave_0"), val = tensor(false)]; tensor var_3952 = concat(axis = var_24, interleave = var_3952_interleave_0, values = (var_3950, x1_69))[name = tensor("op_3952")]; tensor var_3953 = mul(x = var_3952, y = sin_19_palettized)[name = tensor("op_3953")]; tensor query_35 = add(x = var_3939, y = var_3953)[name = tensor("query_35")]; tensor var_3955 = mul(x = output_419_cast_fp16, y = cos_19_palettized)[name = tensor("op_3955")]; tensor x1_71_begin_0 = const()[name = tensor("x1_71_begin_0"), val = tensor([0, 0, 0, 0])]; tensor x1_71_end_0 = const()[name = tensor("x1_71_end_0"), val = tensor([1, 4, 256, 128])]; tensor x1_71_end_mask_0 = const()[name = tensor("x1_71_end_mask_0"), val = tensor([true, true, true, false])]; tensor x1_71 = slice_by_index(begin = x1_71_begin_0, end = x1_71_end_0, end_mask = x1_71_end_mask_0, x = output_419_cast_fp16)[name = tensor("x1_71")]; tensor x2_71_begin_0 = const()[name = tensor("x2_71_begin_0"), val = tensor([0, 0, 0, 128])]; tensor x2_71_end_0 = const()[name = tensor("x2_71_end_0"), val = tensor([1, 4, 256, 256])]; tensor x2_71_end_mask_0 = const()[name = tensor("x2_71_end_mask_0"), val = tensor([true, true, true, true])]; tensor x2_71 = slice_by_index(begin = x2_71_begin_0, end = x2_71_end_0, end_mask = x2_71_end_mask_0, x = output_419_cast_fp16)[name = tensor("x2_71")]; tensor const_429_promoted = const()[name = tensor("const_429_promoted"), val = tensor(-0x1p+0)]; tensor var_3966 = mul(x = x2_71, y = const_429_promoted)[name = tensor("op_3966")]; tensor var_3968_interleave_0 = const()[name = tensor("op_3968_interleave_0"), val = tensor(false)]; tensor var_3968 = concat(axis = var_24, interleave = var_3968_interleave_0, values = (var_3966, x1_71))[name = tensor("op_3968")]; tensor var_3969 = mul(x = var_3968, y = sin_19_palettized)[name = tensor("op_3969")]; tensor hidden_states_241 = add(x = var_3955, y = var_3969)[name = tensor("hidden_states_241")]; tensor var_3978_axes_0 = const()[name = tensor("op_3978_axes_0"), val = tensor([2])]; tensor var_3978 = expand_dims(axes = var_3978_axes_0, x = hidden_states_241)[name = tensor("op_3978")]; tensor hidden_states_243_reps_0 = const()[name = tensor("hidden_states_243_reps_0"), val = tensor([1, 1, 2, 1, 1])]; tensor hidden_states_243 = tile(reps = hidden_states_243_reps_0, x = var_3978)[name = tensor("hidden_states_243")]; tensor var_3986 = const()[name = tensor("op_3986"), val = tensor([1, 8, 256, 256])]; tensor key_states_35 = reshape(shape = var_3986, x = hidden_states_243)[name = tensor("key_states_35")]; tensor var_3995_axes_0 = const()[name = tensor("op_3995_axes_0"), val = tensor([2])]; tensor hidden_states_245 = transpose(perm = hidden_states_245_perm_0, x = var_3907)[name = tensor("transpose_65")]; tensor var_3995 = expand_dims(axes = var_3995_axes_0, x = hidden_states_245)[name = tensor("op_3995")]; tensor hidden_states_247_reps_0 = const()[name = tensor("hidden_states_247_reps_0"), val = tensor([1, 1, 2, 1, 1])]; tensor hidden_states_247 = tile(reps = hidden_states_247_reps_0, x = var_3995)[name = tensor("hidden_states_247")]; tensor var_4003 = const()[name = tensor("op_4003"), val = tensor([1, 8, 256, 256])]; tensor value_states_35 = reshape(shape = var_4003, x = hidden_states_247)[name = tensor("value_states_35")]; tensor var_4006_transpose_x_1 = const()[name = tensor("op_4006_transpose_x_1"), val = tensor(false)]; tensor var_4006_transpose_y_1 = const()[name = tensor("op_4006_transpose_y_1"), val = tensor(true)]; tensor var_4006 = matmul(transpose_x = var_4006_transpose_x_1, transpose_y = var_4006_transpose_y_1, x = query_35, y = key_states_35)[name = tensor("op_4006")]; tensor var_4007_to_fp16 = const()[name = tensor("op_4007_to_fp16"), val = tensor(0x1p-4)]; tensor attn_weights_69_cast_fp16 = mul(x = var_4006, y = var_4007_to_fp16)[name = tensor("attn_weights_69_cast_fp16")]; tensor input_205_cast_fp16 = add(x = attn_weights_69_cast_fp16, y = attention_mask_to_fp16_palettized)[name = tensor("input_205_cast_fp16")]; tensor var_4015_cast_fp16 = softmax(axis = var_24, x = input_205_cast_fp16)[name = tensor("op_4015_cast_fp16")]; tensor attn_output_69_transpose_x_0 = const()[name = tensor("attn_output_69_transpose_x_0"), val = tensor(false)]; tensor attn_output_69_transpose_y_0 = const()[name = tensor("attn_output_69_transpose_y_0"), val = tensor(false)]; tensor attn_output_69 = matmul(transpose_x = attn_output_69_transpose_x_0, transpose_y = attn_output_69_transpose_y_0, x = var_4015_cast_fp16, y = value_states_35)[name = tensor("attn_output_69")]; tensor var_4019_perm_0 = const()[name = tensor("op_4019_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_4021 = const()[name = tensor("op_4021"), val = tensor([1, 256, -1])]; tensor var_4019 = transpose(perm = var_4019_perm_0, x = attn_output_69)[name = tensor("transpose_64")]; tensor var_4022 = reshape(shape = var_4021, x = var_4019)[name = tensor("op_4022")]; tensor x_419 = linear(bias = linear_3_bias_0, weight = wrapped_model_language_model_layers_17_self_attn_o_proj_weight_palettized, x = var_4022)[name = tensor("linear_122")]; tensor var_22_promoted_105_to_fp16 = const()[name = tensor("op_22_promoted_105_to_fp16"), val = tensor(0x1p+1)]; tensor var_4028_cast_fp16 = pow(x = x_419, y = var_22_promoted_105_to_fp16)[name = tensor("op_4028_cast_fp16")]; tensor var_4030_axes_0 = const()[name = tensor("op_4030_axes_0"), val = tensor([-1])]; tensor var_4030_keep_dims_0 = const()[name = tensor("op_4030_keep_dims_0"), val = tensor(true)]; tensor var_4030_cast_fp16 = reduce_mean(axes = var_4030_axes_0, keep_dims = var_4030_keep_dims_0, x = var_4028_cast_fp16)[name = tensor("op_4030_cast_fp16")]; tensor var_4031_to_fp16 = const()[name = tensor("op_4031_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_4032_cast_fp16 = add(x = var_4030_cast_fp16, y = var_4031_to_fp16)[name = tensor("op_4032_cast_fp16")]; tensor var_4033_epsilon_0 = const()[name = tensor("op_4033_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_4033_cast_fp16 = rsqrt(epsilon = var_4033_epsilon_0, x = var_4032_cast_fp16)[name = tensor("op_4033_cast_fp16")]; tensor output_421_cast_fp16 = mul(x = x_419, y = var_4033_cast_fp16)[name = tensor("output_421_cast_fp16")]; tensor var_4037_to_fp16 = const()[name = tensor("op_4037_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940568704)))]; tensor output_423_cast_fp16 = mul(x = output_421_cast_fp16, y = var_4037_to_fp16)[name = tensor("output_423_cast_fp16")]; tensor x_423 = add(x = x_407, y = output_423_cast_fp16)[name = tensor("x_423")]; tensor var_22_promoted_106_to_fp16 = const()[name = tensor("op_22_promoted_106_to_fp16"), val = tensor(0x1p+1)]; tensor var_4043_cast_fp16 = pow(x = x_423, y = var_22_promoted_106_to_fp16)[name = tensor("op_4043_cast_fp16")]; tensor var_4045_axes_0 = const()[name = tensor("op_4045_axes_0"), val = tensor([-1])]; tensor var_4045_keep_dims_0 = const()[name = tensor("op_4045_keep_dims_0"), val = tensor(true)]; tensor var_4045_cast_fp16 = reduce_mean(axes = var_4045_axes_0, keep_dims = var_4045_keep_dims_0, x = var_4043_cast_fp16)[name = tensor("op_4045_cast_fp16")]; tensor var_4046_to_fp16 = const()[name = tensor("op_4046_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_4047_cast_fp16 = add(x = var_4045_cast_fp16, y = var_4046_to_fp16)[name = tensor("op_4047_cast_fp16")]; tensor var_4048_epsilon_0 = const()[name = tensor("op_4048_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_4048_cast_fp16 = rsqrt(epsilon = var_4048_epsilon_0, x = var_4047_cast_fp16)[name = tensor("op_4048_cast_fp16")]; tensor output_425_cast_fp16 = mul(x = x_423, y = var_4048_cast_fp16)[name = tensor("output_425_cast_fp16")]; tensor var_4052_to_fp16 = const()[name = tensor("op_4052_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940573888)))]; tensor output_427_cast_fp16 = mul(x = output_425_cast_fp16, y = var_4052_to_fp16)[name = tensor("output_427_cast_fp16")]; tensor input_213 = linear(bias = linear_4_bias_0, weight = wrapped_model_language_model_layers_17_mlp_gate_proj_weight_palettized, x = output_427_cast_fp16)[name = tensor("linear_123")]; tensor var_4060_mode_0 = const()[name = tensor("op_4060_mode_0"), val = tensor("TANH_APPROXIMATION")]; tensor var_4060 = gelu(mode = var_4060_mode_0, x = input_213)[name = tensor("op_4060")]; tensor var_4062 = linear(bias = linear_4_bias_0, weight = wrapped_model_language_model_layers_17_mlp_up_proj_weight_palettized, x = output_427_cast_fp16)[name = tensor("linear_124")]; tensor input_215 = mul(x = var_4060, y = var_4062)[name = tensor("input_215")]; tensor x_427 = linear(bias = linear_3_bias_0, weight = wrapped_model_language_model_layers_17_mlp_down_proj_weight_palettized, x = input_215)[name = tensor("linear_125")]; tensor var_22_promoted_107_to_fp16 = const()[name = tensor("op_22_promoted_107_to_fp16"), val = tensor(0x1p+1)]; tensor var_4068_cast_fp16 = pow(x = x_427, y = var_22_promoted_107_to_fp16)[name = tensor("op_4068_cast_fp16")]; tensor var_4070_axes_0 = const()[name = tensor("op_4070_axes_0"), val = tensor([-1])]; tensor var_4070_keep_dims_0 = const()[name = tensor("op_4070_keep_dims_0"), val = tensor(true)]; tensor var_4070_cast_fp16 = reduce_mean(axes = var_4070_axes_0, keep_dims = var_4070_keep_dims_0, x = var_4068_cast_fp16)[name = tensor("op_4070_cast_fp16")]; tensor var_4071_to_fp16 = const()[name = tensor("op_4071_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_4072_cast_fp16 = add(x = var_4070_cast_fp16, y = var_4071_to_fp16)[name = tensor("op_4072_cast_fp16")]; tensor var_4073_epsilon_0 = const()[name = tensor("op_4073_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_4073_cast_fp16 = rsqrt(epsilon = var_4073_epsilon_0, x = var_4072_cast_fp16)[name = tensor("op_4073_cast_fp16")]; tensor output_429_cast_fp16 = mul(x = x_427, y = var_4073_cast_fp16)[name = tensor("output_429_cast_fp16")]; tensor var_4077_to_fp16 = const()[name = tensor("op_4077_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940579072)))]; tensor output_431_cast_fp16 = mul(x = output_429_cast_fp16, y = var_4077_to_fp16)[name = tensor("output_431_cast_fp16")]; tensor x_431 = add(x = x_423, y = output_431_cast_fp16)[name = tensor("x_431")]; tensor var_22_promoted_108_to_fp16 = const()[name = tensor("op_22_promoted_108_to_fp16"), val = tensor(0x1p+1)]; tensor var_4089_cast_fp16 = pow(x = x_431, y = var_22_promoted_108_to_fp16)[name = tensor("op_4089_cast_fp16")]; tensor var_4091_axes_0 = const()[name = tensor("op_4091_axes_0"), val = tensor([-1])]; tensor var_4091_keep_dims_0 = const()[name = tensor("op_4091_keep_dims_0"), val = tensor(true)]; tensor var_4091_cast_fp16 = reduce_mean(axes = var_4091_axes_0, keep_dims = var_4091_keep_dims_0, x = var_4089_cast_fp16)[name = tensor("op_4091_cast_fp16")]; tensor var_4092_to_fp16 = const()[name = tensor("op_4092_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_4093_cast_fp16 = add(x = var_4091_cast_fp16, y = var_4092_to_fp16)[name = tensor("op_4093_cast_fp16")]; tensor var_4094_epsilon_0 = const()[name = tensor("op_4094_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_4094_cast_fp16 = rsqrt(epsilon = var_4094_epsilon_0, x = var_4093_cast_fp16)[name = tensor("op_4094_cast_fp16")]; tensor output_433_cast_fp16 = mul(x = x_431, y = var_4094_cast_fp16)[name = tensor("output_433_cast_fp16")]; tensor var_4098_to_fp16 = const()[name = tensor("op_4098_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940584256)))]; tensor output_435_cast_fp16 = mul(x = output_433_cast_fp16, y = var_4098_to_fp16)[name = tensor("output_435_cast_fp16")]; tensor var_4110 = linear(bias = linear_0_bias_0, weight = wrapped_model_language_model_layers_18_self_attn_q_proj_weight_palettized, x = output_435_cast_fp16)[name = tensor("linear_126")]; tensor var_4111 = const()[name = tensor("op_4111"), val = tensor([1, 256, -1, 256])]; tensor var_4112 = reshape(shape = var_4111, x = var_4110)[name = tensor("op_4112")]; tensor x_435_perm_0 = const()[name = tensor("x_435_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_4115 = linear(bias = linear_1_bias_0, weight = wrapped_model_language_model_layers_18_self_attn_k_proj_weight_palettized, x = output_435_cast_fp16)[name = tensor("linear_127")]; tensor var_4116 = const()[name = tensor("op_4116"), val = tensor([1, 256, -1, 256])]; tensor var_4117 = reshape(shape = var_4116, x = var_4115)[name = tensor("op_4117")]; tensor x_439_perm_0 = const()[name = tensor("x_439_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_4120 = linear(bias = linear_1_bias_0, weight = wrapped_model_language_model_layers_18_self_attn_v_proj_weight_palettized, x = output_435_cast_fp16)[name = tensor("linear_128")]; tensor var_4121 = const()[name = tensor("op_4121"), val = tensor([1, 256, -1, 256])]; tensor var_4122 = reshape(shape = var_4121, x = var_4120)[name = tensor("op_4122")]; tensor hidden_states_259_perm_0 = const()[name = tensor("hidden_states_259_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_22_promoted_109_to_fp16 = const()[name = tensor("op_22_promoted_109_to_fp16"), val = tensor(0x1p+1)]; tensor x_435 = transpose(perm = x_435_perm_0, x = var_4112)[name = tensor("transpose_63")]; tensor var_4126_cast_fp16 = pow(x = x_435, y = var_22_promoted_109_to_fp16)[name = tensor("op_4126_cast_fp16")]; tensor var_4128_axes_0 = const()[name = tensor("op_4128_axes_0"), val = tensor([-1])]; tensor var_4128_keep_dims_0 = const()[name = tensor("op_4128_keep_dims_0"), val = tensor(true)]; tensor var_4128_cast_fp16 = reduce_mean(axes = var_4128_axes_0, keep_dims = var_4128_keep_dims_0, x = var_4126_cast_fp16)[name = tensor("op_4128_cast_fp16")]; tensor var_4129_to_fp16 = const()[name = tensor("op_4129_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_4130_cast_fp16 = add(x = var_4128_cast_fp16, y = var_4129_to_fp16)[name = tensor("op_4130_cast_fp16")]; tensor var_4131_epsilon_0 = const()[name = tensor("op_4131_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_4131_cast_fp16 = rsqrt(epsilon = var_4131_epsilon_0, x = var_4130_cast_fp16)[name = tensor("op_4131_cast_fp16")]; tensor output_437_cast_fp16 = mul(x = x_435, y = var_4131_cast_fp16)[name = tensor("output_437_cast_fp16")]; tensor var_4135_to_fp16 = const()[name = tensor("op_4135_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940589440)))]; tensor output_439_cast_fp16 = mul(x = output_437_cast_fp16, y = var_4135_to_fp16)[name = tensor("output_439_cast_fp16")]; tensor var_22_promoted_110_to_fp16 = const()[name = tensor("op_22_promoted_110_to_fp16"), val = tensor(0x1p+1)]; tensor x_439 = transpose(perm = x_439_perm_0, x = var_4117)[name = tensor("transpose_62")]; tensor var_4140_cast_fp16 = pow(x = x_439, y = var_22_promoted_110_to_fp16)[name = tensor("op_4140_cast_fp16")]; tensor var_4142_axes_0 = const()[name = tensor("op_4142_axes_0"), val = tensor([-1])]; tensor var_4142_keep_dims_0 = const()[name = tensor("op_4142_keep_dims_0"), val = tensor(true)]; tensor var_4142_cast_fp16 = reduce_mean(axes = var_4142_axes_0, keep_dims = var_4142_keep_dims_0, x = var_4140_cast_fp16)[name = tensor("op_4142_cast_fp16")]; tensor var_4143_to_fp16 = const()[name = tensor("op_4143_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_4144_cast_fp16 = add(x = var_4142_cast_fp16, y = var_4143_to_fp16)[name = tensor("op_4144_cast_fp16")]; tensor var_4145_epsilon_0 = const()[name = tensor("op_4145_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_4145_cast_fp16 = rsqrt(epsilon = var_4145_epsilon_0, x = var_4144_cast_fp16)[name = tensor("op_4145_cast_fp16")]; tensor output_441_cast_fp16 = mul(x = x_439, y = var_4145_cast_fp16)[name = tensor("output_441_cast_fp16")]; tensor var_4149_to_fp16 = const()[name = tensor("op_4149_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940590016)))]; tensor output_443_cast_fp16 = mul(x = output_441_cast_fp16, y = var_4149_to_fp16)[name = tensor("output_443_cast_fp16")]; tensor var_4154 = mul(x = output_439_cast_fp16, y = cos_7_palettized)[name = tensor("op_4154")]; tensor x1_73_begin_0 = const()[name = tensor("x1_73_begin_0"), val = tensor([0, 0, 0, 0])]; tensor x1_73_end_0 = const()[name = tensor("x1_73_end_0"), val = tensor([1, 8, 256, 128])]; tensor x1_73_end_mask_0 = const()[name = tensor("x1_73_end_mask_0"), val = tensor([true, true, true, false])]; tensor x1_73 = slice_by_index(begin = x1_73_begin_0, end = x1_73_end_0, end_mask = x1_73_end_mask_0, x = output_439_cast_fp16)[name = tensor("x1_73")]; tensor x2_73_begin_0 = const()[name = tensor("x2_73_begin_0"), val = tensor([0, 0, 0, 128])]; tensor x2_73_end_0 = const()[name = tensor("x2_73_end_0"), val = tensor([1, 8, 256, 256])]; tensor x2_73_end_mask_0 = const()[name = tensor("x2_73_end_mask_0"), val = tensor([true, true, true, true])]; tensor x2_73 = slice_by_index(begin = x2_73_begin_0, end = x2_73_end_0, end_mask = x2_73_end_mask_0, x = output_439_cast_fp16)[name = tensor("x2_73")]; tensor const_449_promoted = const()[name = tensor("const_449_promoted"), val = tensor(-0x1p+0)]; tensor var_4165 = mul(x = x2_73, y = const_449_promoted)[name = tensor("op_4165")]; tensor var_4167_interleave_0 = const()[name = tensor("op_4167_interleave_0"), val = tensor(false)]; tensor var_4167 = concat(axis = var_24, interleave = var_4167_interleave_0, values = (var_4165, x1_73))[name = tensor("op_4167")]; tensor var_4168 = mul(x = var_4167, y = sin_7_palettized)[name = tensor("op_4168")]; tensor query_37 = add(x = var_4154, y = var_4168)[name = tensor("query_37")]; tensor var_4170 = mul(x = output_443_cast_fp16, y = cos_7_palettized)[name = tensor("op_4170")]; tensor x1_75_begin_0 = const()[name = tensor("x1_75_begin_0"), val = tensor([0, 0, 0, 0])]; tensor x1_75_end_0 = const()[name = tensor("x1_75_end_0"), val = tensor([1, 4, 256, 128])]; tensor x1_75_end_mask_0 = const()[name = tensor("x1_75_end_mask_0"), val = tensor([true, true, true, false])]; tensor x1_75 = slice_by_index(begin = x1_75_begin_0, end = x1_75_end_0, end_mask = x1_75_end_mask_0, x = output_443_cast_fp16)[name = tensor("x1_75")]; tensor x2_75_begin_0 = const()[name = tensor("x2_75_begin_0"), val = tensor([0, 0, 0, 128])]; tensor x2_75_end_0 = const()[name = tensor("x2_75_end_0"), val = tensor([1, 4, 256, 256])]; tensor x2_75_end_mask_0 = const()[name = tensor("x2_75_end_mask_0"), val = tensor([true, true, true, true])]; tensor x2_75 = slice_by_index(begin = x2_75_begin_0, end = x2_75_end_0, end_mask = x2_75_end_mask_0, x = output_443_cast_fp16)[name = tensor("x2_75")]; tensor const_452_promoted = const()[name = tensor("const_452_promoted"), val = tensor(-0x1p+0)]; tensor var_4181 = mul(x = x2_75, y = const_452_promoted)[name = tensor("op_4181")]; tensor var_4183_interleave_0 = const()[name = tensor("op_4183_interleave_0"), val = tensor(false)]; tensor var_4183 = concat(axis = var_24, interleave = var_4183_interleave_0, values = (var_4181, x1_75))[name = tensor("op_4183")]; tensor var_4184 = mul(x = var_4183, y = sin_7_palettized)[name = tensor("op_4184")]; tensor hidden_states_255 = add(x = var_4170, y = var_4184)[name = tensor("hidden_states_255")]; tensor var_4193_axes_0 = const()[name = tensor("op_4193_axes_0"), val = tensor([2])]; tensor var_4193 = expand_dims(axes = var_4193_axes_0, x = hidden_states_255)[name = tensor("op_4193")]; tensor hidden_states_257_reps_0 = const()[name = tensor("hidden_states_257_reps_0"), val = tensor([1, 1, 2, 1, 1])]; tensor hidden_states_257 = tile(reps = hidden_states_257_reps_0, x = var_4193)[name = tensor("hidden_states_257")]; tensor var_4201 = const()[name = tensor("op_4201"), val = tensor([1, 8, 256, 256])]; tensor key_states_37 = reshape(shape = var_4201, x = hidden_states_257)[name = tensor("key_states_37")]; tensor var_4210_axes_0 = const()[name = tensor("op_4210_axes_0"), val = tensor([2])]; tensor hidden_states_259 = transpose(perm = hidden_states_259_perm_0, x = var_4122)[name = tensor("transpose_61")]; tensor var_4210 = expand_dims(axes = var_4210_axes_0, x = hidden_states_259)[name = tensor("op_4210")]; tensor hidden_states_261_reps_0 = const()[name = tensor("hidden_states_261_reps_0"), val = tensor([1, 1, 2, 1, 1])]; tensor hidden_states_261 = tile(reps = hidden_states_261_reps_0, x = var_4210)[name = tensor("hidden_states_261")]; tensor var_4218 = const()[name = tensor("op_4218"), val = tensor([1, 8, 256, 256])]; tensor value_states_37 = reshape(shape = var_4218, x = hidden_states_261)[name = tensor("value_states_37")]; tensor var_4221_transpose_x_1 = const()[name = tensor("op_4221_transpose_x_1"), val = tensor(false)]; tensor var_4221_transpose_y_1 = const()[name = tensor("op_4221_transpose_y_1"), val = tensor(true)]; tensor var_4221 = matmul(transpose_x = var_4221_transpose_x_1, transpose_y = var_4221_transpose_y_1, x = query_37, y = key_states_37)[name = tensor("op_4221")]; tensor var_4222_to_fp16 = const()[name = tensor("op_4222_to_fp16"), val = tensor(0x1p-4)]; tensor attn_weights_73_cast_fp16 = mul(x = var_4221, y = var_4222_to_fp16)[name = tensor("attn_weights_73_cast_fp16")]; tensor input_217_cast_fp16 = add(x = attn_weights_73_cast_fp16, y = attention_mask_to_fp16_palettized)[name = tensor("input_217_cast_fp16")]; tensor var_4230_cast_fp16 = softmax(axis = var_24, x = input_217_cast_fp16)[name = tensor("op_4230_cast_fp16")]; tensor attn_output_73_transpose_x_0 = const()[name = tensor("attn_output_73_transpose_x_0"), val = tensor(false)]; tensor attn_output_73_transpose_y_0 = const()[name = tensor("attn_output_73_transpose_y_0"), val = tensor(false)]; tensor attn_output_73 = matmul(transpose_x = attn_output_73_transpose_x_0, transpose_y = attn_output_73_transpose_y_0, x = var_4230_cast_fp16, y = value_states_37)[name = tensor("attn_output_73")]; tensor var_4234_perm_0 = const()[name = tensor("op_4234_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_4236 = const()[name = tensor("op_4236"), val = tensor([1, 256, -1])]; tensor var_4234 = transpose(perm = var_4234_perm_0, x = attn_output_73)[name = tensor("transpose_60")]; tensor var_4237 = reshape(shape = var_4236, x = var_4234)[name = tensor("op_4237")]; tensor x_443 = linear(bias = linear_3_bias_0, weight = wrapped_model_language_model_layers_18_self_attn_o_proj_weight_palettized, x = var_4237)[name = tensor("linear_129")]; tensor var_22_promoted_111_to_fp16 = const()[name = tensor("op_22_promoted_111_to_fp16"), val = tensor(0x1p+1)]; tensor var_4243_cast_fp16 = pow(x = x_443, y = var_22_promoted_111_to_fp16)[name = tensor("op_4243_cast_fp16")]; tensor var_4245_axes_0 = const()[name = tensor("op_4245_axes_0"), val = tensor([-1])]; tensor var_4245_keep_dims_0 = const()[name = tensor("op_4245_keep_dims_0"), val = tensor(true)]; tensor var_4245_cast_fp16 = reduce_mean(axes = var_4245_axes_0, keep_dims = var_4245_keep_dims_0, x = var_4243_cast_fp16)[name = tensor("op_4245_cast_fp16")]; tensor var_4246_to_fp16 = const()[name = tensor("op_4246_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_4247_cast_fp16 = add(x = var_4245_cast_fp16, y = var_4246_to_fp16)[name = tensor("op_4247_cast_fp16")]; tensor var_4248_epsilon_0 = const()[name = tensor("op_4248_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_4248_cast_fp16 = rsqrt(epsilon = var_4248_epsilon_0, x = var_4247_cast_fp16)[name = tensor("op_4248_cast_fp16")]; tensor output_445_cast_fp16 = mul(x = x_443, y = var_4248_cast_fp16)[name = tensor("output_445_cast_fp16")]; tensor var_4252_to_fp16 = const()[name = tensor("op_4252_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940590592)))]; tensor output_447_cast_fp16 = mul(x = output_445_cast_fp16, y = var_4252_to_fp16)[name = tensor("output_447_cast_fp16")]; tensor x_447 = add(x = x_431, y = output_447_cast_fp16)[name = tensor("x_447")]; tensor var_22_promoted_112_to_fp16 = const()[name = tensor("op_22_promoted_112_to_fp16"), val = tensor(0x1p+1)]; tensor var_4258_cast_fp16 = pow(x = x_447, y = var_22_promoted_112_to_fp16)[name = tensor("op_4258_cast_fp16")]; tensor var_4260_axes_0 = const()[name = tensor("op_4260_axes_0"), val = tensor([-1])]; tensor var_4260_keep_dims_0 = const()[name = tensor("op_4260_keep_dims_0"), val = tensor(true)]; tensor var_4260_cast_fp16 = reduce_mean(axes = var_4260_axes_0, keep_dims = var_4260_keep_dims_0, x = var_4258_cast_fp16)[name = tensor("op_4260_cast_fp16")]; tensor var_4261_to_fp16 = const()[name = tensor("op_4261_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_4262_cast_fp16 = add(x = var_4260_cast_fp16, y = var_4261_to_fp16)[name = tensor("op_4262_cast_fp16")]; tensor var_4263_epsilon_0 = const()[name = tensor("op_4263_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_4263_cast_fp16 = rsqrt(epsilon = var_4263_epsilon_0, x = var_4262_cast_fp16)[name = tensor("op_4263_cast_fp16")]; tensor output_449_cast_fp16 = mul(x = x_447, y = var_4263_cast_fp16)[name = tensor("output_449_cast_fp16")]; tensor var_4267_to_fp16 = const()[name = tensor("op_4267_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940595776)))]; tensor output_451_cast_fp16 = mul(x = output_449_cast_fp16, y = var_4267_to_fp16)[name = tensor("output_451_cast_fp16")]; tensor input_225 = linear(bias = linear_4_bias_0, weight = wrapped_model_language_model_layers_18_mlp_gate_proj_weight_palettized, x = output_451_cast_fp16)[name = tensor("linear_130")]; tensor var_4275_mode_0 = const()[name = tensor("op_4275_mode_0"), val = tensor("TANH_APPROXIMATION")]; tensor var_4275 = gelu(mode = var_4275_mode_0, x = input_225)[name = tensor("op_4275")]; tensor var_4277 = linear(bias = linear_4_bias_0, weight = wrapped_model_language_model_layers_18_mlp_up_proj_weight_palettized, x = output_451_cast_fp16)[name = tensor("linear_131")]; tensor input_227 = mul(x = var_4275, y = var_4277)[name = tensor("input_227")]; tensor x_451 = linear(bias = linear_3_bias_0, weight = wrapped_model_language_model_layers_18_mlp_down_proj_weight_palettized, x = input_227)[name = tensor("linear_132")]; tensor var_22_promoted_113_to_fp16 = const()[name = tensor("op_22_promoted_113_to_fp16"), val = tensor(0x1p+1)]; tensor var_4283_cast_fp16 = pow(x = x_451, y = var_22_promoted_113_to_fp16)[name = tensor("op_4283_cast_fp16")]; tensor var_4285_axes_0 = const()[name = tensor("op_4285_axes_0"), val = tensor([-1])]; tensor var_4285_keep_dims_0 = const()[name = tensor("op_4285_keep_dims_0"), val = tensor(true)]; tensor var_4285_cast_fp16 = reduce_mean(axes = var_4285_axes_0, keep_dims = var_4285_keep_dims_0, x = var_4283_cast_fp16)[name = tensor("op_4285_cast_fp16")]; tensor var_4286_to_fp16 = const()[name = tensor("op_4286_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_4287_cast_fp16 = add(x = var_4285_cast_fp16, y = var_4286_to_fp16)[name = tensor("op_4287_cast_fp16")]; tensor var_4288_epsilon_0 = const()[name = tensor("op_4288_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_4288_cast_fp16 = rsqrt(epsilon = var_4288_epsilon_0, x = var_4287_cast_fp16)[name = tensor("op_4288_cast_fp16")]; tensor output_453_cast_fp16 = mul(x = x_451, y = var_4288_cast_fp16)[name = tensor("output_453_cast_fp16")]; tensor var_4292_to_fp16 = const()[name = tensor("op_4292_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940600960)))]; tensor output_455_cast_fp16 = mul(x = output_453_cast_fp16, y = var_4292_to_fp16)[name = tensor("output_455_cast_fp16")]; tensor x_455 = add(x = x_447, y = output_455_cast_fp16)[name = tensor("x_455")]; tensor var_22_promoted_114_to_fp16 = const()[name = tensor("op_22_promoted_114_to_fp16"), val = tensor(0x1p+1)]; tensor var_4304_cast_fp16 = pow(x = x_455, y = var_22_promoted_114_to_fp16)[name = tensor("op_4304_cast_fp16")]; tensor var_4306_axes_0 = const()[name = tensor("op_4306_axes_0"), val = tensor([-1])]; tensor var_4306_keep_dims_0 = const()[name = tensor("op_4306_keep_dims_0"), val = tensor(true)]; tensor var_4306_cast_fp16 = reduce_mean(axes = var_4306_axes_0, keep_dims = var_4306_keep_dims_0, x = var_4304_cast_fp16)[name = tensor("op_4306_cast_fp16")]; tensor var_4307_to_fp16 = const()[name = tensor("op_4307_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_4308_cast_fp16 = add(x = var_4306_cast_fp16, y = var_4307_to_fp16)[name = tensor("op_4308_cast_fp16")]; tensor var_4309_epsilon_0 = const()[name = tensor("op_4309_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_4309_cast_fp16 = rsqrt(epsilon = var_4309_epsilon_0, x = var_4308_cast_fp16)[name = tensor("op_4309_cast_fp16")]; tensor output_457_cast_fp16 = mul(x = x_455, y = var_4309_cast_fp16)[name = tensor("output_457_cast_fp16")]; tensor var_4313_to_fp16 = const()[name = tensor("op_4313_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940606144)))]; tensor output_459_cast_fp16 = mul(x = output_457_cast_fp16, y = var_4313_to_fp16)[name = tensor("output_459_cast_fp16")]; tensor var_4325 = linear(bias = linear_0_bias_0, weight = wrapped_model_language_model_layers_19_self_attn_q_proj_weight_palettized, x = output_459_cast_fp16)[name = tensor("linear_133")]; tensor var_4326 = const()[name = tensor("op_4326"), val = tensor([1, 256, -1, 256])]; tensor var_4327 = reshape(shape = var_4326, x = var_4325)[name = tensor("op_4327")]; tensor x_459_perm_0 = const()[name = tensor("x_459_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_4330 = linear(bias = linear_1_bias_0, weight = wrapped_model_language_model_layers_19_self_attn_k_proj_weight_palettized, x = output_459_cast_fp16)[name = tensor("linear_134")]; tensor var_4331 = const()[name = tensor("op_4331"), val = tensor([1, 256, -1, 256])]; tensor var_4332 = reshape(shape = var_4331, x = var_4330)[name = tensor("op_4332")]; tensor x_463_perm_0 = const()[name = tensor("x_463_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_4335 = linear(bias = linear_1_bias_0, weight = wrapped_model_language_model_layers_19_self_attn_v_proj_weight_palettized, x = output_459_cast_fp16)[name = tensor("linear_135")]; tensor var_4336 = const()[name = tensor("op_4336"), val = tensor([1, 256, -1, 256])]; tensor var_4337 = reshape(shape = var_4336, x = var_4335)[name = tensor("op_4337")]; tensor hidden_states_273_perm_0 = const()[name = tensor("hidden_states_273_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_22_promoted_115_to_fp16 = const()[name = tensor("op_22_promoted_115_to_fp16"), val = tensor(0x1p+1)]; tensor x_459 = transpose(perm = x_459_perm_0, x = var_4327)[name = tensor("transpose_59")]; tensor var_4341_cast_fp16 = pow(x = x_459, y = var_22_promoted_115_to_fp16)[name = tensor("op_4341_cast_fp16")]; tensor var_4343_axes_0 = const()[name = tensor("op_4343_axes_0"), val = tensor([-1])]; tensor var_4343_keep_dims_0 = const()[name = tensor("op_4343_keep_dims_0"), val = tensor(true)]; tensor var_4343_cast_fp16 = reduce_mean(axes = var_4343_axes_0, keep_dims = var_4343_keep_dims_0, x = var_4341_cast_fp16)[name = tensor("op_4343_cast_fp16")]; tensor var_4344_to_fp16 = const()[name = tensor("op_4344_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_4345_cast_fp16 = add(x = var_4343_cast_fp16, y = var_4344_to_fp16)[name = tensor("op_4345_cast_fp16")]; tensor var_4346_epsilon_0 = const()[name = tensor("op_4346_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_4346_cast_fp16 = rsqrt(epsilon = var_4346_epsilon_0, x = var_4345_cast_fp16)[name = tensor("op_4346_cast_fp16")]; tensor output_461_cast_fp16 = mul(x = x_459, y = var_4346_cast_fp16)[name = tensor("output_461_cast_fp16")]; tensor var_4350_to_fp16 = const()[name = tensor("op_4350_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940611328)))]; tensor output_463_cast_fp16 = mul(x = output_461_cast_fp16, y = var_4350_to_fp16)[name = tensor("output_463_cast_fp16")]; tensor var_22_promoted_116_to_fp16 = const()[name = tensor("op_22_promoted_116_to_fp16"), val = tensor(0x1p+1)]; tensor x_463 = transpose(perm = x_463_perm_0, x = var_4332)[name = tensor("transpose_58")]; tensor var_4355_cast_fp16 = pow(x = x_463, y = var_22_promoted_116_to_fp16)[name = tensor("op_4355_cast_fp16")]; tensor var_4357_axes_0 = const()[name = tensor("op_4357_axes_0"), val = tensor([-1])]; tensor var_4357_keep_dims_0 = const()[name = tensor("op_4357_keep_dims_0"), val = tensor(true)]; tensor var_4357_cast_fp16 = reduce_mean(axes = var_4357_axes_0, keep_dims = var_4357_keep_dims_0, x = var_4355_cast_fp16)[name = tensor("op_4357_cast_fp16")]; tensor var_4358_to_fp16 = const()[name = tensor("op_4358_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_4359_cast_fp16 = add(x = var_4357_cast_fp16, y = var_4358_to_fp16)[name = tensor("op_4359_cast_fp16")]; tensor var_4360_epsilon_0 = const()[name = tensor("op_4360_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_4360_cast_fp16 = rsqrt(epsilon = var_4360_epsilon_0, x = var_4359_cast_fp16)[name = tensor("op_4360_cast_fp16")]; tensor output_465_cast_fp16 = mul(x = x_463, y = var_4360_cast_fp16)[name = tensor("output_465_cast_fp16")]; tensor var_4364_to_fp16 = const()[name = tensor("op_4364_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940611904)))]; tensor output_467_cast_fp16 = mul(x = output_465_cast_fp16, y = var_4364_to_fp16)[name = tensor("output_467_cast_fp16")]; tensor var_4369 = mul(x = output_463_cast_fp16, y = cos_7_palettized)[name = tensor("op_4369")]; tensor x1_77_begin_0 = const()[name = tensor("x1_77_begin_0"), val = tensor([0, 0, 0, 0])]; tensor x1_77_end_0 = const()[name = tensor("x1_77_end_0"), val = tensor([1, 8, 256, 128])]; tensor x1_77_end_mask_0 = const()[name = tensor("x1_77_end_mask_0"), val = tensor([true, true, true, false])]; tensor x1_77 = slice_by_index(begin = x1_77_begin_0, end = x1_77_end_0, end_mask = x1_77_end_mask_0, x = output_463_cast_fp16)[name = tensor("x1_77")]; tensor x2_77_begin_0 = const()[name = tensor("x2_77_begin_0"), val = tensor([0, 0, 0, 128])]; tensor x2_77_end_0 = const()[name = tensor("x2_77_end_0"), val = tensor([1, 8, 256, 256])]; tensor x2_77_end_mask_0 = const()[name = tensor("x2_77_end_mask_0"), val = tensor([true, true, true, true])]; tensor x2_77 = slice_by_index(begin = x2_77_begin_0, end = x2_77_end_0, end_mask = x2_77_end_mask_0, x = output_463_cast_fp16)[name = tensor("x2_77")]; tensor const_472_promoted = const()[name = tensor("const_472_promoted"), val = tensor(-0x1p+0)]; tensor var_4380 = mul(x = x2_77, y = const_472_promoted)[name = tensor("op_4380")]; tensor var_4382_interleave_0 = const()[name = tensor("op_4382_interleave_0"), val = tensor(false)]; tensor var_4382 = concat(axis = var_24, interleave = var_4382_interleave_0, values = (var_4380, x1_77))[name = tensor("op_4382")]; tensor var_4383 = mul(x = var_4382, y = sin_7_palettized)[name = tensor("op_4383")]; tensor query_39 = add(x = var_4369, y = var_4383)[name = tensor("query_39")]; tensor var_4385 = mul(x = output_467_cast_fp16, y = cos_7_palettized)[name = tensor("op_4385")]; tensor x1_79_begin_0 = const()[name = tensor("x1_79_begin_0"), val = tensor([0, 0, 0, 0])]; tensor x1_79_end_0 = const()[name = tensor("x1_79_end_0"), val = tensor([1, 4, 256, 128])]; tensor x1_79_end_mask_0 = const()[name = tensor("x1_79_end_mask_0"), val = tensor([true, true, true, false])]; tensor x1_79 = slice_by_index(begin = x1_79_begin_0, end = x1_79_end_0, end_mask = x1_79_end_mask_0, x = output_467_cast_fp16)[name = tensor("x1_79")]; tensor x2_79_begin_0 = const()[name = tensor("x2_79_begin_0"), val = tensor([0, 0, 0, 128])]; tensor x2_79_end_0 = const()[name = tensor("x2_79_end_0"), val = tensor([1, 4, 256, 256])]; tensor x2_79_end_mask_0 = const()[name = tensor("x2_79_end_mask_0"), val = tensor([true, true, true, true])]; tensor x2_79 = slice_by_index(begin = x2_79_begin_0, end = x2_79_end_0, end_mask = x2_79_end_mask_0, x = output_467_cast_fp16)[name = tensor("x2_79")]; tensor const_475_promoted = const()[name = tensor("const_475_promoted"), val = tensor(-0x1p+0)]; tensor var_4396 = mul(x = x2_79, y = const_475_promoted)[name = tensor("op_4396")]; tensor var_4398_interleave_0 = const()[name = tensor("op_4398_interleave_0"), val = tensor(false)]; tensor var_4398 = concat(axis = var_24, interleave = var_4398_interleave_0, values = (var_4396, x1_79))[name = tensor("op_4398")]; tensor var_4399 = mul(x = var_4398, y = sin_7_palettized)[name = tensor("op_4399")]; tensor hidden_states_269 = add(x = var_4385, y = var_4399)[name = tensor("hidden_states_269")]; tensor var_4408_axes_0 = const()[name = tensor("op_4408_axes_0"), val = tensor([2])]; tensor var_4408 = expand_dims(axes = var_4408_axes_0, x = hidden_states_269)[name = tensor("op_4408")]; tensor hidden_states_271_reps_0 = const()[name = tensor("hidden_states_271_reps_0"), val = tensor([1, 1, 2, 1, 1])]; tensor hidden_states_271 = tile(reps = hidden_states_271_reps_0, x = var_4408)[name = tensor("hidden_states_271")]; tensor var_4416 = const()[name = tensor("op_4416"), val = tensor([1, 8, 256, 256])]; tensor key_states_39 = reshape(shape = var_4416, x = hidden_states_271)[name = tensor("key_states_39")]; tensor var_4425_axes_0 = const()[name = tensor("op_4425_axes_0"), val = tensor([2])]; tensor hidden_states_273 = transpose(perm = hidden_states_273_perm_0, x = var_4337)[name = tensor("transpose_57")]; tensor var_4425 = expand_dims(axes = var_4425_axes_0, x = hidden_states_273)[name = tensor("op_4425")]; tensor hidden_states_275_reps_0 = const()[name = tensor("hidden_states_275_reps_0"), val = tensor([1, 1, 2, 1, 1])]; tensor hidden_states_275 = tile(reps = hidden_states_275_reps_0, x = var_4425)[name = tensor("hidden_states_275")]; tensor var_4433 = const()[name = tensor("op_4433"), val = tensor([1, 8, 256, 256])]; tensor value_states_39 = reshape(shape = var_4433, x = hidden_states_275)[name = tensor("value_states_39")]; tensor var_4436_transpose_x_1 = const()[name = tensor("op_4436_transpose_x_1"), val = tensor(false)]; tensor var_4436_transpose_y_1 = const()[name = tensor("op_4436_transpose_y_1"), val = tensor(true)]; tensor var_4436 = matmul(transpose_x = var_4436_transpose_x_1, transpose_y = var_4436_transpose_y_1, x = query_39, y = key_states_39)[name = tensor("op_4436")]; tensor var_4437_to_fp16 = const()[name = tensor("op_4437_to_fp16"), val = tensor(0x1p-4)]; tensor attn_weights_77_cast_fp16 = mul(x = var_4436, y = var_4437_to_fp16)[name = tensor("attn_weights_77_cast_fp16")]; tensor input_229_cast_fp16 = add(x = attn_weights_77_cast_fp16, y = attention_mask_to_fp16_palettized)[name = tensor("input_229_cast_fp16")]; tensor var_4445_cast_fp16 = softmax(axis = var_24, x = input_229_cast_fp16)[name = tensor("op_4445_cast_fp16")]; tensor attn_output_77_transpose_x_0 = const()[name = tensor("attn_output_77_transpose_x_0"), val = tensor(false)]; tensor attn_output_77_transpose_y_0 = const()[name = tensor("attn_output_77_transpose_y_0"), val = tensor(false)]; tensor attn_output_77 = matmul(transpose_x = attn_output_77_transpose_x_0, transpose_y = attn_output_77_transpose_y_0, x = var_4445_cast_fp16, y = value_states_39)[name = tensor("attn_output_77")]; tensor var_4449_perm_0 = const()[name = tensor("op_4449_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_4451 = const()[name = tensor("op_4451"), val = tensor([1, 256, -1])]; tensor var_4449 = transpose(perm = var_4449_perm_0, x = attn_output_77)[name = tensor("transpose_56")]; tensor var_4452 = reshape(shape = var_4451, x = var_4449)[name = tensor("op_4452")]; tensor x_467 = linear(bias = linear_3_bias_0, weight = wrapped_model_language_model_layers_19_self_attn_o_proj_weight_palettized, x = var_4452)[name = tensor("linear_136")]; tensor var_22_promoted_117_to_fp16 = const()[name = tensor("op_22_promoted_117_to_fp16"), val = tensor(0x1p+1)]; tensor var_4458_cast_fp16 = pow(x = x_467, y = var_22_promoted_117_to_fp16)[name = tensor("op_4458_cast_fp16")]; tensor var_4460_axes_0 = const()[name = tensor("op_4460_axes_0"), val = tensor([-1])]; tensor var_4460_keep_dims_0 = const()[name = tensor("op_4460_keep_dims_0"), val = tensor(true)]; tensor var_4460_cast_fp16 = reduce_mean(axes = var_4460_axes_0, keep_dims = var_4460_keep_dims_0, x = var_4458_cast_fp16)[name = tensor("op_4460_cast_fp16")]; tensor var_4461_to_fp16 = const()[name = tensor("op_4461_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_4462_cast_fp16 = add(x = var_4460_cast_fp16, y = var_4461_to_fp16)[name = tensor("op_4462_cast_fp16")]; tensor var_4463_epsilon_0 = const()[name = tensor("op_4463_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_4463_cast_fp16 = rsqrt(epsilon = var_4463_epsilon_0, x = var_4462_cast_fp16)[name = tensor("op_4463_cast_fp16")]; tensor output_469_cast_fp16 = mul(x = x_467, y = var_4463_cast_fp16)[name = tensor("output_469_cast_fp16")]; tensor var_4467_to_fp16 = const()[name = tensor("op_4467_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940612480)))]; tensor output_471_cast_fp16 = mul(x = output_469_cast_fp16, y = var_4467_to_fp16)[name = tensor("output_471_cast_fp16")]; tensor x_471 = add(x = x_455, y = output_471_cast_fp16)[name = tensor("x_471")]; tensor var_22_promoted_118_to_fp16 = const()[name = tensor("op_22_promoted_118_to_fp16"), val = tensor(0x1p+1)]; tensor var_4473_cast_fp16 = pow(x = x_471, y = var_22_promoted_118_to_fp16)[name = tensor("op_4473_cast_fp16")]; tensor var_4475_axes_0 = const()[name = tensor("op_4475_axes_0"), val = tensor([-1])]; tensor var_4475_keep_dims_0 = const()[name = tensor("op_4475_keep_dims_0"), val = tensor(true)]; tensor var_4475_cast_fp16 = reduce_mean(axes = var_4475_axes_0, keep_dims = var_4475_keep_dims_0, x = var_4473_cast_fp16)[name = tensor("op_4475_cast_fp16")]; tensor var_4476_to_fp16 = const()[name = tensor("op_4476_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_4477_cast_fp16 = add(x = var_4475_cast_fp16, y = var_4476_to_fp16)[name = tensor("op_4477_cast_fp16")]; tensor var_4478_epsilon_0 = const()[name = tensor("op_4478_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_4478_cast_fp16 = rsqrt(epsilon = var_4478_epsilon_0, x = var_4477_cast_fp16)[name = tensor("op_4478_cast_fp16")]; tensor output_473_cast_fp16 = mul(x = x_471, y = var_4478_cast_fp16)[name = tensor("output_473_cast_fp16")]; tensor var_4482_to_fp16 = const()[name = tensor("op_4482_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940617664)))]; tensor output_475_cast_fp16 = mul(x = output_473_cast_fp16, y = var_4482_to_fp16)[name = tensor("output_475_cast_fp16")]; tensor input_237 = linear(bias = linear_4_bias_0, weight = wrapped_model_language_model_layers_19_mlp_gate_proj_weight_palettized, x = output_475_cast_fp16)[name = tensor("linear_137")]; tensor var_4490_mode_0 = const()[name = tensor("op_4490_mode_0"), val = tensor("TANH_APPROXIMATION")]; tensor var_4490 = gelu(mode = var_4490_mode_0, x = input_237)[name = tensor("op_4490")]; tensor var_4492 = linear(bias = linear_4_bias_0, weight = wrapped_model_language_model_layers_19_mlp_up_proj_weight_palettized, x = output_475_cast_fp16)[name = tensor("linear_138")]; tensor input_239 = mul(x = var_4490, y = var_4492)[name = tensor("input_239")]; tensor x_475 = linear(bias = linear_3_bias_0, weight = wrapped_model_language_model_layers_19_mlp_down_proj_weight_palettized, x = input_239)[name = tensor("linear_139")]; tensor var_22_promoted_119_to_fp16 = const()[name = tensor("op_22_promoted_119_to_fp16"), val = tensor(0x1p+1)]; tensor var_4498_cast_fp16 = pow(x = x_475, y = var_22_promoted_119_to_fp16)[name = tensor("op_4498_cast_fp16")]; tensor var_4500_axes_0 = const()[name = tensor("op_4500_axes_0"), val = tensor([-1])]; tensor var_4500_keep_dims_0 = const()[name = tensor("op_4500_keep_dims_0"), val = tensor(true)]; tensor var_4500_cast_fp16 = reduce_mean(axes = var_4500_axes_0, keep_dims = var_4500_keep_dims_0, x = var_4498_cast_fp16)[name = tensor("op_4500_cast_fp16")]; tensor var_4501_to_fp16 = const()[name = tensor("op_4501_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_4502_cast_fp16 = add(x = var_4500_cast_fp16, y = var_4501_to_fp16)[name = tensor("op_4502_cast_fp16")]; tensor var_4503_epsilon_0 = const()[name = tensor("op_4503_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_4503_cast_fp16 = rsqrt(epsilon = var_4503_epsilon_0, x = var_4502_cast_fp16)[name = tensor("op_4503_cast_fp16")]; tensor output_477_cast_fp16 = mul(x = x_475, y = var_4503_cast_fp16)[name = tensor("output_477_cast_fp16")]; tensor var_4507_to_fp16 = const()[name = tensor("op_4507_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940622848)))]; tensor output_479_cast_fp16 = mul(x = output_477_cast_fp16, y = var_4507_to_fp16)[name = tensor("output_479_cast_fp16")]; tensor x_479 = add(x = x_471, y = output_479_cast_fp16)[name = tensor("x_479")]; tensor var_22_promoted_120_to_fp16 = const()[name = tensor("op_22_promoted_120_to_fp16"), val = tensor(0x1p+1)]; tensor var_4519_cast_fp16 = pow(x = x_479, y = var_22_promoted_120_to_fp16)[name = tensor("op_4519_cast_fp16")]; tensor var_4521_axes_0 = const()[name = tensor("op_4521_axes_0"), val = tensor([-1])]; tensor var_4521_keep_dims_0 = const()[name = tensor("op_4521_keep_dims_0"), val = tensor(true)]; tensor var_4521_cast_fp16 = reduce_mean(axes = var_4521_axes_0, keep_dims = var_4521_keep_dims_0, x = var_4519_cast_fp16)[name = tensor("op_4521_cast_fp16")]; tensor var_4522_to_fp16 = const()[name = tensor("op_4522_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_4523_cast_fp16 = add(x = var_4521_cast_fp16, y = var_4522_to_fp16)[name = tensor("op_4523_cast_fp16")]; tensor var_4524_epsilon_0 = const()[name = tensor("op_4524_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_4524_cast_fp16 = rsqrt(epsilon = var_4524_epsilon_0, x = var_4523_cast_fp16)[name = tensor("op_4524_cast_fp16")]; tensor output_481_cast_fp16 = mul(x = x_479, y = var_4524_cast_fp16)[name = tensor("output_481_cast_fp16")]; tensor var_4528_to_fp16 = const()[name = tensor("op_4528_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940628032)))]; tensor output_483_cast_fp16 = mul(x = output_481_cast_fp16, y = var_4528_to_fp16)[name = tensor("output_483_cast_fp16")]; tensor var_4540 = linear(bias = linear_0_bias_0, weight = wrapped_model_language_model_layers_20_self_attn_q_proj_weight_palettized, x = output_483_cast_fp16)[name = tensor("linear_140")]; tensor var_4541 = const()[name = tensor("op_4541"), val = tensor([1, 256, -1, 256])]; tensor var_4542 = reshape(shape = var_4541, x = var_4540)[name = tensor("op_4542")]; tensor x_483_perm_0 = const()[name = tensor("x_483_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_4545 = linear(bias = linear_1_bias_0, weight = wrapped_model_language_model_layers_20_self_attn_k_proj_weight_palettized, x = output_483_cast_fp16)[name = tensor("linear_141")]; tensor var_4546 = const()[name = tensor("op_4546"), val = tensor([1, 256, -1, 256])]; tensor var_4547 = reshape(shape = var_4546, x = var_4545)[name = tensor("op_4547")]; tensor x_487_perm_0 = const()[name = tensor("x_487_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_4550 = linear(bias = linear_1_bias_0, weight = wrapped_model_language_model_layers_20_self_attn_v_proj_weight_palettized, x = output_483_cast_fp16)[name = tensor("linear_142")]; tensor var_4551 = const()[name = tensor("op_4551"), val = tensor([1, 256, -1, 256])]; tensor var_4552 = reshape(shape = var_4551, x = var_4550)[name = tensor("op_4552")]; tensor hidden_states_287_perm_0 = const()[name = tensor("hidden_states_287_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_22_promoted_121_to_fp16 = const()[name = tensor("op_22_promoted_121_to_fp16"), val = tensor(0x1p+1)]; tensor x_483 = transpose(perm = x_483_perm_0, x = var_4542)[name = tensor("transpose_55")]; tensor var_4556_cast_fp16 = pow(x = x_483, y = var_22_promoted_121_to_fp16)[name = tensor("op_4556_cast_fp16")]; tensor var_4558_axes_0 = const()[name = tensor("op_4558_axes_0"), val = tensor([-1])]; tensor var_4558_keep_dims_0 = const()[name = tensor("op_4558_keep_dims_0"), val = tensor(true)]; tensor var_4558_cast_fp16 = reduce_mean(axes = var_4558_axes_0, keep_dims = var_4558_keep_dims_0, x = var_4556_cast_fp16)[name = tensor("op_4558_cast_fp16")]; tensor var_4559_to_fp16 = const()[name = tensor("op_4559_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_4560_cast_fp16 = add(x = var_4558_cast_fp16, y = var_4559_to_fp16)[name = tensor("op_4560_cast_fp16")]; tensor var_4561_epsilon_0 = const()[name = tensor("op_4561_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_4561_cast_fp16 = rsqrt(epsilon = var_4561_epsilon_0, x = var_4560_cast_fp16)[name = tensor("op_4561_cast_fp16")]; tensor output_485_cast_fp16 = mul(x = x_483, y = var_4561_cast_fp16)[name = tensor("output_485_cast_fp16")]; tensor var_4565_to_fp16 = const()[name = tensor("op_4565_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940633216)))]; tensor output_487_cast_fp16 = mul(x = output_485_cast_fp16, y = var_4565_to_fp16)[name = tensor("output_487_cast_fp16")]; tensor var_22_promoted_122_to_fp16 = const()[name = tensor("op_22_promoted_122_to_fp16"), val = tensor(0x1p+1)]; tensor x_487 = transpose(perm = x_487_perm_0, x = var_4547)[name = tensor("transpose_54")]; tensor var_4570_cast_fp16 = pow(x = x_487, y = var_22_promoted_122_to_fp16)[name = tensor("op_4570_cast_fp16")]; tensor var_4572_axes_0 = const()[name = tensor("op_4572_axes_0"), val = tensor([-1])]; tensor var_4572_keep_dims_0 = const()[name = tensor("op_4572_keep_dims_0"), val = tensor(true)]; tensor var_4572_cast_fp16 = reduce_mean(axes = var_4572_axes_0, keep_dims = var_4572_keep_dims_0, x = var_4570_cast_fp16)[name = tensor("op_4572_cast_fp16")]; tensor var_4573_to_fp16 = const()[name = tensor("op_4573_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_4574_cast_fp16 = add(x = var_4572_cast_fp16, y = var_4573_to_fp16)[name = tensor("op_4574_cast_fp16")]; tensor var_4575_epsilon_0 = const()[name = tensor("op_4575_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_4575_cast_fp16 = rsqrt(epsilon = var_4575_epsilon_0, x = var_4574_cast_fp16)[name = tensor("op_4575_cast_fp16")]; tensor output_489_cast_fp16 = mul(x = x_487, y = var_4575_cast_fp16)[name = tensor("output_489_cast_fp16")]; tensor var_4579_to_fp16 = const()[name = tensor("op_4579_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940633792)))]; tensor output_491_cast_fp16 = mul(x = output_489_cast_fp16, y = var_4579_to_fp16)[name = tensor("output_491_cast_fp16")]; tensor var_4584 = mul(x = output_487_cast_fp16, y = cos_7_palettized)[name = tensor("op_4584")]; tensor x1_81_begin_0 = const()[name = tensor("x1_81_begin_0"), val = tensor([0, 0, 0, 0])]; tensor x1_81_end_0 = const()[name = tensor("x1_81_end_0"), val = tensor([1, 8, 256, 128])]; tensor x1_81_end_mask_0 = const()[name = tensor("x1_81_end_mask_0"), val = tensor([true, true, true, false])]; tensor x1_81 = slice_by_index(begin = x1_81_begin_0, end = x1_81_end_0, end_mask = x1_81_end_mask_0, x = output_487_cast_fp16)[name = tensor("x1_81")]; tensor x2_81_begin_0 = const()[name = tensor("x2_81_begin_0"), val = tensor([0, 0, 0, 128])]; tensor x2_81_end_0 = const()[name = tensor("x2_81_end_0"), val = tensor([1, 8, 256, 256])]; tensor x2_81_end_mask_0 = const()[name = tensor("x2_81_end_mask_0"), val = tensor([true, true, true, true])]; tensor x2_81 = slice_by_index(begin = x2_81_begin_0, end = x2_81_end_0, end_mask = x2_81_end_mask_0, x = output_487_cast_fp16)[name = tensor("x2_81")]; tensor const_495_promoted = const()[name = tensor("const_495_promoted"), val = tensor(-0x1p+0)]; tensor var_4595 = mul(x = x2_81, y = const_495_promoted)[name = tensor("op_4595")]; tensor var_4597_interleave_0 = const()[name = tensor("op_4597_interleave_0"), val = tensor(false)]; tensor var_4597 = concat(axis = var_24, interleave = var_4597_interleave_0, values = (var_4595, x1_81))[name = tensor("op_4597")]; tensor var_4598 = mul(x = var_4597, y = sin_7_palettized)[name = tensor("op_4598")]; tensor query_41 = add(x = var_4584, y = var_4598)[name = tensor("query_41")]; tensor var_4600 = mul(x = output_491_cast_fp16, y = cos_7_palettized)[name = tensor("op_4600")]; tensor x1_83_begin_0 = const()[name = tensor("x1_83_begin_0"), val = tensor([0, 0, 0, 0])]; tensor x1_83_end_0 = const()[name = tensor("x1_83_end_0"), val = tensor([1, 4, 256, 128])]; tensor x1_83_end_mask_0 = const()[name = tensor("x1_83_end_mask_0"), val = tensor([true, true, true, false])]; tensor x1_83 = slice_by_index(begin = x1_83_begin_0, end = x1_83_end_0, end_mask = x1_83_end_mask_0, x = output_491_cast_fp16)[name = tensor("x1_83")]; tensor x2_83_begin_0 = const()[name = tensor("x2_83_begin_0"), val = tensor([0, 0, 0, 128])]; tensor x2_83_end_0 = const()[name = tensor("x2_83_end_0"), val = tensor([1, 4, 256, 256])]; tensor x2_83_end_mask_0 = const()[name = tensor("x2_83_end_mask_0"), val = tensor([true, true, true, true])]; tensor x2_83 = slice_by_index(begin = x2_83_begin_0, end = x2_83_end_0, end_mask = x2_83_end_mask_0, x = output_491_cast_fp16)[name = tensor("x2_83")]; tensor const_498_promoted = const()[name = tensor("const_498_promoted"), val = tensor(-0x1p+0)]; tensor var_4611 = mul(x = x2_83, y = const_498_promoted)[name = tensor("op_4611")]; tensor var_4613_interleave_0 = const()[name = tensor("op_4613_interleave_0"), val = tensor(false)]; tensor var_4613 = concat(axis = var_24, interleave = var_4613_interleave_0, values = (var_4611, x1_83))[name = tensor("op_4613")]; tensor var_4614 = mul(x = var_4613, y = sin_7_palettized)[name = tensor("op_4614")]; tensor hidden_states_283 = add(x = var_4600, y = var_4614)[name = tensor("hidden_states_283")]; tensor var_4623_axes_0 = const()[name = tensor("op_4623_axes_0"), val = tensor([2])]; tensor var_4623 = expand_dims(axes = var_4623_axes_0, x = hidden_states_283)[name = tensor("op_4623")]; tensor hidden_states_285_reps_0 = const()[name = tensor("hidden_states_285_reps_0"), val = tensor([1, 1, 2, 1, 1])]; tensor hidden_states_285 = tile(reps = hidden_states_285_reps_0, x = var_4623)[name = tensor("hidden_states_285")]; tensor var_4631 = const()[name = tensor("op_4631"), val = tensor([1, 8, 256, 256])]; tensor key_states_41 = reshape(shape = var_4631, x = hidden_states_285)[name = tensor("key_states_41")]; tensor var_4640_axes_0 = const()[name = tensor("op_4640_axes_0"), val = tensor([2])]; tensor hidden_states_287 = transpose(perm = hidden_states_287_perm_0, x = var_4552)[name = tensor("transpose_53")]; tensor var_4640 = expand_dims(axes = var_4640_axes_0, x = hidden_states_287)[name = tensor("op_4640")]; tensor hidden_states_289_reps_0 = const()[name = tensor("hidden_states_289_reps_0"), val = tensor([1, 1, 2, 1, 1])]; tensor hidden_states_289 = tile(reps = hidden_states_289_reps_0, x = var_4640)[name = tensor("hidden_states_289")]; tensor var_4648 = const()[name = tensor("op_4648"), val = tensor([1, 8, 256, 256])]; tensor value_states_41 = reshape(shape = var_4648, x = hidden_states_289)[name = tensor("value_states_41")]; tensor var_4651_transpose_x_1 = const()[name = tensor("op_4651_transpose_x_1"), val = tensor(false)]; tensor var_4651_transpose_y_1 = const()[name = tensor("op_4651_transpose_y_1"), val = tensor(true)]; tensor var_4651 = matmul(transpose_x = var_4651_transpose_x_1, transpose_y = var_4651_transpose_y_1, x = query_41, y = key_states_41)[name = tensor("op_4651")]; tensor var_4652_to_fp16 = const()[name = tensor("op_4652_to_fp16"), val = tensor(0x1p-4)]; tensor attn_weights_81_cast_fp16 = mul(x = var_4651, y = var_4652_to_fp16)[name = tensor("attn_weights_81_cast_fp16")]; tensor input_241_cast_fp16 = add(x = attn_weights_81_cast_fp16, y = attention_mask_to_fp16_palettized)[name = tensor("input_241_cast_fp16")]; tensor var_4660_cast_fp16 = softmax(axis = var_24, x = input_241_cast_fp16)[name = tensor("op_4660_cast_fp16")]; tensor attn_output_81_transpose_x_0 = const()[name = tensor("attn_output_81_transpose_x_0"), val = tensor(false)]; tensor attn_output_81_transpose_y_0 = const()[name = tensor("attn_output_81_transpose_y_0"), val = tensor(false)]; tensor attn_output_81 = matmul(transpose_x = attn_output_81_transpose_x_0, transpose_y = attn_output_81_transpose_y_0, x = var_4660_cast_fp16, y = value_states_41)[name = tensor("attn_output_81")]; tensor var_4664_perm_0 = const()[name = tensor("op_4664_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_4666 = const()[name = tensor("op_4666"), val = tensor([1, 256, -1])]; tensor var_4664 = transpose(perm = var_4664_perm_0, x = attn_output_81)[name = tensor("transpose_52")]; tensor var_4667 = reshape(shape = var_4666, x = var_4664)[name = tensor("op_4667")]; tensor x_491 = linear(bias = linear_3_bias_0, weight = wrapped_model_language_model_layers_20_self_attn_o_proj_weight_palettized, x = var_4667)[name = tensor("linear_143")]; tensor var_22_promoted_123_to_fp16 = const()[name = tensor("op_22_promoted_123_to_fp16"), val = tensor(0x1p+1)]; tensor var_4673_cast_fp16 = pow(x = x_491, y = var_22_promoted_123_to_fp16)[name = tensor("op_4673_cast_fp16")]; tensor var_4675_axes_0 = const()[name = tensor("op_4675_axes_0"), val = tensor([-1])]; tensor var_4675_keep_dims_0 = const()[name = tensor("op_4675_keep_dims_0"), val = tensor(true)]; tensor var_4675_cast_fp16 = reduce_mean(axes = var_4675_axes_0, keep_dims = var_4675_keep_dims_0, x = var_4673_cast_fp16)[name = tensor("op_4675_cast_fp16")]; tensor var_4676_to_fp16 = const()[name = tensor("op_4676_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_4677_cast_fp16 = add(x = var_4675_cast_fp16, y = var_4676_to_fp16)[name = tensor("op_4677_cast_fp16")]; tensor var_4678_epsilon_0 = const()[name = tensor("op_4678_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_4678_cast_fp16 = rsqrt(epsilon = var_4678_epsilon_0, x = var_4677_cast_fp16)[name = tensor("op_4678_cast_fp16")]; tensor output_493_cast_fp16 = mul(x = x_491, y = var_4678_cast_fp16)[name = tensor("output_493_cast_fp16")]; tensor var_4682_to_fp16 = const()[name = tensor("op_4682_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940634368)))]; tensor output_495_cast_fp16 = mul(x = output_493_cast_fp16, y = var_4682_to_fp16)[name = tensor("output_495_cast_fp16")]; tensor x_495 = add(x = x_479, y = output_495_cast_fp16)[name = tensor("x_495")]; tensor var_22_promoted_124_to_fp16 = const()[name = tensor("op_22_promoted_124_to_fp16"), val = tensor(0x1p+1)]; tensor var_4688_cast_fp16 = pow(x = x_495, y = var_22_promoted_124_to_fp16)[name = tensor("op_4688_cast_fp16")]; tensor var_4690_axes_0 = const()[name = tensor("op_4690_axes_0"), val = tensor([-1])]; tensor var_4690_keep_dims_0 = const()[name = tensor("op_4690_keep_dims_0"), val = tensor(true)]; tensor var_4690_cast_fp16 = reduce_mean(axes = var_4690_axes_0, keep_dims = var_4690_keep_dims_0, x = var_4688_cast_fp16)[name = tensor("op_4690_cast_fp16")]; tensor var_4691_to_fp16 = const()[name = tensor("op_4691_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_4692_cast_fp16 = add(x = var_4690_cast_fp16, y = var_4691_to_fp16)[name = tensor("op_4692_cast_fp16")]; tensor var_4693_epsilon_0 = const()[name = tensor("op_4693_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_4693_cast_fp16 = rsqrt(epsilon = var_4693_epsilon_0, x = var_4692_cast_fp16)[name = tensor("op_4693_cast_fp16")]; tensor output_497_cast_fp16 = mul(x = x_495, y = var_4693_cast_fp16)[name = tensor("output_497_cast_fp16")]; tensor var_4697_to_fp16 = const()[name = tensor("op_4697_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940639552)))]; tensor output_499_cast_fp16 = mul(x = output_497_cast_fp16, y = var_4697_to_fp16)[name = tensor("output_499_cast_fp16")]; tensor input_249 = linear(bias = linear_4_bias_0, weight = wrapped_model_language_model_layers_20_mlp_gate_proj_weight_palettized, x = output_499_cast_fp16)[name = tensor("linear_144")]; tensor var_4705_mode_0 = const()[name = tensor("op_4705_mode_0"), val = tensor("TANH_APPROXIMATION")]; tensor var_4705 = gelu(mode = var_4705_mode_0, x = input_249)[name = tensor("op_4705")]; tensor var_4707 = linear(bias = linear_4_bias_0, weight = wrapped_model_language_model_layers_20_mlp_up_proj_weight_palettized, x = output_499_cast_fp16)[name = tensor("linear_145")]; tensor input_251 = mul(x = var_4705, y = var_4707)[name = tensor("input_251")]; tensor x_499 = linear(bias = linear_3_bias_0, weight = wrapped_model_language_model_layers_20_mlp_down_proj_weight_palettized, x = input_251)[name = tensor("linear_146")]; tensor var_22_promoted_125_to_fp16 = const()[name = tensor("op_22_promoted_125_to_fp16"), val = tensor(0x1p+1)]; tensor var_4713_cast_fp16 = pow(x = x_499, y = var_22_promoted_125_to_fp16)[name = tensor("op_4713_cast_fp16")]; tensor var_4715_axes_0 = const()[name = tensor("op_4715_axes_0"), val = tensor([-1])]; tensor var_4715_keep_dims_0 = const()[name = tensor("op_4715_keep_dims_0"), val = tensor(true)]; tensor var_4715_cast_fp16 = reduce_mean(axes = var_4715_axes_0, keep_dims = var_4715_keep_dims_0, x = var_4713_cast_fp16)[name = tensor("op_4715_cast_fp16")]; tensor var_4716_to_fp16 = const()[name = tensor("op_4716_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_4717_cast_fp16 = add(x = var_4715_cast_fp16, y = var_4716_to_fp16)[name = tensor("op_4717_cast_fp16")]; tensor var_4718_epsilon_0 = const()[name = tensor("op_4718_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_4718_cast_fp16 = rsqrt(epsilon = var_4718_epsilon_0, x = var_4717_cast_fp16)[name = tensor("op_4718_cast_fp16")]; tensor output_501_cast_fp16 = mul(x = x_499, y = var_4718_cast_fp16)[name = tensor("output_501_cast_fp16")]; tensor var_4722_to_fp16 = const()[name = tensor("op_4722_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940644736)))]; tensor output_503_cast_fp16 = mul(x = output_501_cast_fp16, y = var_4722_to_fp16)[name = tensor("output_503_cast_fp16")]; tensor x_503 = add(x = x_495, y = output_503_cast_fp16)[name = tensor("x_503")]; tensor var_22_promoted_126_to_fp16 = const()[name = tensor("op_22_promoted_126_to_fp16"), val = tensor(0x1p+1)]; tensor var_4734_cast_fp16 = pow(x = x_503, y = var_22_promoted_126_to_fp16)[name = tensor("op_4734_cast_fp16")]; tensor var_4736_axes_0 = const()[name = tensor("op_4736_axes_0"), val = tensor([-1])]; tensor var_4736_keep_dims_0 = const()[name = tensor("op_4736_keep_dims_0"), val = tensor(true)]; tensor var_4736_cast_fp16 = reduce_mean(axes = var_4736_axes_0, keep_dims = var_4736_keep_dims_0, x = var_4734_cast_fp16)[name = tensor("op_4736_cast_fp16")]; tensor var_4737_to_fp16 = const()[name = tensor("op_4737_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_4738_cast_fp16 = add(x = var_4736_cast_fp16, y = var_4737_to_fp16)[name = tensor("op_4738_cast_fp16")]; tensor var_4739_epsilon_0 = const()[name = tensor("op_4739_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_4739_cast_fp16 = rsqrt(epsilon = var_4739_epsilon_0, x = var_4738_cast_fp16)[name = tensor("op_4739_cast_fp16")]; tensor output_505_cast_fp16 = mul(x = x_503, y = var_4739_cast_fp16)[name = tensor("output_505_cast_fp16")]; tensor var_4743_to_fp16 = const()[name = tensor("op_4743_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940649920)))]; tensor output_507_cast_fp16 = mul(x = output_505_cast_fp16, y = var_4743_to_fp16)[name = tensor("output_507_cast_fp16")]; tensor var_4755 = linear(bias = linear_0_bias_0, weight = wrapped_model_language_model_layers_21_self_attn_q_proj_weight_palettized, x = output_507_cast_fp16)[name = tensor("linear_147")]; tensor var_4756 = const()[name = tensor("op_4756"), val = tensor([1, 256, -1, 256])]; tensor var_4757 = reshape(shape = var_4756, x = var_4755)[name = tensor("op_4757")]; tensor x_507_perm_0 = const()[name = tensor("x_507_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_4760 = linear(bias = linear_1_bias_0, weight = wrapped_model_language_model_layers_21_self_attn_k_proj_weight_palettized, x = output_507_cast_fp16)[name = tensor("linear_148")]; tensor var_4761 = const()[name = tensor("op_4761"), val = tensor([1, 256, -1, 256])]; tensor var_4762 = reshape(shape = var_4761, x = var_4760)[name = tensor("op_4762")]; tensor x_511_perm_0 = const()[name = tensor("x_511_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_4765 = linear(bias = linear_1_bias_0, weight = wrapped_model_language_model_layers_21_self_attn_v_proj_weight_palettized, x = output_507_cast_fp16)[name = tensor("linear_149")]; tensor var_4766 = const()[name = tensor("op_4766"), val = tensor([1, 256, -1, 256])]; tensor var_4767 = reshape(shape = var_4766, x = var_4765)[name = tensor("op_4767")]; tensor hidden_states_301_perm_0 = const()[name = tensor("hidden_states_301_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_22_promoted_127_to_fp16 = const()[name = tensor("op_22_promoted_127_to_fp16"), val = tensor(0x1p+1)]; tensor x_507 = transpose(perm = x_507_perm_0, x = var_4757)[name = tensor("transpose_51")]; tensor var_4771_cast_fp16 = pow(x = x_507, y = var_22_promoted_127_to_fp16)[name = tensor("op_4771_cast_fp16")]; tensor var_4773_axes_0 = const()[name = tensor("op_4773_axes_0"), val = tensor([-1])]; tensor var_4773_keep_dims_0 = const()[name = tensor("op_4773_keep_dims_0"), val = tensor(true)]; tensor var_4773_cast_fp16 = reduce_mean(axes = var_4773_axes_0, keep_dims = var_4773_keep_dims_0, x = var_4771_cast_fp16)[name = tensor("op_4773_cast_fp16")]; tensor var_4774_to_fp16 = const()[name = tensor("op_4774_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_4775_cast_fp16 = add(x = var_4773_cast_fp16, y = var_4774_to_fp16)[name = tensor("op_4775_cast_fp16")]; tensor var_4776_epsilon_0 = const()[name = tensor("op_4776_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_4776_cast_fp16 = rsqrt(epsilon = var_4776_epsilon_0, x = var_4775_cast_fp16)[name = tensor("op_4776_cast_fp16")]; tensor output_509_cast_fp16 = mul(x = x_507, y = var_4776_cast_fp16)[name = tensor("output_509_cast_fp16")]; tensor var_4780_to_fp16 = const()[name = tensor("op_4780_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940655104)))]; tensor output_511_cast_fp16 = mul(x = output_509_cast_fp16, y = var_4780_to_fp16)[name = tensor("output_511_cast_fp16")]; tensor var_22_promoted_128_to_fp16 = const()[name = tensor("op_22_promoted_128_to_fp16"), val = tensor(0x1p+1)]; tensor x_511 = transpose(perm = x_511_perm_0, x = var_4762)[name = tensor("transpose_50")]; tensor var_4785_cast_fp16 = pow(x = x_511, y = var_22_promoted_128_to_fp16)[name = tensor("op_4785_cast_fp16")]; tensor var_4787_axes_0 = const()[name = tensor("op_4787_axes_0"), val = tensor([-1])]; tensor var_4787_keep_dims_0 = const()[name = tensor("op_4787_keep_dims_0"), val = tensor(true)]; tensor var_4787_cast_fp16 = reduce_mean(axes = var_4787_axes_0, keep_dims = var_4787_keep_dims_0, x = var_4785_cast_fp16)[name = tensor("op_4787_cast_fp16")]; tensor var_4788_to_fp16 = const()[name = tensor("op_4788_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_4789_cast_fp16 = add(x = var_4787_cast_fp16, y = var_4788_to_fp16)[name = tensor("op_4789_cast_fp16")]; tensor var_4790_epsilon_0 = const()[name = tensor("op_4790_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_4790_cast_fp16 = rsqrt(epsilon = var_4790_epsilon_0, x = var_4789_cast_fp16)[name = tensor("op_4790_cast_fp16")]; tensor output_513_cast_fp16 = mul(x = x_511, y = var_4790_cast_fp16)[name = tensor("output_513_cast_fp16")]; tensor var_4794_to_fp16 = const()[name = tensor("op_4794_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940655680)))]; tensor output_515_cast_fp16 = mul(x = output_513_cast_fp16, y = var_4794_to_fp16)[name = tensor("output_515_cast_fp16")]; tensor var_4799 = mul(x = output_511_cast_fp16, y = cos_7_palettized)[name = tensor("op_4799")]; tensor x1_85_begin_0 = const()[name = tensor("x1_85_begin_0"), val = tensor([0, 0, 0, 0])]; tensor x1_85_end_0 = const()[name = tensor("x1_85_end_0"), val = tensor([1, 8, 256, 128])]; tensor x1_85_end_mask_0 = const()[name = tensor("x1_85_end_mask_0"), val = tensor([true, true, true, false])]; tensor x1_85 = slice_by_index(begin = x1_85_begin_0, end = x1_85_end_0, end_mask = x1_85_end_mask_0, x = output_511_cast_fp16)[name = tensor("x1_85")]; tensor x2_85_begin_0 = const()[name = tensor("x2_85_begin_0"), val = tensor([0, 0, 0, 128])]; tensor x2_85_end_0 = const()[name = tensor("x2_85_end_0"), val = tensor([1, 8, 256, 256])]; tensor x2_85_end_mask_0 = const()[name = tensor("x2_85_end_mask_0"), val = tensor([true, true, true, true])]; tensor x2_85 = slice_by_index(begin = x2_85_begin_0, end = x2_85_end_0, end_mask = x2_85_end_mask_0, x = output_511_cast_fp16)[name = tensor("x2_85")]; tensor const_518_promoted = const()[name = tensor("const_518_promoted"), val = tensor(-0x1p+0)]; tensor var_4810 = mul(x = x2_85, y = const_518_promoted)[name = tensor("op_4810")]; tensor var_4812_interleave_0 = const()[name = tensor("op_4812_interleave_0"), val = tensor(false)]; tensor var_4812 = concat(axis = var_24, interleave = var_4812_interleave_0, values = (var_4810, x1_85))[name = tensor("op_4812")]; tensor var_4813 = mul(x = var_4812, y = sin_7_palettized)[name = tensor("op_4813")]; tensor query_43 = add(x = var_4799, y = var_4813)[name = tensor("query_43")]; tensor var_4815 = mul(x = output_515_cast_fp16, y = cos_7_palettized)[name = tensor("op_4815")]; tensor x1_87_begin_0 = const()[name = tensor("x1_87_begin_0"), val = tensor([0, 0, 0, 0])]; tensor x1_87_end_0 = const()[name = tensor("x1_87_end_0"), val = tensor([1, 4, 256, 128])]; tensor x1_87_end_mask_0 = const()[name = tensor("x1_87_end_mask_0"), val = tensor([true, true, true, false])]; tensor x1_87 = slice_by_index(begin = x1_87_begin_0, end = x1_87_end_0, end_mask = x1_87_end_mask_0, x = output_515_cast_fp16)[name = tensor("x1_87")]; tensor x2_87_begin_0 = const()[name = tensor("x2_87_begin_0"), val = tensor([0, 0, 0, 128])]; tensor x2_87_end_0 = const()[name = tensor("x2_87_end_0"), val = tensor([1, 4, 256, 256])]; tensor x2_87_end_mask_0 = const()[name = tensor("x2_87_end_mask_0"), val = tensor([true, true, true, true])]; tensor x2_87 = slice_by_index(begin = x2_87_begin_0, end = x2_87_end_0, end_mask = x2_87_end_mask_0, x = output_515_cast_fp16)[name = tensor("x2_87")]; tensor const_521_promoted = const()[name = tensor("const_521_promoted"), val = tensor(-0x1p+0)]; tensor var_4826 = mul(x = x2_87, y = const_521_promoted)[name = tensor("op_4826")]; tensor var_4828_interleave_0 = const()[name = tensor("op_4828_interleave_0"), val = tensor(false)]; tensor var_4828 = concat(axis = var_24, interleave = var_4828_interleave_0, values = (var_4826, x1_87))[name = tensor("op_4828")]; tensor var_4829 = mul(x = var_4828, y = sin_7_palettized)[name = tensor("op_4829")]; tensor hidden_states_297 = add(x = var_4815, y = var_4829)[name = tensor("hidden_states_297")]; tensor var_4838_axes_0 = const()[name = tensor("op_4838_axes_0"), val = tensor([2])]; tensor var_4838 = expand_dims(axes = var_4838_axes_0, x = hidden_states_297)[name = tensor("op_4838")]; tensor hidden_states_299_reps_0 = const()[name = tensor("hidden_states_299_reps_0"), val = tensor([1, 1, 2, 1, 1])]; tensor hidden_states_299 = tile(reps = hidden_states_299_reps_0, x = var_4838)[name = tensor("hidden_states_299")]; tensor var_4846 = const()[name = tensor("op_4846"), val = tensor([1, 8, 256, 256])]; tensor key_states_43 = reshape(shape = var_4846, x = hidden_states_299)[name = tensor("key_states_43")]; tensor var_4855_axes_0 = const()[name = tensor("op_4855_axes_0"), val = tensor([2])]; tensor hidden_states_301 = transpose(perm = hidden_states_301_perm_0, x = var_4767)[name = tensor("transpose_49")]; tensor var_4855 = expand_dims(axes = var_4855_axes_0, x = hidden_states_301)[name = tensor("op_4855")]; tensor hidden_states_303_reps_0 = const()[name = tensor("hidden_states_303_reps_0"), val = tensor([1, 1, 2, 1, 1])]; tensor hidden_states_303 = tile(reps = hidden_states_303_reps_0, x = var_4855)[name = tensor("hidden_states_303")]; tensor var_4863 = const()[name = tensor("op_4863"), val = tensor([1, 8, 256, 256])]; tensor value_states_43 = reshape(shape = var_4863, x = hidden_states_303)[name = tensor("value_states_43")]; tensor var_4866_transpose_x_1 = const()[name = tensor("op_4866_transpose_x_1"), val = tensor(false)]; tensor var_4866_transpose_y_1 = const()[name = tensor("op_4866_transpose_y_1"), val = tensor(true)]; tensor var_4866 = matmul(transpose_x = var_4866_transpose_x_1, transpose_y = var_4866_transpose_y_1, x = query_43, y = key_states_43)[name = tensor("op_4866")]; tensor var_4867_to_fp16 = const()[name = tensor("op_4867_to_fp16"), val = tensor(0x1p-4)]; tensor attn_weights_85_cast_fp16 = mul(x = var_4866, y = var_4867_to_fp16)[name = tensor("attn_weights_85_cast_fp16")]; tensor input_253_cast_fp16 = add(x = attn_weights_85_cast_fp16, y = attention_mask_to_fp16_palettized)[name = tensor("input_253_cast_fp16")]; tensor var_4875_cast_fp16 = softmax(axis = var_24, x = input_253_cast_fp16)[name = tensor("op_4875_cast_fp16")]; tensor attn_output_85_transpose_x_0 = const()[name = tensor("attn_output_85_transpose_x_0"), val = tensor(false)]; tensor attn_output_85_transpose_y_0 = const()[name = tensor("attn_output_85_transpose_y_0"), val = tensor(false)]; tensor attn_output_85 = matmul(transpose_x = attn_output_85_transpose_x_0, transpose_y = attn_output_85_transpose_y_0, x = var_4875_cast_fp16, y = value_states_43)[name = tensor("attn_output_85")]; tensor var_4879_perm_0 = const()[name = tensor("op_4879_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_4881 = const()[name = tensor("op_4881"), val = tensor([1, 256, -1])]; tensor var_4879 = transpose(perm = var_4879_perm_0, x = attn_output_85)[name = tensor("transpose_48")]; tensor var_4882 = reshape(shape = var_4881, x = var_4879)[name = tensor("op_4882")]; tensor x_515 = linear(bias = linear_3_bias_0, weight = wrapped_model_language_model_layers_21_self_attn_o_proj_weight_palettized, x = var_4882)[name = tensor("linear_150")]; tensor var_22_promoted_129_to_fp16 = const()[name = tensor("op_22_promoted_129_to_fp16"), val = tensor(0x1p+1)]; tensor var_4888_cast_fp16 = pow(x = x_515, y = var_22_promoted_129_to_fp16)[name = tensor("op_4888_cast_fp16")]; tensor var_4890_axes_0 = const()[name = tensor("op_4890_axes_0"), val = tensor([-1])]; tensor var_4890_keep_dims_0 = const()[name = tensor("op_4890_keep_dims_0"), val = tensor(true)]; tensor var_4890_cast_fp16 = reduce_mean(axes = var_4890_axes_0, keep_dims = var_4890_keep_dims_0, x = var_4888_cast_fp16)[name = tensor("op_4890_cast_fp16")]; tensor var_4891_to_fp16 = const()[name = tensor("op_4891_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_4892_cast_fp16 = add(x = var_4890_cast_fp16, y = var_4891_to_fp16)[name = tensor("op_4892_cast_fp16")]; tensor var_4893_epsilon_0 = const()[name = tensor("op_4893_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_4893_cast_fp16 = rsqrt(epsilon = var_4893_epsilon_0, x = var_4892_cast_fp16)[name = tensor("op_4893_cast_fp16")]; tensor output_517_cast_fp16 = mul(x = x_515, y = var_4893_cast_fp16)[name = tensor("output_517_cast_fp16")]; tensor var_4897_to_fp16 = const()[name = tensor("op_4897_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940656256)))]; tensor output_519_cast_fp16 = mul(x = output_517_cast_fp16, y = var_4897_to_fp16)[name = tensor("output_519_cast_fp16")]; tensor x_519 = add(x = x_503, y = output_519_cast_fp16)[name = tensor("x_519")]; tensor var_22_promoted_130_to_fp16 = const()[name = tensor("op_22_promoted_130_to_fp16"), val = tensor(0x1p+1)]; tensor var_4903_cast_fp16 = pow(x = x_519, y = var_22_promoted_130_to_fp16)[name = tensor("op_4903_cast_fp16")]; tensor var_4905_axes_0 = const()[name = tensor("op_4905_axes_0"), val = tensor([-1])]; tensor var_4905_keep_dims_0 = const()[name = tensor("op_4905_keep_dims_0"), val = tensor(true)]; tensor var_4905_cast_fp16 = reduce_mean(axes = var_4905_axes_0, keep_dims = var_4905_keep_dims_0, x = var_4903_cast_fp16)[name = tensor("op_4905_cast_fp16")]; tensor var_4906_to_fp16 = const()[name = tensor("op_4906_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_4907_cast_fp16 = add(x = var_4905_cast_fp16, y = var_4906_to_fp16)[name = tensor("op_4907_cast_fp16")]; tensor var_4908_epsilon_0 = const()[name = tensor("op_4908_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_4908_cast_fp16 = rsqrt(epsilon = var_4908_epsilon_0, x = var_4907_cast_fp16)[name = tensor("op_4908_cast_fp16")]; tensor output_521_cast_fp16 = mul(x = x_519, y = var_4908_cast_fp16)[name = tensor("output_521_cast_fp16")]; tensor var_4912_to_fp16 = const()[name = tensor("op_4912_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940661440)))]; tensor output_523_cast_fp16 = mul(x = output_521_cast_fp16, y = var_4912_to_fp16)[name = tensor("output_523_cast_fp16")]; tensor input_261 = linear(bias = linear_4_bias_0, weight = wrapped_model_language_model_layers_21_mlp_gate_proj_weight_palettized, x = output_523_cast_fp16)[name = tensor("linear_151")]; tensor var_4920_mode_0 = const()[name = tensor("op_4920_mode_0"), val = tensor("TANH_APPROXIMATION")]; tensor var_4920 = gelu(mode = var_4920_mode_0, x = input_261)[name = tensor("op_4920")]; tensor var_4922 = linear(bias = linear_4_bias_0, weight = wrapped_model_language_model_layers_21_mlp_up_proj_weight_palettized, x = output_523_cast_fp16)[name = tensor("linear_152")]; tensor input_263 = mul(x = var_4920, y = var_4922)[name = tensor("input_263")]; tensor x_523 = linear(bias = linear_3_bias_0, weight = wrapped_model_language_model_layers_21_mlp_down_proj_weight_palettized, x = input_263)[name = tensor("linear_153")]; tensor var_22_promoted_131_to_fp16 = const()[name = tensor("op_22_promoted_131_to_fp16"), val = tensor(0x1p+1)]; tensor var_4928_cast_fp16 = pow(x = x_523, y = var_22_promoted_131_to_fp16)[name = tensor("op_4928_cast_fp16")]; tensor var_4930_axes_0 = const()[name = tensor("op_4930_axes_0"), val = tensor([-1])]; tensor var_4930_keep_dims_0 = const()[name = tensor("op_4930_keep_dims_0"), val = tensor(true)]; tensor var_4930_cast_fp16 = reduce_mean(axes = var_4930_axes_0, keep_dims = var_4930_keep_dims_0, x = var_4928_cast_fp16)[name = tensor("op_4930_cast_fp16")]; tensor var_4931_to_fp16 = const()[name = tensor("op_4931_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_4932_cast_fp16 = add(x = var_4930_cast_fp16, y = var_4931_to_fp16)[name = tensor("op_4932_cast_fp16")]; tensor var_4933_epsilon_0 = const()[name = tensor("op_4933_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_4933_cast_fp16 = rsqrt(epsilon = var_4933_epsilon_0, x = var_4932_cast_fp16)[name = tensor("op_4933_cast_fp16")]; tensor output_525_cast_fp16 = mul(x = x_523, y = var_4933_cast_fp16)[name = tensor("output_525_cast_fp16")]; tensor var_4937_to_fp16 = const()[name = tensor("op_4937_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940666624)))]; tensor output_527_cast_fp16 = mul(x = output_525_cast_fp16, y = var_4937_to_fp16)[name = tensor("output_527_cast_fp16")]; tensor x_527 = add(x = x_519, y = output_527_cast_fp16)[name = tensor("x_527")]; tensor var_22_promoted_132_to_fp16 = const()[name = tensor("op_22_promoted_132_to_fp16"), val = tensor(0x1p+1)]; tensor var_4949_cast_fp16 = pow(x = x_527, y = var_22_promoted_132_to_fp16)[name = tensor("op_4949_cast_fp16")]; tensor var_4951_axes_0 = const()[name = tensor("op_4951_axes_0"), val = tensor([-1])]; tensor var_4951_keep_dims_0 = const()[name = tensor("op_4951_keep_dims_0"), val = tensor(true)]; tensor var_4951_cast_fp16 = reduce_mean(axes = var_4951_axes_0, keep_dims = var_4951_keep_dims_0, x = var_4949_cast_fp16)[name = tensor("op_4951_cast_fp16")]; tensor var_4952_to_fp16 = const()[name = tensor("op_4952_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_4953_cast_fp16 = add(x = var_4951_cast_fp16, y = var_4952_to_fp16)[name = tensor("op_4953_cast_fp16")]; tensor var_4954_epsilon_0 = const()[name = tensor("op_4954_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_4954_cast_fp16 = rsqrt(epsilon = var_4954_epsilon_0, x = var_4953_cast_fp16)[name = tensor("op_4954_cast_fp16")]; tensor output_529_cast_fp16 = mul(x = x_527, y = var_4954_cast_fp16)[name = tensor("output_529_cast_fp16")]; tensor var_4958_to_fp16 = const()[name = tensor("op_4958_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940671808)))]; tensor output_531_cast_fp16 = mul(x = output_529_cast_fp16, y = var_4958_to_fp16)[name = tensor("output_531_cast_fp16")]; tensor var_4970 = linear(bias = linear_0_bias_0, weight = wrapped_model_language_model_layers_22_self_attn_q_proj_weight_palettized, x = output_531_cast_fp16)[name = tensor("linear_154")]; tensor var_4971 = const()[name = tensor("op_4971"), val = tensor([1, 256, -1, 256])]; tensor var_4972 = reshape(shape = var_4971, x = var_4970)[name = tensor("op_4972")]; tensor x_531_perm_0 = const()[name = tensor("x_531_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_4975 = linear(bias = linear_1_bias_0, weight = wrapped_model_language_model_layers_22_self_attn_k_proj_weight_palettized, x = output_531_cast_fp16)[name = tensor("linear_155")]; tensor var_4976 = const()[name = tensor("op_4976"), val = tensor([1, 256, -1, 256])]; tensor var_4977 = reshape(shape = var_4976, x = var_4975)[name = tensor("op_4977")]; tensor x_535_perm_0 = const()[name = tensor("x_535_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_4980 = linear(bias = linear_1_bias_0, weight = wrapped_model_language_model_layers_22_self_attn_v_proj_weight_palettized, x = output_531_cast_fp16)[name = tensor("linear_156")]; tensor var_4981 = const()[name = tensor("op_4981"), val = tensor([1, 256, -1, 256])]; tensor var_4982 = reshape(shape = var_4981, x = var_4980)[name = tensor("op_4982")]; tensor hidden_states_315_perm_0 = const()[name = tensor("hidden_states_315_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_22_promoted_133_to_fp16 = const()[name = tensor("op_22_promoted_133_to_fp16"), val = tensor(0x1p+1)]; tensor x_531 = transpose(perm = x_531_perm_0, x = var_4972)[name = tensor("transpose_47")]; tensor var_4986_cast_fp16 = pow(x = x_531, y = var_22_promoted_133_to_fp16)[name = tensor("op_4986_cast_fp16")]; tensor var_4988_axes_0 = const()[name = tensor("op_4988_axes_0"), val = tensor([-1])]; tensor var_4988_keep_dims_0 = const()[name = tensor("op_4988_keep_dims_0"), val = tensor(true)]; tensor var_4988_cast_fp16 = reduce_mean(axes = var_4988_axes_0, keep_dims = var_4988_keep_dims_0, x = var_4986_cast_fp16)[name = tensor("op_4988_cast_fp16")]; tensor var_4989_to_fp16 = const()[name = tensor("op_4989_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_4990_cast_fp16 = add(x = var_4988_cast_fp16, y = var_4989_to_fp16)[name = tensor("op_4990_cast_fp16")]; tensor var_4991_epsilon_0 = const()[name = tensor("op_4991_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_4991_cast_fp16 = rsqrt(epsilon = var_4991_epsilon_0, x = var_4990_cast_fp16)[name = tensor("op_4991_cast_fp16")]; tensor output_533_cast_fp16 = mul(x = x_531, y = var_4991_cast_fp16)[name = tensor("output_533_cast_fp16")]; tensor var_4995_to_fp16 = const()[name = tensor("op_4995_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940676992)))]; tensor output_535_cast_fp16 = mul(x = output_533_cast_fp16, y = var_4995_to_fp16)[name = tensor("output_535_cast_fp16")]; tensor var_22_promoted_134_to_fp16 = const()[name = tensor("op_22_promoted_134_to_fp16"), val = tensor(0x1p+1)]; tensor x_535 = transpose(perm = x_535_perm_0, x = var_4977)[name = tensor("transpose_46")]; tensor var_5000_cast_fp16 = pow(x = x_535, y = var_22_promoted_134_to_fp16)[name = tensor("op_5000_cast_fp16")]; tensor var_5002_axes_0 = const()[name = tensor("op_5002_axes_0"), val = tensor([-1])]; tensor var_5002_keep_dims_0 = const()[name = tensor("op_5002_keep_dims_0"), val = tensor(true)]; tensor var_5002_cast_fp16 = reduce_mean(axes = var_5002_axes_0, keep_dims = var_5002_keep_dims_0, x = var_5000_cast_fp16)[name = tensor("op_5002_cast_fp16")]; tensor var_5003_to_fp16 = const()[name = tensor("op_5003_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_5004_cast_fp16 = add(x = var_5002_cast_fp16, y = var_5003_to_fp16)[name = tensor("op_5004_cast_fp16")]; tensor var_5005_epsilon_0 = const()[name = tensor("op_5005_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_5005_cast_fp16 = rsqrt(epsilon = var_5005_epsilon_0, x = var_5004_cast_fp16)[name = tensor("op_5005_cast_fp16")]; tensor output_537_cast_fp16 = mul(x = x_535, y = var_5005_cast_fp16)[name = tensor("output_537_cast_fp16")]; tensor var_5009_to_fp16 = const()[name = tensor("op_5009_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940677568)))]; tensor output_539_cast_fp16 = mul(x = output_537_cast_fp16, y = var_5009_to_fp16)[name = tensor("output_539_cast_fp16")]; tensor var_5014 = mul(x = output_535_cast_fp16, y = cos_7_palettized)[name = tensor("op_5014")]; tensor x1_89_begin_0 = const()[name = tensor("x1_89_begin_0"), val = tensor([0, 0, 0, 0])]; tensor x1_89_end_0 = const()[name = tensor("x1_89_end_0"), val = tensor([1, 8, 256, 128])]; tensor x1_89_end_mask_0 = const()[name = tensor("x1_89_end_mask_0"), val = tensor([true, true, true, false])]; tensor x1_89 = slice_by_index(begin = x1_89_begin_0, end = x1_89_end_0, end_mask = x1_89_end_mask_0, x = output_535_cast_fp16)[name = tensor("x1_89")]; tensor x2_89_begin_0 = const()[name = tensor("x2_89_begin_0"), val = tensor([0, 0, 0, 128])]; tensor x2_89_end_0 = const()[name = tensor("x2_89_end_0"), val = tensor([1, 8, 256, 256])]; tensor x2_89_end_mask_0 = const()[name = tensor("x2_89_end_mask_0"), val = tensor([true, true, true, true])]; tensor x2_89 = slice_by_index(begin = x2_89_begin_0, end = x2_89_end_0, end_mask = x2_89_end_mask_0, x = output_535_cast_fp16)[name = tensor("x2_89")]; tensor const_541_promoted = const()[name = tensor("const_541_promoted"), val = tensor(-0x1p+0)]; tensor var_5025 = mul(x = x2_89, y = const_541_promoted)[name = tensor("op_5025")]; tensor var_5027_interleave_0 = const()[name = tensor("op_5027_interleave_0"), val = tensor(false)]; tensor var_5027 = concat(axis = var_24, interleave = var_5027_interleave_0, values = (var_5025, x1_89))[name = tensor("op_5027")]; tensor var_5028 = mul(x = var_5027, y = sin_7_palettized)[name = tensor("op_5028")]; tensor query_45 = add(x = var_5014, y = var_5028)[name = tensor("query_45")]; tensor var_5030 = mul(x = output_539_cast_fp16, y = cos_7_palettized)[name = tensor("op_5030")]; tensor x1_91_begin_0 = const()[name = tensor("x1_91_begin_0"), val = tensor([0, 0, 0, 0])]; tensor x1_91_end_0 = const()[name = tensor("x1_91_end_0"), val = tensor([1, 4, 256, 128])]; tensor x1_91_end_mask_0 = const()[name = tensor("x1_91_end_mask_0"), val = tensor([true, true, true, false])]; tensor x1_91 = slice_by_index(begin = x1_91_begin_0, end = x1_91_end_0, end_mask = x1_91_end_mask_0, x = output_539_cast_fp16)[name = tensor("x1_91")]; tensor x2_91_begin_0 = const()[name = tensor("x2_91_begin_0"), val = tensor([0, 0, 0, 128])]; tensor x2_91_end_0 = const()[name = tensor("x2_91_end_0"), val = tensor([1, 4, 256, 256])]; tensor x2_91_end_mask_0 = const()[name = tensor("x2_91_end_mask_0"), val = tensor([true, true, true, true])]; tensor x2_91 = slice_by_index(begin = x2_91_begin_0, end = x2_91_end_0, end_mask = x2_91_end_mask_0, x = output_539_cast_fp16)[name = tensor("x2_91")]; tensor const_544_promoted = const()[name = tensor("const_544_promoted"), val = tensor(-0x1p+0)]; tensor var_5041 = mul(x = x2_91, y = const_544_promoted)[name = tensor("op_5041")]; tensor var_5043_interleave_0 = const()[name = tensor("op_5043_interleave_0"), val = tensor(false)]; tensor var_5043 = concat(axis = var_24, interleave = var_5043_interleave_0, values = (var_5041, x1_91))[name = tensor("op_5043")]; tensor var_5044 = mul(x = var_5043, y = sin_7_palettized)[name = tensor("op_5044")]; tensor hidden_states_311 = add(x = var_5030, y = var_5044)[name = tensor("hidden_states_311")]; tensor var_5053_axes_0 = const()[name = tensor("op_5053_axes_0"), val = tensor([2])]; tensor var_5053 = expand_dims(axes = var_5053_axes_0, x = hidden_states_311)[name = tensor("op_5053")]; tensor hidden_states_313_reps_0 = const()[name = tensor("hidden_states_313_reps_0"), val = tensor([1, 1, 2, 1, 1])]; tensor hidden_states_313 = tile(reps = hidden_states_313_reps_0, x = var_5053)[name = tensor("hidden_states_313")]; tensor var_5061 = const()[name = tensor("op_5061"), val = tensor([1, 8, 256, 256])]; tensor key_states_45 = reshape(shape = var_5061, x = hidden_states_313)[name = tensor("key_states_45")]; tensor var_5070_axes_0 = const()[name = tensor("op_5070_axes_0"), val = tensor([2])]; tensor hidden_states_315 = transpose(perm = hidden_states_315_perm_0, x = var_4982)[name = tensor("transpose_45")]; tensor var_5070 = expand_dims(axes = var_5070_axes_0, x = hidden_states_315)[name = tensor("op_5070")]; tensor hidden_states_317_reps_0 = const()[name = tensor("hidden_states_317_reps_0"), val = tensor([1, 1, 2, 1, 1])]; tensor hidden_states_317 = tile(reps = hidden_states_317_reps_0, x = var_5070)[name = tensor("hidden_states_317")]; tensor var_5078 = const()[name = tensor("op_5078"), val = tensor([1, 8, 256, 256])]; tensor value_states_45 = reshape(shape = var_5078, x = hidden_states_317)[name = tensor("value_states_45")]; tensor var_5081_transpose_x_1 = const()[name = tensor("op_5081_transpose_x_1"), val = tensor(false)]; tensor var_5081_transpose_y_1 = const()[name = tensor("op_5081_transpose_y_1"), val = tensor(true)]; tensor var_5081 = matmul(transpose_x = var_5081_transpose_x_1, transpose_y = var_5081_transpose_y_1, x = query_45, y = key_states_45)[name = tensor("op_5081")]; tensor var_5082_to_fp16 = const()[name = tensor("op_5082_to_fp16"), val = tensor(0x1p-4)]; tensor attn_weights_89_cast_fp16 = mul(x = var_5081, y = var_5082_to_fp16)[name = tensor("attn_weights_89_cast_fp16")]; tensor input_265_cast_fp16 = add(x = attn_weights_89_cast_fp16, y = attention_mask_to_fp16_palettized)[name = tensor("input_265_cast_fp16")]; tensor var_5090_cast_fp16 = softmax(axis = var_24, x = input_265_cast_fp16)[name = tensor("op_5090_cast_fp16")]; tensor attn_output_89_transpose_x_0 = const()[name = tensor("attn_output_89_transpose_x_0"), val = tensor(false)]; tensor attn_output_89_transpose_y_0 = const()[name = tensor("attn_output_89_transpose_y_0"), val = tensor(false)]; tensor attn_output_89 = matmul(transpose_x = attn_output_89_transpose_x_0, transpose_y = attn_output_89_transpose_y_0, x = var_5090_cast_fp16, y = value_states_45)[name = tensor("attn_output_89")]; tensor var_5094_perm_0 = const()[name = tensor("op_5094_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_5096 = const()[name = tensor("op_5096"), val = tensor([1, 256, -1])]; tensor var_5094 = transpose(perm = var_5094_perm_0, x = attn_output_89)[name = tensor("transpose_44")]; tensor var_5097 = reshape(shape = var_5096, x = var_5094)[name = tensor("op_5097")]; tensor x_539 = linear(bias = linear_3_bias_0, weight = wrapped_model_language_model_layers_22_self_attn_o_proj_weight_palettized, x = var_5097)[name = tensor("linear_157")]; tensor var_22_promoted_135_to_fp16 = const()[name = tensor("op_22_promoted_135_to_fp16"), val = tensor(0x1p+1)]; tensor var_5103_cast_fp16 = pow(x = x_539, y = var_22_promoted_135_to_fp16)[name = tensor("op_5103_cast_fp16")]; tensor var_5105_axes_0 = const()[name = tensor("op_5105_axes_0"), val = tensor([-1])]; tensor var_5105_keep_dims_0 = const()[name = tensor("op_5105_keep_dims_0"), val = tensor(true)]; tensor var_5105_cast_fp16 = reduce_mean(axes = var_5105_axes_0, keep_dims = var_5105_keep_dims_0, x = var_5103_cast_fp16)[name = tensor("op_5105_cast_fp16")]; tensor var_5106_to_fp16 = const()[name = tensor("op_5106_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_5107_cast_fp16 = add(x = var_5105_cast_fp16, y = var_5106_to_fp16)[name = tensor("op_5107_cast_fp16")]; tensor var_5108_epsilon_0 = const()[name = tensor("op_5108_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_5108_cast_fp16 = rsqrt(epsilon = var_5108_epsilon_0, x = var_5107_cast_fp16)[name = tensor("op_5108_cast_fp16")]; tensor output_541_cast_fp16 = mul(x = x_539, y = var_5108_cast_fp16)[name = tensor("output_541_cast_fp16")]; tensor var_5112_to_fp16 = const()[name = tensor("op_5112_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940678144)))]; tensor output_543_cast_fp16 = mul(x = output_541_cast_fp16, y = var_5112_to_fp16)[name = tensor("output_543_cast_fp16")]; tensor x_543 = add(x = x_527, y = output_543_cast_fp16)[name = tensor("x_543")]; tensor var_22_promoted_136_to_fp16 = const()[name = tensor("op_22_promoted_136_to_fp16"), val = tensor(0x1p+1)]; tensor var_5118_cast_fp16 = pow(x = x_543, y = var_22_promoted_136_to_fp16)[name = tensor("op_5118_cast_fp16")]; tensor var_5120_axes_0 = const()[name = tensor("op_5120_axes_0"), val = tensor([-1])]; tensor var_5120_keep_dims_0 = const()[name = tensor("op_5120_keep_dims_0"), val = tensor(true)]; tensor var_5120_cast_fp16 = reduce_mean(axes = var_5120_axes_0, keep_dims = var_5120_keep_dims_0, x = var_5118_cast_fp16)[name = tensor("op_5120_cast_fp16")]; tensor var_5121_to_fp16 = const()[name = tensor("op_5121_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_5122_cast_fp16 = add(x = var_5120_cast_fp16, y = var_5121_to_fp16)[name = tensor("op_5122_cast_fp16")]; tensor var_5123_epsilon_0 = const()[name = tensor("op_5123_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_5123_cast_fp16 = rsqrt(epsilon = var_5123_epsilon_0, x = var_5122_cast_fp16)[name = tensor("op_5123_cast_fp16")]; tensor output_545_cast_fp16 = mul(x = x_543, y = var_5123_cast_fp16)[name = tensor("output_545_cast_fp16")]; tensor var_5127_to_fp16 = const()[name = tensor("op_5127_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940683328)))]; tensor output_547_cast_fp16 = mul(x = output_545_cast_fp16, y = var_5127_to_fp16)[name = tensor("output_547_cast_fp16")]; tensor input_273 = linear(bias = linear_4_bias_0, weight = wrapped_model_language_model_layers_22_mlp_gate_proj_weight_palettized, x = output_547_cast_fp16)[name = tensor("linear_158")]; tensor var_5135_mode_0 = const()[name = tensor("op_5135_mode_0"), val = tensor("TANH_APPROXIMATION")]; tensor var_5135 = gelu(mode = var_5135_mode_0, x = input_273)[name = tensor("op_5135")]; tensor var_5137 = linear(bias = linear_4_bias_0, weight = wrapped_model_language_model_layers_22_mlp_up_proj_weight_palettized, x = output_547_cast_fp16)[name = tensor("linear_159")]; tensor input_275 = mul(x = var_5135, y = var_5137)[name = tensor("input_275")]; tensor x_547 = linear(bias = linear_3_bias_0, weight = wrapped_model_language_model_layers_22_mlp_down_proj_weight_palettized, x = input_275)[name = tensor("linear_160")]; tensor var_22_promoted_137_to_fp16 = const()[name = tensor("op_22_promoted_137_to_fp16"), val = tensor(0x1p+1)]; tensor var_5143_cast_fp16 = pow(x = x_547, y = var_22_promoted_137_to_fp16)[name = tensor("op_5143_cast_fp16")]; tensor var_5145_axes_0 = const()[name = tensor("op_5145_axes_0"), val = tensor([-1])]; tensor var_5145_keep_dims_0 = const()[name = tensor("op_5145_keep_dims_0"), val = tensor(true)]; tensor var_5145_cast_fp16 = reduce_mean(axes = var_5145_axes_0, keep_dims = var_5145_keep_dims_0, x = var_5143_cast_fp16)[name = tensor("op_5145_cast_fp16")]; tensor var_5146_to_fp16 = const()[name = tensor("op_5146_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_5147_cast_fp16 = add(x = var_5145_cast_fp16, y = var_5146_to_fp16)[name = tensor("op_5147_cast_fp16")]; tensor var_5148_epsilon_0 = const()[name = tensor("op_5148_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_5148_cast_fp16 = rsqrt(epsilon = var_5148_epsilon_0, x = var_5147_cast_fp16)[name = tensor("op_5148_cast_fp16")]; tensor output_549_cast_fp16 = mul(x = x_547, y = var_5148_cast_fp16)[name = tensor("output_549_cast_fp16")]; tensor var_5152_to_fp16 = const()[name = tensor("op_5152_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940688512)))]; tensor output_551_cast_fp16 = mul(x = output_549_cast_fp16, y = var_5152_to_fp16)[name = tensor("output_551_cast_fp16")]; tensor x_551 = add(x = x_543, y = output_551_cast_fp16)[name = tensor("x_551")]; tensor var_22_promoted_138_to_fp16 = const()[name = tensor("op_22_promoted_138_to_fp16"), val = tensor(0x1p+1)]; tensor var_5164_cast_fp16 = pow(x = x_551, y = var_22_promoted_138_to_fp16)[name = tensor("op_5164_cast_fp16")]; tensor var_5166_axes_0 = const()[name = tensor("op_5166_axes_0"), val = tensor([-1])]; tensor var_5166_keep_dims_0 = const()[name = tensor("op_5166_keep_dims_0"), val = tensor(true)]; tensor var_5166_cast_fp16 = reduce_mean(axes = var_5166_axes_0, keep_dims = var_5166_keep_dims_0, x = var_5164_cast_fp16)[name = tensor("op_5166_cast_fp16")]; tensor var_5167_to_fp16 = const()[name = tensor("op_5167_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_5168_cast_fp16 = add(x = var_5166_cast_fp16, y = var_5167_to_fp16)[name = tensor("op_5168_cast_fp16")]; tensor var_5169_epsilon_0 = const()[name = tensor("op_5169_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_5169_cast_fp16 = rsqrt(epsilon = var_5169_epsilon_0, x = var_5168_cast_fp16)[name = tensor("op_5169_cast_fp16")]; tensor output_553_cast_fp16 = mul(x = x_551, y = var_5169_cast_fp16)[name = tensor("output_553_cast_fp16")]; tensor var_5173_to_fp16 = const()[name = tensor("op_5173_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940693696)))]; tensor output_555_cast_fp16 = mul(x = output_553_cast_fp16, y = var_5173_to_fp16)[name = tensor("output_555_cast_fp16")]; tensor var_5185 = linear(bias = linear_0_bias_0, weight = wrapped_model_language_model_layers_23_self_attn_q_proj_weight_palettized, x = output_555_cast_fp16)[name = tensor("linear_161")]; tensor var_5186 = const()[name = tensor("op_5186"), val = tensor([1, 256, -1, 256])]; tensor var_5187 = reshape(shape = var_5186, x = var_5185)[name = tensor("op_5187")]; tensor x_555_perm_0 = const()[name = tensor("x_555_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_5190 = linear(bias = linear_1_bias_0, weight = wrapped_model_language_model_layers_23_self_attn_k_proj_weight_palettized, x = output_555_cast_fp16)[name = tensor("linear_162")]; tensor var_5191 = const()[name = tensor("op_5191"), val = tensor([1, 256, -1, 256])]; tensor var_5192 = reshape(shape = var_5191, x = var_5190)[name = tensor("op_5192")]; tensor x_559_perm_0 = const()[name = tensor("x_559_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_5195 = linear(bias = linear_1_bias_0, weight = wrapped_model_language_model_layers_23_self_attn_v_proj_weight_palettized, x = output_555_cast_fp16)[name = tensor("linear_163")]; tensor var_5196 = const()[name = tensor("op_5196"), val = tensor([1, 256, -1, 256])]; tensor var_5197 = reshape(shape = var_5196, x = var_5195)[name = tensor("op_5197")]; tensor hidden_states_329_perm_0 = const()[name = tensor("hidden_states_329_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_22_promoted_139_to_fp16 = const()[name = tensor("op_22_promoted_139_to_fp16"), val = tensor(0x1p+1)]; tensor x_555 = transpose(perm = x_555_perm_0, x = var_5187)[name = tensor("transpose_43")]; tensor var_5201_cast_fp16 = pow(x = x_555, y = var_22_promoted_139_to_fp16)[name = tensor("op_5201_cast_fp16")]; tensor var_5203_axes_0 = const()[name = tensor("op_5203_axes_0"), val = tensor([-1])]; tensor var_5203_keep_dims_0 = const()[name = tensor("op_5203_keep_dims_0"), val = tensor(true)]; tensor var_5203_cast_fp16 = reduce_mean(axes = var_5203_axes_0, keep_dims = var_5203_keep_dims_0, x = var_5201_cast_fp16)[name = tensor("op_5203_cast_fp16")]; tensor var_5204_to_fp16 = const()[name = tensor("op_5204_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_5205_cast_fp16 = add(x = var_5203_cast_fp16, y = var_5204_to_fp16)[name = tensor("op_5205_cast_fp16")]; tensor var_5206_epsilon_0 = const()[name = tensor("op_5206_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_5206_cast_fp16 = rsqrt(epsilon = var_5206_epsilon_0, x = var_5205_cast_fp16)[name = tensor("op_5206_cast_fp16")]; tensor output_557_cast_fp16 = mul(x = x_555, y = var_5206_cast_fp16)[name = tensor("output_557_cast_fp16")]; tensor var_5210_to_fp16 = const()[name = tensor("op_5210_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940698880)))]; tensor output_559_cast_fp16 = mul(x = output_557_cast_fp16, y = var_5210_to_fp16)[name = tensor("output_559_cast_fp16")]; tensor var_22_promoted_140_to_fp16 = const()[name = tensor("op_22_promoted_140_to_fp16"), val = tensor(0x1p+1)]; tensor x_559 = transpose(perm = x_559_perm_0, x = var_5192)[name = tensor("transpose_42")]; tensor var_5215_cast_fp16 = pow(x = x_559, y = var_22_promoted_140_to_fp16)[name = tensor("op_5215_cast_fp16")]; tensor var_5217_axes_0 = const()[name = tensor("op_5217_axes_0"), val = tensor([-1])]; tensor var_5217_keep_dims_0 = const()[name = tensor("op_5217_keep_dims_0"), val = tensor(true)]; tensor var_5217_cast_fp16 = reduce_mean(axes = var_5217_axes_0, keep_dims = var_5217_keep_dims_0, x = var_5215_cast_fp16)[name = tensor("op_5217_cast_fp16")]; tensor var_5218_to_fp16 = const()[name = tensor("op_5218_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_5219_cast_fp16 = add(x = var_5217_cast_fp16, y = var_5218_to_fp16)[name = tensor("op_5219_cast_fp16")]; tensor var_5220_epsilon_0 = const()[name = tensor("op_5220_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_5220_cast_fp16 = rsqrt(epsilon = var_5220_epsilon_0, x = var_5219_cast_fp16)[name = tensor("op_5220_cast_fp16")]; tensor output_561_cast_fp16 = mul(x = x_559, y = var_5220_cast_fp16)[name = tensor("output_561_cast_fp16")]; tensor var_5224_to_fp16 = const()[name = tensor("op_5224_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940699456)))]; tensor output_563_cast_fp16 = mul(x = output_561_cast_fp16, y = var_5224_to_fp16)[name = tensor("output_563_cast_fp16")]; tensor var_5229 = mul(x = output_559_cast_fp16, y = cos_19_palettized)[name = tensor("op_5229")]; tensor x1_93_begin_0 = const()[name = tensor("x1_93_begin_0"), val = tensor([0, 0, 0, 0])]; tensor x1_93_end_0 = const()[name = tensor("x1_93_end_0"), val = tensor([1, 8, 256, 128])]; tensor x1_93_end_mask_0 = const()[name = tensor("x1_93_end_mask_0"), val = tensor([true, true, true, false])]; tensor x1_93 = slice_by_index(begin = x1_93_begin_0, end = x1_93_end_0, end_mask = x1_93_end_mask_0, x = output_559_cast_fp16)[name = tensor("x1_93")]; tensor x2_93_begin_0 = const()[name = tensor("x2_93_begin_0"), val = tensor([0, 0, 0, 128])]; tensor x2_93_end_0 = const()[name = tensor("x2_93_end_0"), val = tensor([1, 8, 256, 256])]; tensor x2_93_end_mask_0 = const()[name = tensor("x2_93_end_mask_0"), val = tensor([true, true, true, true])]; tensor x2_93 = slice_by_index(begin = x2_93_begin_0, end = x2_93_end_0, end_mask = x2_93_end_mask_0, x = output_559_cast_fp16)[name = tensor("x2_93")]; tensor const_564_promoted = const()[name = tensor("const_564_promoted"), val = tensor(-0x1p+0)]; tensor var_5240 = mul(x = x2_93, y = const_564_promoted)[name = tensor("op_5240")]; tensor var_5242_interleave_0 = const()[name = tensor("op_5242_interleave_0"), val = tensor(false)]; tensor var_5242 = concat(axis = var_24, interleave = var_5242_interleave_0, values = (var_5240, x1_93))[name = tensor("op_5242")]; tensor var_5243 = mul(x = var_5242, y = sin_19_palettized)[name = tensor("op_5243")]; tensor query_47 = add(x = var_5229, y = var_5243)[name = tensor("query_47")]; tensor var_5245 = mul(x = output_563_cast_fp16, y = cos_19_palettized)[name = tensor("op_5245")]; tensor x1_95_begin_0 = const()[name = tensor("x1_95_begin_0"), val = tensor([0, 0, 0, 0])]; tensor x1_95_end_0 = const()[name = tensor("x1_95_end_0"), val = tensor([1, 4, 256, 128])]; tensor x1_95_end_mask_0 = const()[name = tensor("x1_95_end_mask_0"), val = tensor([true, true, true, false])]; tensor x1_95 = slice_by_index(begin = x1_95_begin_0, end = x1_95_end_0, end_mask = x1_95_end_mask_0, x = output_563_cast_fp16)[name = tensor("x1_95")]; tensor x2_95_begin_0 = const()[name = tensor("x2_95_begin_0"), val = tensor([0, 0, 0, 128])]; tensor x2_95_end_0 = const()[name = tensor("x2_95_end_0"), val = tensor([1, 4, 256, 256])]; tensor x2_95_end_mask_0 = const()[name = tensor("x2_95_end_mask_0"), val = tensor([true, true, true, true])]; tensor x2_95 = slice_by_index(begin = x2_95_begin_0, end = x2_95_end_0, end_mask = x2_95_end_mask_0, x = output_563_cast_fp16)[name = tensor("x2_95")]; tensor const_567_promoted = const()[name = tensor("const_567_promoted"), val = tensor(-0x1p+0)]; tensor var_5256 = mul(x = x2_95, y = const_567_promoted)[name = tensor("op_5256")]; tensor var_5258_interleave_0 = const()[name = tensor("op_5258_interleave_0"), val = tensor(false)]; tensor var_5258 = concat(axis = var_24, interleave = var_5258_interleave_0, values = (var_5256, x1_95))[name = tensor("op_5258")]; tensor var_5259 = mul(x = var_5258, y = sin_19_palettized)[name = tensor("op_5259")]; tensor hidden_states_325 = add(x = var_5245, y = var_5259)[name = tensor("hidden_states_325")]; tensor var_5268_axes_0 = const()[name = tensor("op_5268_axes_0"), val = tensor([2])]; tensor var_5268 = expand_dims(axes = var_5268_axes_0, x = hidden_states_325)[name = tensor("op_5268")]; tensor hidden_states_327_reps_0 = const()[name = tensor("hidden_states_327_reps_0"), val = tensor([1, 1, 2, 1, 1])]; tensor hidden_states_327 = tile(reps = hidden_states_327_reps_0, x = var_5268)[name = tensor("hidden_states_327")]; tensor var_5276 = const()[name = tensor("op_5276"), val = tensor([1, 8, 256, 256])]; tensor key_states_47 = reshape(shape = var_5276, x = hidden_states_327)[name = tensor("key_states_47")]; tensor var_5285_axes_0 = const()[name = tensor("op_5285_axes_0"), val = tensor([2])]; tensor hidden_states_329 = transpose(perm = hidden_states_329_perm_0, x = var_5197)[name = tensor("transpose_41")]; tensor var_5285 = expand_dims(axes = var_5285_axes_0, x = hidden_states_329)[name = tensor("op_5285")]; tensor hidden_states_331_reps_0 = const()[name = tensor("hidden_states_331_reps_0"), val = tensor([1, 1, 2, 1, 1])]; tensor hidden_states_331 = tile(reps = hidden_states_331_reps_0, x = var_5285)[name = tensor("hidden_states_331")]; tensor var_5293 = const()[name = tensor("op_5293"), val = tensor([1, 8, 256, 256])]; tensor value_states_47 = reshape(shape = var_5293, x = hidden_states_331)[name = tensor("value_states_47")]; tensor var_5296_transpose_x_1 = const()[name = tensor("op_5296_transpose_x_1"), val = tensor(false)]; tensor var_5296_transpose_y_1 = const()[name = tensor("op_5296_transpose_y_1"), val = tensor(true)]; tensor var_5296 = matmul(transpose_x = var_5296_transpose_x_1, transpose_y = var_5296_transpose_y_1, x = query_47, y = key_states_47)[name = tensor("op_5296")]; tensor var_5297_to_fp16 = const()[name = tensor("op_5297_to_fp16"), val = tensor(0x1p-4)]; tensor attn_weights_93_cast_fp16 = mul(x = var_5296, y = var_5297_to_fp16)[name = tensor("attn_weights_93_cast_fp16")]; tensor input_277_cast_fp16 = add(x = attn_weights_93_cast_fp16, y = attention_mask_to_fp16_palettized)[name = tensor("input_277_cast_fp16")]; tensor var_5305_cast_fp16 = softmax(axis = var_24, x = input_277_cast_fp16)[name = tensor("op_5305_cast_fp16")]; tensor attn_output_93_transpose_x_0 = const()[name = tensor("attn_output_93_transpose_x_0"), val = tensor(false)]; tensor attn_output_93_transpose_y_0 = const()[name = tensor("attn_output_93_transpose_y_0"), val = tensor(false)]; tensor attn_output_93 = matmul(transpose_x = attn_output_93_transpose_x_0, transpose_y = attn_output_93_transpose_y_0, x = var_5305_cast_fp16, y = value_states_47)[name = tensor("attn_output_93")]; tensor var_5309_perm_0 = const()[name = tensor("op_5309_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_5311 = const()[name = tensor("op_5311"), val = tensor([1, 256, -1])]; tensor var_5309 = transpose(perm = var_5309_perm_0, x = attn_output_93)[name = tensor("transpose_40")]; tensor var_5312 = reshape(shape = var_5311, x = var_5309)[name = tensor("op_5312")]; tensor x_563 = linear(bias = linear_3_bias_0, weight = wrapped_model_language_model_layers_23_self_attn_o_proj_weight_palettized, x = var_5312)[name = tensor("linear_164")]; tensor var_22_promoted_141_to_fp16 = const()[name = tensor("op_22_promoted_141_to_fp16"), val = tensor(0x1p+1)]; tensor var_5318_cast_fp16 = pow(x = x_563, y = var_22_promoted_141_to_fp16)[name = tensor("op_5318_cast_fp16")]; tensor var_5320_axes_0 = const()[name = tensor("op_5320_axes_0"), val = tensor([-1])]; tensor var_5320_keep_dims_0 = const()[name = tensor("op_5320_keep_dims_0"), val = tensor(true)]; tensor var_5320_cast_fp16 = reduce_mean(axes = var_5320_axes_0, keep_dims = var_5320_keep_dims_0, x = var_5318_cast_fp16)[name = tensor("op_5320_cast_fp16")]; tensor var_5321_to_fp16 = const()[name = tensor("op_5321_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_5322_cast_fp16 = add(x = var_5320_cast_fp16, y = var_5321_to_fp16)[name = tensor("op_5322_cast_fp16")]; tensor var_5323_epsilon_0 = const()[name = tensor("op_5323_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_5323_cast_fp16 = rsqrt(epsilon = var_5323_epsilon_0, x = var_5322_cast_fp16)[name = tensor("op_5323_cast_fp16")]; tensor output_565_cast_fp16 = mul(x = x_563, y = var_5323_cast_fp16)[name = tensor("output_565_cast_fp16")]; tensor var_5327_to_fp16 = const()[name = tensor("op_5327_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940700032)))]; tensor output_567_cast_fp16 = mul(x = output_565_cast_fp16, y = var_5327_to_fp16)[name = tensor("output_567_cast_fp16")]; tensor x_567 = add(x = x_551, y = output_567_cast_fp16)[name = tensor("x_567")]; tensor var_22_promoted_142_to_fp16 = const()[name = tensor("op_22_promoted_142_to_fp16"), val = tensor(0x1p+1)]; tensor var_5333_cast_fp16 = pow(x = x_567, y = var_22_promoted_142_to_fp16)[name = tensor("op_5333_cast_fp16")]; tensor var_5335_axes_0 = const()[name = tensor("op_5335_axes_0"), val = tensor([-1])]; tensor var_5335_keep_dims_0 = const()[name = tensor("op_5335_keep_dims_0"), val = tensor(true)]; tensor var_5335_cast_fp16 = reduce_mean(axes = var_5335_axes_0, keep_dims = var_5335_keep_dims_0, x = var_5333_cast_fp16)[name = tensor("op_5335_cast_fp16")]; tensor var_5336_to_fp16 = const()[name = tensor("op_5336_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_5337_cast_fp16 = add(x = var_5335_cast_fp16, y = var_5336_to_fp16)[name = tensor("op_5337_cast_fp16")]; tensor var_5338_epsilon_0 = const()[name = tensor("op_5338_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_5338_cast_fp16 = rsqrt(epsilon = var_5338_epsilon_0, x = var_5337_cast_fp16)[name = tensor("op_5338_cast_fp16")]; tensor output_569_cast_fp16 = mul(x = x_567, y = var_5338_cast_fp16)[name = tensor("output_569_cast_fp16")]; tensor var_5342_to_fp16 = const()[name = tensor("op_5342_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940705216)))]; tensor output_571_cast_fp16 = mul(x = output_569_cast_fp16, y = var_5342_to_fp16)[name = tensor("output_571_cast_fp16")]; tensor input_285 = linear(bias = linear_4_bias_0, weight = wrapped_model_language_model_layers_23_mlp_gate_proj_weight_palettized, x = output_571_cast_fp16)[name = tensor("linear_165")]; tensor var_5350_mode_0 = const()[name = tensor("op_5350_mode_0"), val = tensor("TANH_APPROXIMATION")]; tensor var_5350 = gelu(mode = var_5350_mode_0, x = input_285)[name = tensor("op_5350")]; tensor var_5352 = linear(bias = linear_4_bias_0, weight = wrapped_model_language_model_layers_23_mlp_up_proj_weight_palettized, x = output_571_cast_fp16)[name = tensor("linear_166")]; tensor input_287 = mul(x = var_5350, y = var_5352)[name = tensor("input_287")]; tensor x_571 = linear(bias = linear_3_bias_0, weight = wrapped_model_language_model_layers_23_mlp_down_proj_weight_palettized, x = input_287)[name = tensor("linear_167")]; tensor var_22_promoted_143_to_fp16 = const()[name = tensor("op_22_promoted_143_to_fp16"), val = tensor(0x1p+1)]; tensor var_5358_cast_fp16 = pow(x = x_571, y = var_22_promoted_143_to_fp16)[name = tensor("op_5358_cast_fp16")]; tensor var_5360_axes_0 = const()[name = tensor("op_5360_axes_0"), val = tensor([-1])]; tensor var_5360_keep_dims_0 = const()[name = tensor("op_5360_keep_dims_0"), val = tensor(true)]; tensor var_5360_cast_fp16 = reduce_mean(axes = var_5360_axes_0, keep_dims = var_5360_keep_dims_0, x = var_5358_cast_fp16)[name = tensor("op_5360_cast_fp16")]; tensor var_5361_to_fp16 = const()[name = tensor("op_5361_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_5362_cast_fp16 = add(x = var_5360_cast_fp16, y = var_5361_to_fp16)[name = tensor("op_5362_cast_fp16")]; tensor var_5363_epsilon_0 = const()[name = tensor("op_5363_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_5363_cast_fp16 = rsqrt(epsilon = var_5363_epsilon_0, x = var_5362_cast_fp16)[name = tensor("op_5363_cast_fp16")]; tensor output_573_cast_fp16 = mul(x = x_571, y = var_5363_cast_fp16)[name = tensor("output_573_cast_fp16")]; tensor var_5367_to_fp16 = const()[name = tensor("op_5367_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940710400)))]; tensor output_575_cast_fp16 = mul(x = output_573_cast_fp16, y = var_5367_to_fp16)[name = tensor("output_575_cast_fp16")]; tensor x_575 = add(x = x_567, y = output_575_cast_fp16)[name = tensor("x_575")]; tensor var_22_promoted_144_to_fp16 = const()[name = tensor("op_22_promoted_144_to_fp16"), val = tensor(0x1p+1)]; tensor var_5379_cast_fp16 = pow(x = x_575, y = var_22_promoted_144_to_fp16)[name = tensor("op_5379_cast_fp16")]; tensor var_5381_axes_0 = const()[name = tensor("op_5381_axes_0"), val = tensor([-1])]; tensor var_5381_keep_dims_0 = const()[name = tensor("op_5381_keep_dims_0"), val = tensor(true)]; tensor var_5381_cast_fp16 = reduce_mean(axes = var_5381_axes_0, keep_dims = var_5381_keep_dims_0, x = var_5379_cast_fp16)[name = tensor("op_5381_cast_fp16")]; tensor var_5382_to_fp16 = const()[name = tensor("op_5382_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_5383_cast_fp16 = add(x = var_5381_cast_fp16, y = var_5382_to_fp16)[name = tensor("op_5383_cast_fp16")]; tensor var_5384_epsilon_0 = const()[name = tensor("op_5384_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_5384_cast_fp16 = rsqrt(epsilon = var_5384_epsilon_0, x = var_5383_cast_fp16)[name = tensor("op_5384_cast_fp16")]; tensor output_577_cast_fp16 = mul(x = x_575, y = var_5384_cast_fp16)[name = tensor("output_577_cast_fp16")]; tensor var_5388_to_fp16 = const()[name = tensor("op_5388_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940715584)))]; tensor output_579_cast_fp16 = mul(x = output_577_cast_fp16, y = var_5388_to_fp16)[name = tensor("output_579_cast_fp16")]; tensor var_5400 = linear(bias = linear_0_bias_0, weight = wrapped_model_language_model_layers_24_self_attn_q_proj_weight_palettized, x = output_579_cast_fp16)[name = tensor("linear_168")]; tensor var_5401 = const()[name = tensor("op_5401"), val = tensor([1, 256, -1, 256])]; tensor var_5402 = reshape(shape = var_5401, x = var_5400)[name = tensor("op_5402")]; tensor x_579_perm_0 = const()[name = tensor("x_579_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_5405 = linear(bias = linear_1_bias_0, weight = wrapped_model_language_model_layers_24_self_attn_k_proj_weight_palettized, x = output_579_cast_fp16)[name = tensor("linear_169")]; tensor var_5406 = const()[name = tensor("op_5406"), val = tensor([1, 256, -1, 256])]; tensor var_5407 = reshape(shape = var_5406, x = var_5405)[name = tensor("op_5407")]; tensor x_583_perm_0 = const()[name = tensor("x_583_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_5410 = linear(bias = linear_1_bias_0, weight = wrapped_model_language_model_layers_24_self_attn_v_proj_weight_palettized, x = output_579_cast_fp16)[name = tensor("linear_170")]; tensor var_5411 = const()[name = tensor("op_5411"), val = tensor([1, 256, -1, 256])]; tensor var_5412 = reshape(shape = var_5411, x = var_5410)[name = tensor("op_5412")]; tensor hidden_states_343_perm_0 = const()[name = tensor("hidden_states_343_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_22_promoted_145_to_fp16 = const()[name = tensor("op_22_promoted_145_to_fp16"), val = tensor(0x1p+1)]; tensor x_579 = transpose(perm = x_579_perm_0, x = var_5402)[name = tensor("transpose_39")]; tensor var_5416_cast_fp16 = pow(x = x_579, y = var_22_promoted_145_to_fp16)[name = tensor("op_5416_cast_fp16")]; tensor var_5418_axes_0 = const()[name = tensor("op_5418_axes_0"), val = tensor([-1])]; tensor var_5418_keep_dims_0 = const()[name = tensor("op_5418_keep_dims_0"), val = tensor(true)]; tensor var_5418_cast_fp16 = reduce_mean(axes = var_5418_axes_0, keep_dims = var_5418_keep_dims_0, x = var_5416_cast_fp16)[name = tensor("op_5418_cast_fp16")]; tensor var_5419_to_fp16 = const()[name = tensor("op_5419_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_5420_cast_fp16 = add(x = var_5418_cast_fp16, y = var_5419_to_fp16)[name = tensor("op_5420_cast_fp16")]; tensor var_5421_epsilon_0 = const()[name = tensor("op_5421_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_5421_cast_fp16 = rsqrt(epsilon = var_5421_epsilon_0, x = var_5420_cast_fp16)[name = tensor("op_5421_cast_fp16")]; tensor output_581_cast_fp16 = mul(x = x_579, y = var_5421_cast_fp16)[name = tensor("output_581_cast_fp16")]; tensor var_5425_to_fp16 = const()[name = tensor("op_5425_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940720768)))]; tensor output_583_cast_fp16 = mul(x = output_581_cast_fp16, y = var_5425_to_fp16)[name = tensor("output_583_cast_fp16")]; tensor var_22_promoted_146_to_fp16 = const()[name = tensor("op_22_promoted_146_to_fp16"), val = tensor(0x1p+1)]; tensor x_583 = transpose(perm = x_583_perm_0, x = var_5407)[name = tensor("transpose_38")]; tensor var_5430_cast_fp16 = pow(x = x_583, y = var_22_promoted_146_to_fp16)[name = tensor("op_5430_cast_fp16")]; tensor var_5432_axes_0 = const()[name = tensor("op_5432_axes_0"), val = tensor([-1])]; tensor var_5432_keep_dims_0 = const()[name = tensor("op_5432_keep_dims_0"), val = tensor(true)]; tensor var_5432_cast_fp16 = reduce_mean(axes = var_5432_axes_0, keep_dims = var_5432_keep_dims_0, x = var_5430_cast_fp16)[name = tensor("op_5432_cast_fp16")]; tensor var_5433_to_fp16 = const()[name = tensor("op_5433_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_5434_cast_fp16 = add(x = var_5432_cast_fp16, y = var_5433_to_fp16)[name = tensor("op_5434_cast_fp16")]; tensor var_5435_epsilon_0 = const()[name = tensor("op_5435_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_5435_cast_fp16 = rsqrt(epsilon = var_5435_epsilon_0, x = var_5434_cast_fp16)[name = tensor("op_5435_cast_fp16")]; tensor output_585_cast_fp16 = mul(x = x_583, y = var_5435_cast_fp16)[name = tensor("output_585_cast_fp16")]; tensor var_5439_to_fp16 = const()[name = tensor("op_5439_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940721344)))]; tensor output_587_cast_fp16 = mul(x = output_585_cast_fp16, y = var_5439_to_fp16)[name = tensor("output_587_cast_fp16")]; tensor var_5444 = mul(x = output_583_cast_fp16, y = cos_7_palettized)[name = tensor("op_5444")]; tensor x1_97_begin_0 = const()[name = tensor("x1_97_begin_0"), val = tensor([0, 0, 0, 0])]; tensor x1_97_end_0 = const()[name = tensor("x1_97_end_0"), val = tensor([1, 8, 256, 128])]; tensor x1_97_end_mask_0 = const()[name = tensor("x1_97_end_mask_0"), val = tensor([true, true, true, false])]; tensor x1_97 = slice_by_index(begin = x1_97_begin_0, end = x1_97_end_0, end_mask = x1_97_end_mask_0, x = output_583_cast_fp16)[name = tensor("x1_97")]; tensor x2_97_begin_0 = const()[name = tensor("x2_97_begin_0"), val = tensor([0, 0, 0, 128])]; tensor x2_97_end_0 = const()[name = tensor("x2_97_end_0"), val = tensor([1, 8, 256, 256])]; tensor x2_97_end_mask_0 = const()[name = tensor("x2_97_end_mask_0"), val = tensor([true, true, true, true])]; tensor x2_97 = slice_by_index(begin = x2_97_begin_0, end = x2_97_end_0, end_mask = x2_97_end_mask_0, x = output_583_cast_fp16)[name = tensor("x2_97")]; tensor const_587_promoted = const()[name = tensor("const_587_promoted"), val = tensor(-0x1p+0)]; tensor var_5455 = mul(x = x2_97, y = const_587_promoted)[name = tensor("op_5455")]; tensor var_5457_interleave_0 = const()[name = tensor("op_5457_interleave_0"), val = tensor(false)]; tensor var_5457 = concat(axis = var_24, interleave = var_5457_interleave_0, values = (var_5455, x1_97))[name = tensor("op_5457")]; tensor var_5458 = mul(x = var_5457, y = sin_7_palettized)[name = tensor("op_5458")]; tensor query_49 = add(x = var_5444, y = var_5458)[name = tensor("query_49")]; tensor var_5460 = mul(x = output_587_cast_fp16, y = cos_7_palettized)[name = tensor("op_5460")]; tensor x1_99_begin_0 = const()[name = tensor("x1_99_begin_0"), val = tensor([0, 0, 0, 0])]; tensor x1_99_end_0 = const()[name = tensor("x1_99_end_0"), val = tensor([1, 4, 256, 128])]; tensor x1_99_end_mask_0 = const()[name = tensor("x1_99_end_mask_0"), val = tensor([true, true, true, false])]; tensor x1_99 = slice_by_index(begin = x1_99_begin_0, end = x1_99_end_0, end_mask = x1_99_end_mask_0, x = output_587_cast_fp16)[name = tensor("x1_99")]; tensor x2_99_begin_0 = const()[name = tensor("x2_99_begin_0"), val = tensor([0, 0, 0, 128])]; tensor x2_99_end_0 = const()[name = tensor("x2_99_end_0"), val = tensor([1, 4, 256, 256])]; tensor x2_99_end_mask_0 = const()[name = tensor("x2_99_end_mask_0"), val = tensor([true, true, true, true])]; tensor x2_99 = slice_by_index(begin = x2_99_begin_0, end = x2_99_end_0, end_mask = x2_99_end_mask_0, x = output_587_cast_fp16)[name = tensor("x2_99")]; tensor const_590_promoted = const()[name = tensor("const_590_promoted"), val = tensor(-0x1p+0)]; tensor var_5471 = mul(x = x2_99, y = const_590_promoted)[name = tensor("op_5471")]; tensor var_5473_interleave_0 = const()[name = tensor("op_5473_interleave_0"), val = tensor(false)]; tensor var_5473 = concat(axis = var_24, interleave = var_5473_interleave_0, values = (var_5471, x1_99))[name = tensor("op_5473")]; tensor var_5474 = mul(x = var_5473, y = sin_7_palettized)[name = tensor("op_5474")]; tensor hidden_states_339 = add(x = var_5460, y = var_5474)[name = tensor("hidden_states_339")]; tensor var_5483_axes_0 = const()[name = tensor("op_5483_axes_0"), val = tensor([2])]; tensor var_5483 = expand_dims(axes = var_5483_axes_0, x = hidden_states_339)[name = tensor("op_5483")]; tensor hidden_states_341_reps_0 = const()[name = tensor("hidden_states_341_reps_0"), val = tensor([1, 1, 2, 1, 1])]; tensor hidden_states_341 = tile(reps = hidden_states_341_reps_0, x = var_5483)[name = tensor("hidden_states_341")]; tensor var_5491 = const()[name = tensor("op_5491"), val = tensor([1, 8, 256, 256])]; tensor key_states_49 = reshape(shape = var_5491, x = hidden_states_341)[name = tensor("key_states_49")]; tensor var_5500_axes_0 = const()[name = tensor("op_5500_axes_0"), val = tensor([2])]; tensor hidden_states_343 = transpose(perm = hidden_states_343_perm_0, x = var_5412)[name = tensor("transpose_37")]; tensor var_5500 = expand_dims(axes = var_5500_axes_0, x = hidden_states_343)[name = tensor("op_5500")]; tensor hidden_states_345_reps_0 = const()[name = tensor("hidden_states_345_reps_0"), val = tensor([1, 1, 2, 1, 1])]; tensor hidden_states_345 = tile(reps = hidden_states_345_reps_0, x = var_5500)[name = tensor("hidden_states_345")]; tensor var_5508 = const()[name = tensor("op_5508"), val = tensor([1, 8, 256, 256])]; tensor value_states_49 = reshape(shape = var_5508, x = hidden_states_345)[name = tensor("value_states_49")]; tensor var_5511_transpose_x_1 = const()[name = tensor("op_5511_transpose_x_1"), val = tensor(false)]; tensor var_5511_transpose_y_1 = const()[name = tensor("op_5511_transpose_y_1"), val = tensor(true)]; tensor var_5511 = matmul(transpose_x = var_5511_transpose_x_1, transpose_y = var_5511_transpose_y_1, x = query_49, y = key_states_49)[name = tensor("op_5511")]; tensor var_5512_to_fp16 = const()[name = tensor("op_5512_to_fp16"), val = tensor(0x1p-4)]; tensor attn_weights_97_cast_fp16 = mul(x = var_5511, y = var_5512_to_fp16)[name = tensor("attn_weights_97_cast_fp16")]; tensor input_289_cast_fp16 = add(x = attn_weights_97_cast_fp16, y = attention_mask_to_fp16_palettized)[name = tensor("input_289_cast_fp16")]; tensor var_5520_cast_fp16 = softmax(axis = var_24, x = input_289_cast_fp16)[name = tensor("op_5520_cast_fp16")]; tensor attn_output_97_transpose_x_0 = const()[name = tensor("attn_output_97_transpose_x_0"), val = tensor(false)]; tensor attn_output_97_transpose_y_0 = const()[name = tensor("attn_output_97_transpose_y_0"), val = tensor(false)]; tensor attn_output_97 = matmul(transpose_x = attn_output_97_transpose_x_0, transpose_y = attn_output_97_transpose_y_0, x = var_5520_cast_fp16, y = value_states_49)[name = tensor("attn_output_97")]; tensor var_5524_perm_0 = const()[name = tensor("op_5524_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_5526 = const()[name = tensor("op_5526"), val = tensor([1, 256, -1])]; tensor var_5524 = transpose(perm = var_5524_perm_0, x = attn_output_97)[name = tensor("transpose_36")]; tensor var_5527 = reshape(shape = var_5526, x = var_5524)[name = tensor("op_5527")]; tensor x_587 = linear(bias = linear_3_bias_0, weight = wrapped_model_language_model_layers_24_self_attn_o_proj_weight_palettized, x = var_5527)[name = tensor("linear_171")]; tensor var_22_promoted_147_to_fp16 = const()[name = tensor("op_22_promoted_147_to_fp16"), val = tensor(0x1p+1)]; tensor var_5533_cast_fp16 = pow(x = x_587, y = var_22_promoted_147_to_fp16)[name = tensor("op_5533_cast_fp16")]; tensor var_5535_axes_0 = const()[name = tensor("op_5535_axes_0"), val = tensor([-1])]; tensor var_5535_keep_dims_0 = const()[name = tensor("op_5535_keep_dims_0"), val = tensor(true)]; tensor var_5535_cast_fp16 = reduce_mean(axes = var_5535_axes_0, keep_dims = var_5535_keep_dims_0, x = var_5533_cast_fp16)[name = tensor("op_5535_cast_fp16")]; tensor var_5536_to_fp16 = const()[name = tensor("op_5536_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_5537_cast_fp16 = add(x = var_5535_cast_fp16, y = var_5536_to_fp16)[name = tensor("op_5537_cast_fp16")]; tensor var_5538_epsilon_0 = const()[name = tensor("op_5538_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_5538_cast_fp16 = rsqrt(epsilon = var_5538_epsilon_0, x = var_5537_cast_fp16)[name = tensor("op_5538_cast_fp16")]; tensor output_589_cast_fp16 = mul(x = x_587, y = var_5538_cast_fp16)[name = tensor("output_589_cast_fp16")]; tensor var_5542_to_fp16 = const()[name = tensor("op_5542_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940721920)))]; tensor output_591_cast_fp16 = mul(x = output_589_cast_fp16, y = var_5542_to_fp16)[name = tensor("output_591_cast_fp16")]; tensor x_591 = add(x = x_575, y = output_591_cast_fp16)[name = tensor("x_591")]; tensor var_22_promoted_148_to_fp16 = const()[name = tensor("op_22_promoted_148_to_fp16"), val = tensor(0x1p+1)]; tensor var_5548_cast_fp16 = pow(x = x_591, y = var_22_promoted_148_to_fp16)[name = tensor("op_5548_cast_fp16")]; tensor var_5550_axes_0 = const()[name = tensor("op_5550_axes_0"), val = tensor([-1])]; tensor var_5550_keep_dims_0 = const()[name = tensor("op_5550_keep_dims_0"), val = tensor(true)]; tensor var_5550_cast_fp16 = reduce_mean(axes = var_5550_axes_0, keep_dims = var_5550_keep_dims_0, x = var_5548_cast_fp16)[name = tensor("op_5550_cast_fp16")]; tensor var_5551_to_fp16 = const()[name = tensor("op_5551_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_5552_cast_fp16 = add(x = var_5550_cast_fp16, y = var_5551_to_fp16)[name = tensor("op_5552_cast_fp16")]; tensor var_5553_epsilon_0 = const()[name = tensor("op_5553_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_5553_cast_fp16 = rsqrt(epsilon = var_5553_epsilon_0, x = var_5552_cast_fp16)[name = tensor("op_5553_cast_fp16")]; tensor output_593_cast_fp16 = mul(x = x_591, y = var_5553_cast_fp16)[name = tensor("output_593_cast_fp16")]; tensor var_5557_to_fp16 = const()[name = tensor("op_5557_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940727104)))]; tensor output_595_cast_fp16 = mul(x = output_593_cast_fp16, y = var_5557_to_fp16)[name = tensor("output_595_cast_fp16")]; tensor input_297 = linear(bias = linear_4_bias_0, weight = wrapped_model_language_model_layers_24_mlp_gate_proj_weight_palettized, x = output_595_cast_fp16)[name = tensor("linear_172")]; tensor var_5565_mode_0 = const()[name = tensor("op_5565_mode_0"), val = tensor("TANH_APPROXIMATION")]; tensor var_5565 = gelu(mode = var_5565_mode_0, x = input_297)[name = tensor("op_5565")]; tensor var_5567 = linear(bias = linear_4_bias_0, weight = wrapped_model_language_model_layers_24_mlp_up_proj_weight_palettized, x = output_595_cast_fp16)[name = tensor("linear_173")]; tensor input_299 = mul(x = var_5565, y = var_5567)[name = tensor("input_299")]; tensor x_595 = linear(bias = linear_3_bias_0, weight = wrapped_model_language_model_layers_24_mlp_down_proj_weight_palettized, x = input_299)[name = tensor("linear_174")]; tensor var_22_promoted_149_to_fp16 = const()[name = tensor("op_22_promoted_149_to_fp16"), val = tensor(0x1p+1)]; tensor var_5573_cast_fp16 = pow(x = x_595, y = var_22_promoted_149_to_fp16)[name = tensor("op_5573_cast_fp16")]; tensor var_5575_axes_0 = const()[name = tensor("op_5575_axes_0"), val = tensor([-1])]; tensor var_5575_keep_dims_0 = const()[name = tensor("op_5575_keep_dims_0"), val = tensor(true)]; tensor var_5575_cast_fp16 = reduce_mean(axes = var_5575_axes_0, keep_dims = var_5575_keep_dims_0, x = var_5573_cast_fp16)[name = tensor("op_5575_cast_fp16")]; tensor var_5576_to_fp16 = const()[name = tensor("op_5576_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_5577_cast_fp16 = add(x = var_5575_cast_fp16, y = var_5576_to_fp16)[name = tensor("op_5577_cast_fp16")]; tensor var_5578_epsilon_0 = const()[name = tensor("op_5578_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_5578_cast_fp16 = rsqrt(epsilon = var_5578_epsilon_0, x = var_5577_cast_fp16)[name = tensor("op_5578_cast_fp16")]; tensor output_597_cast_fp16 = mul(x = x_595, y = var_5578_cast_fp16)[name = tensor("output_597_cast_fp16")]; tensor var_5582_to_fp16 = const()[name = tensor("op_5582_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940732288)))]; tensor output_599_cast_fp16 = mul(x = output_597_cast_fp16, y = var_5582_to_fp16)[name = tensor("output_599_cast_fp16")]; tensor x_599 = add(x = x_591, y = output_599_cast_fp16)[name = tensor("x_599")]; tensor var_22_promoted_150_to_fp16 = const()[name = tensor("op_22_promoted_150_to_fp16"), val = tensor(0x1p+1)]; tensor var_5594_cast_fp16 = pow(x = x_599, y = var_22_promoted_150_to_fp16)[name = tensor("op_5594_cast_fp16")]; tensor var_5596_axes_0 = const()[name = tensor("op_5596_axes_0"), val = tensor([-1])]; tensor var_5596_keep_dims_0 = const()[name = tensor("op_5596_keep_dims_0"), val = tensor(true)]; tensor var_5596_cast_fp16 = reduce_mean(axes = var_5596_axes_0, keep_dims = var_5596_keep_dims_0, x = var_5594_cast_fp16)[name = tensor("op_5596_cast_fp16")]; tensor var_5597_to_fp16 = const()[name = tensor("op_5597_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_5598_cast_fp16 = add(x = var_5596_cast_fp16, y = var_5597_to_fp16)[name = tensor("op_5598_cast_fp16")]; tensor var_5599_epsilon_0 = const()[name = tensor("op_5599_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_5599_cast_fp16 = rsqrt(epsilon = var_5599_epsilon_0, x = var_5598_cast_fp16)[name = tensor("op_5599_cast_fp16")]; tensor output_601_cast_fp16 = mul(x = x_599, y = var_5599_cast_fp16)[name = tensor("output_601_cast_fp16")]; tensor var_5603_to_fp16 = const()[name = tensor("op_5603_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940737472)))]; tensor output_603_cast_fp16 = mul(x = output_601_cast_fp16, y = var_5603_to_fp16)[name = tensor("output_603_cast_fp16")]; tensor var_5615 = linear(bias = linear_0_bias_0, weight = wrapped_model_language_model_layers_25_self_attn_q_proj_weight_palettized, x = output_603_cast_fp16)[name = tensor("linear_175")]; tensor var_5616 = const()[name = tensor("op_5616"), val = tensor([1, 256, -1, 256])]; tensor var_5617 = reshape(shape = var_5616, x = var_5615)[name = tensor("op_5617")]; tensor x_603_perm_0 = const()[name = tensor("x_603_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_5620 = linear(bias = linear_1_bias_0, weight = wrapped_model_language_model_layers_25_self_attn_k_proj_weight_palettized, x = output_603_cast_fp16)[name = tensor("linear_176")]; tensor var_5621 = const()[name = tensor("op_5621"), val = tensor([1, 256, -1, 256])]; tensor var_5622 = reshape(shape = var_5621, x = var_5620)[name = tensor("op_5622")]; tensor x_607_perm_0 = const()[name = tensor("x_607_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_5625 = linear(bias = linear_1_bias_0, weight = wrapped_model_language_model_layers_25_self_attn_v_proj_weight_palettized, x = output_603_cast_fp16)[name = tensor("linear_177")]; tensor var_5626 = const()[name = tensor("op_5626"), val = tensor([1, 256, -1, 256])]; tensor var_5627 = reshape(shape = var_5626, x = var_5625)[name = tensor("op_5627")]; tensor hidden_states_357_perm_0 = const()[name = tensor("hidden_states_357_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_22_promoted_151_to_fp16 = const()[name = tensor("op_22_promoted_151_to_fp16"), val = tensor(0x1p+1)]; tensor x_603 = transpose(perm = x_603_perm_0, x = var_5617)[name = tensor("transpose_35")]; tensor var_5631_cast_fp16 = pow(x = x_603, y = var_22_promoted_151_to_fp16)[name = tensor("op_5631_cast_fp16")]; tensor var_5633_axes_0 = const()[name = tensor("op_5633_axes_0"), val = tensor([-1])]; tensor var_5633_keep_dims_0 = const()[name = tensor("op_5633_keep_dims_0"), val = tensor(true)]; tensor var_5633_cast_fp16 = reduce_mean(axes = var_5633_axes_0, keep_dims = var_5633_keep_dims_0, x = var_5631_cast_fp16)[name = tensor("op_5633_cast_fp16")]; tensor var_5634_to_fp16 = const()[name = tensor("op_5634_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_5635_cast_fp16 = add(x = var_5633_cast_fp16, y = var_5634_to_fp16)[name = tensor("op_5635_cast_fp16")]; tensor var_5636_epsilon_0 = const()[name = tensor("op_5636_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_5636_cast_fp16 = rsqrt(epsilon = var_5636_epsilon_0, x = var_5635_cast_fp16)[name = tensor("op_5636_cast_fp16")]; tensor output_605_cast_fp16 = mul(x = x_603, y = var_5636_cast_fp16)[name = tensor("output_605_cast_fp16")]; tensor var_5640_to_fp16 = const()[name = tensor("op_5640_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940742656)))]; tensor output_607_cast_fp16 = mul(x = output_605_cast_fp16, y = var_5640_to_fp16)[name = tensor("output_607_cast_fp16")]; tensor var_22_promoted_152_to_fp16 = const()[name = tensor("op_22_promoted_152_to_fp16"), val = tensor(0x1p+1)]; tensor x_607 = transpose(perm = x_607_perm_0, x = var_5622)[name = tensor("transpose_34")]; tensor var_5645_cast_fp16 = pow(x = x_607, y = var_22_promoted_152_to_fp16)[name = tensor("op_5645_cast_fp16")]; tensor var_5647_axes_0 = const()[name = tensor("op_5647_axes_0"), val = tensor([-1])]; tensor var_5647_keep_dims_0 = const()[name = tensor("op_5647_keep_dims_0"), val = tensor(true)]; tensor var_5647_cast_fp16 = reduce_mean(axes = var_5647_axes_0, keep_dims = var_5647_keep_dims_0, x = var_5645_cast_fp16)[name = tensor("op_5647_cast_fp16")]; tensor var_5648_to_fp16 = const()[name = tensor("op_5648_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_5649_cast_fp16 = add(x = var_5647_cast_fp16, y = var_5648_to_fp16)[name = tensor("op_5649_cast_fp16")]; tensor var_5650_epsilon_0 = const()[name = tensor("op_5650_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_5650_cast_fp16 = rsqrt(epsilon = var_5650_epsilon_0, x = var_5649_cast_fp16)[name = tensor("op_5650_cast_fp16")]; tensor output_609_cast_fp16 = mul(x = x_607, y = var_5650_cast_fp16)[name = tensor("output_609_cast_fp16")]; tensor var_5654_to_fp16 = const()[name = tensor("op_5654_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940743232)))]; tensor output_611_cast_fp16 = mul(x = output_609_cast_fp16, y = var_5654_to_fp16)[name = tensor("output_611_cast_fp16")]; tensor var_5659 = mul(x = output_607_cast_fp16, y = cos_7_palettized)[name = tensor("op_5659")]; tensor x1_101_begin_0 = const()[name = tensor("x1_101_begin_0"), val = tensor([0, 0, 0, 0])]; tensor x1_101_end_0 = const()[name = tensor("x1_101_end_0"), val = tensor([1, 8, 256, 128])]; tensor x1_101_end_mask_0 = const()[name = tensor("x1_101_end_mask_0"), val = tensor([true, true, true, false])]; tensor x1_101 = slice_by_index(begin = x1_101_begin_0, end = x1_101_end_0, end_mask = x1_101_end_mask_0, x = output_607_cast_fp16)[name = tensor("x1_101")]; tensor x2_101_begin_0 = const()[name = tensor("x2_101_begin_0"), val = tensor([0, 0, 0, 128])]; tensor x2_101_end_0 = const()[name = tensor("x2_101_end_0"), val = tensor([1, 8, 256, 256])]; tensor x2_101_end_mask_0 = const()[name = tensor("x2_101_end_mask_0"), val = tensor([true, true, true, true])]; tensor x2_101 = slice_by_index(begin = x2_101_begin_0, end = x2_101_end_0, end_mask = x2_101_end_mask_0, x = output_607_cast_fp16)[name = tensor("x2_101")]; tensor const_610_promoted = const()[name = tensor("const_610_promoted"), val = tensor(-0x1p+0)]; tensor var_5670 = mul(x = x2_101, y = const_610_promoted)[name = tensor("op_5670")]; tensor var_5672_interleave_0 = const()[name = tensor("op_5672_interleave_0"), val = tensor(false)]; tensor var_5672 = concat(axis = var_24, interleave = var_5672_interleave_0, values = (var_5670, x1_101))[name = tensor("op_5672")]; tensor var_5673 = mul(x = var_5672, y = sin_7_palettized)[name = tensor("op_5673")]; tensor query_51 = add(x = var_5659, y = var_5673)[name = tensor("query_51")]; tensor var_5675 = mul(x = output_611_cast_fp16, y = cos_7_palettized)[name = tensor("op_5675")]; tensor x1_103_begin_0 = const()[name = tensor("x1_103_begin_0"), val = tensor([0, 0, 0, 0])]; tensor x1_103_end_0 = const()[name = tensor("x1_103_end_0"), val = tensor([1, 4, 256, 128])]; tensor x1_103_end_mask_0 = const()[name = tensor("x1_103_end_mask_0"), val = tensor([true, true, true, false])]; tensor x1_103 = slice_by_index(begin = x1_103_begin_0, end = x1_103_end_0, end_mask = x1_103_end_mask_0, x = output_611_cast_fp16)[name = tensor("x1_103")]; tensor x2_103_begin_0 = const()[name = tensor("x2_103_begin_0"), val = tensor([0, 0, 0, 128])]; tensor x2_103_end_0 = const()[name = tensor("x2_103_end_0"), val = tensor([1, 4, 256, 256])]; tensor x2_103_end_mask_0 = const()[name = tensor("x2_103_end_mask_0"), val = tensor([true, true, true, true])]; tensor x2_103 = slice_by_index(begin = x2_103_begin_0, end = x2_103_end_0, end_mask = x2_103_end_mask_0, x = output_611_cast_fp16)[name = tensor("x2_103")]; tensor const_613_promoted = const()[name = tensor("const_613_promoted"), val = tensor(-0x1p+0)]; tensor var_5686 = mul(x = x2_103, y = const_613_promoted)[name = tensor("op_5686")]; tensor var_5688_interleave_0 = const()[name = tensor("op_5688_interleave_0"), val = tensor(false)]; tensor var_5688 = concat(axis = var_24, interleave = var_5688_interleave_0, values = (var_5686, x1_103))[name = tensor("op_5688")]; tensor var_5689 = mul(x = var_5688, y = sin_7_palettized)[name = tensor("op_5689")]; tensor hidden_states_353 = add(x = var_5675, y = var_5689)[name = tensor("hidden_states_353")]; tensor var_5698_axes_0 = const()[name = tensor("op_5698_axes_0"), val = tensor([2])]; tensor var_5698 = expand_dims(axes = var_5698_axes_0, x = hidden_states_353)[name = tensor("op_5698")]; tensor hidden_states_355_reps_0 = const()[name = tensor("hidden_states_355_reps_0"), val = tensor([1, 1, 2, 1, 1])]; tensor hidden_states_355 = tile(reps = hidden_states_355_reps_0, x = var_5698)[name = tensor("hidden_states_355")]; tensor var_5706 = const()[name = tensor("op_5706"), val = tensor([1, 8, 256, 256])]; tensor key_states_51 = reshape(shape = var_5706, x = hidden_states_355)[name = tensor("key_states_51")]; tensor var_5715_axes_0 = const()[name = tensor("op_5715_axes_0"), val = tensor([2])]; tensor hidden_states_357 = transpose(perm = hidden_states_357_perm_0, x = var_5627)[name = tensor("transpose_33")]; tensor var_5715 = expand_dims(axes = var_5715_axes_0, x = hidden_states_357)[name = tensor("op_5715")]; tensor hidden_states_359_reps_0 = const()[name = tensor("hidden_states_359_reps_0"), val = tensor([1, 1, 2, 1, 1])]; tensor hidden_states_359 = tile(reps = hidden_states_359_reps_0, x = var_5715)[name = tensor("hidden_states_359")]; tensor var_5723 = const()[name = tensor("op_5723"), val = tensor([1, 8, 256, 256])]; tensor value_states_51 = reshape(shape = var_5723, x = hidden_states_359)[name = tensor("value_states_51")]; tensor var_5726_transpose_x_1 = const()[name = tensor("op_5726_transpose_x_1"), val = tensor(false)]; tensor var_5726_transpose_y_1 = const()[name = tensor("op_5726_transpose_y_1"), val = tensor(true)]; tensor var_5726 = matmul(transpose_x = var_5726_transpose_x_1, transpose_y = var_5726_transpose_y_1, x = query_51, y = key_states_51)[name = tensor("op_5726")]; tensor var_5727_to_fp16 = const()[name = tensor("op_5727_to_fp16"), val = tensor(0x1p-4)]; tensor attn_weights_101_cast_fp16 = mul(x = var_5726, y = var_5727_to_fp16)[name = tensor("attn_weights_101_cast_fp16")]; tensor input_301_cast_fp16 = add(x = attn_weights_101_cast_fp16, y = attention_mask_to_fp16_palettized)[name = tensor("input_301_cast_fp16")]; tensor var_5735_cast_fp16 = softmax(axis = var_24, x = input_301_cast_fp16)[name = tensor("op_5735_cast_fp16")]; tensor attn_output_101_transpose_x_0 = const()[name = tensor("attn_output_101_transpose_x_0"), val = tensor(false)]; tensor attn_output_101_transpose_y_0 = const()[name = tensor("attn_output_101_transpose_y_0"), val = tensor(false)]; tensor attn_output_101 = matmul(transpose_x = attn_output_101_transpose_x_0, transpose_y = attn_output_101_transpose_y_0, x = var_5735_cast_fp16, y = value_states_51)[name = tensor("attn_output_101")]; tensor var_5739_perm_0 = const()[name = tensor("op_5739_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_5741 = const()[name = tensor("op_5741"), val = tensor([1, 256, -1])]; tensor var_5739 = transpose(perm = var_5739_perm_0, x = attn_output_101)[name = tensor("transpose_32")]; tensor var_5742 = reshape(shape = var_5741, x = var_5739)[name = tensor("op_5742")]; tensor x_611 = linear(bias = linear_3_bias_0, weight = wrapped_model_language_model_layers_25_self_attn_o_proj_weight_palettized, x = var_5742)[name = tensor("linear_178")]; tensor var_22_promoted_153_to_fp16 = const()[name = tensor("op_22_promoted_153_to_fp16"), val = tensor(0x1p+1)]; tensor var_5748_cast_fp16 = pow(x = x_611, y = var_22_promoted_153_to_fp16)[name = tensor("op_5748_cast_fp16")]; tensor var_5750_axes_0 = const()[name = tensor("op_5750_axes_0"), val = tensor([-1])]; tensor var_5750_keep_dims_0 = const()[name = tensor("op_5750_keep_dims_0"), val = tensor(true)]; tensor var_5750_cast_fp16 = reduce_mean(axes = var_5750_axes_0, keep_dims = var_5750_keep_dims_0, x = var_5748_cast_fp16)[name = tensor("op_5750_cast_fp16")]; tensor var_5751_to_fp16 = const()[name = tensor("op_5751_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_5752_cast_fp16 = add(x = var_5750_cast_fp16, y = var_5751_to_fp16)[name = tensor("op_5752_cast_fp16")]; tensor var_5753_epsilon_0 = const()[name = tensor("op_5753_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_5753_cast_fp16 = rsqrt(epsilon = var_5753_epsilon_0, x = var_5752_cast_fp16)[name = tensor("op_5753_cast_fp16")]; tensor output_613_cast_fp16 = mul(x = x_611, y = var_5753_cast_fp16)[name = tensor("output_613_cast_fp16")]; tensor var_5757_to_fp16 = const()[name = tensor("op_5757_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940743808)))]; tensor output_615_cast_fp16 = mul(x = output_613_cast_fp16, y = var_5757_to_fp16)[name = tensor("output_615_cast_fp16")]; tensor x_615 = add(x = x_599, y = output_615_cast_fp16)[name = tensor("x_615")]; tensor var_22_promoted_154_to_fp16 = const()[name = tensor("op_22_promoted_154_to_fp16"), val = tensor(0x1p+1)]; tensor var_5763_cast_fp16 = pow(x = x_615, y = var_22_promoted_154_to_fp16)[name = tensor("op_5763_cast_fp16")]; tensor var_5765_axes_0 = const()[name = tensor("op_5765_axes_0"), val = tensor([-1])]; tensor var_5765_keep_dims_0 = const()[name = tensor("op_5765_keep_dims_0"), val = tensor(true)]; tensor var_5765_cast_fp16 = reduce_mean(axes = var_5765_axes_0, keep_dims = var_5765_keep_dims_0, x = var_5763_cast_fp16)[name = tensor("op_5765_cast_fp16")]; tensor var_5766_to_fp16 = const()[name = tensor("op_5766_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_5767_cast_fp16 = add(x = var_5765_cast_fp16, y = var_5766_to_fp16)[name = tensor("op_5767_cast_fp16")]; tensor var_5768_epsilon_0 = const()[name = tensor("op_5768_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_5768_cast_fp16 = rsqrt(epsilon = var_5768_epsilon_0, x = var_5767_cast_fp16)[name = tensor("op_5768_cast_fp16")]; tensor output_617_cast_fp16 = mul(x = x_615, y = var_5768_cast_fp16)[name = tensor("output_617_cast_fp16")]; tensor var_5772_to_fp16 = const()[name = tensor("op_5772_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940748992)))]; tensor output_619_cast_fp16 = mul(x = output_617_cast_fp16, y = var_5772_to_fp16)[name = tensor("output_619_cast_fp16")]; tensor input_309 = linear(bias = linear_4_bias_0, weight = wrapped_model_language_model_layers_25_mlp_gate_proj_weight_palettized, x = output_619_cast_fp16)[name = tensor("linear_179")]; tensor var_5780_mode_0 = const()[name = tensor("op_5780_mode_0"), val = tensor("TANH_APPROXIMATION")]; tensor var_5780 = gelu(mode = var_5780_mode_0, x = input_309)[name = tensor("op_5780")]; tensor var_5782 = linear(bias = linear_4_bias_0, weight = wrapped_model_language_model_layers_25_mlp_up_proj_weight_palettized, x = output_619_cast_fp16)[name = tensor("linear_180")]; tensor input_311 = mul(x = var_5780, y = var_5782)[name = tensor("input_311")]; tensor x_619 = linear(bias = linear_3_bias_0, weight = wrapped_model_language_model_layers_25_mlp_down_proj_weight_palettized, x = input_311)[name = tensor("linear_181")]; tensor var_22_promoted_155_to_fp16 = const()[name = tensor("op_22_promoted_155_to_fp16"), val = tensor(0x1p+1)]; tensor var_5788_cast_fp16 = pow(x = x_619, y = var_22_promoted_155_to_fp16)[name = tensor("op_5788_cast_fp16")]; tensor var_5790_axes_0 = const()[name = tensor("op_5790_axes_0"), val = tensor([-1])]; tensor var_5790_keep_dims_0 = const()[name = tensor("op_5790_keep_dims_0"), val = tensor(true)]; tensor var_5790_cast_fp16 = reduce_mean(axes = var_5790_axes_0, keep_dims = var_5790_keep_dims_0, x = var_5788_cast_fp16)[name = tensor("op_5790_cast_fp16")]; tensor var_5791_to_fp16 = const()[name = tensor("op_5791_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_5792_cast_fp16 = add(x = var_5790_cast_fp16, y = var_5791_to_fp16)[name = tensor("op_5792_cast_fp16")]; tensor var_5793_epsilon_0 = const()[name = tensor("op_5793_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_5793_cast_fp16 = rsqrt(epsilon = var_5793_epsilon_0, x = var_5792_cast_fp16)[name = tensor("op_5793_cast_fp16")]; tensor output_621_cast_fp16 = mul(x = x_619, y = var_5793_cast_fp16)[name = tensor("output_621_cast_fp16")]; tensor var_5797_to_fp16 = const()[name = tensor("op_5797_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940754176)))]; tensor output_623_cast_fp16 = mul(x = output_621_cast_fp16, y = var_5797_to_fp16)[name = tensor("output_623_cast_fp16")]; tensor x_623 = add(x = x_615, y = output_623_cast_fp16)[name = tensor("x_623")]; tensor var_22_promoted_156_to_fp16 = const()[name = tensor("op_22_promoted_156_to_fp16"), val = tensor(0x1p+1)]; tensor var_5809_cast_fp16 = pow(x = x_623, y = var_22_promoted_156_to_fp16)[name = tensor("op_5809_cast_fp16")]; tensor var_5811_axes_0 = const()[name = tensor("op_5811_axes_0"), val = tensor([-1])]; tensor var_5811_keep_dims_0 = const()[name = tensor("op_5811_keep_dims_0"), val = tensor(true)]; tensor var_5811_cast_fp16 = reduce_mean(axes = var_5811_axes_0, keep_dims = var_5811_keep_dims_0, x = var_5809_cast_fp16)[name = tensor("op_5811_cast_fp16")]; tensor var_5812_to_fp16 = const()[name = tensor("op_5812_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_5813_cast_fp16 = add(x = var_5811_cast_fp16, y = var_5812_to_fp16)[name = tensor("op_5813_cast_fp16")]; tensor var_5814_epsilon_0 = const()[name = tensor("op_5814_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_5814_cast_fp16 = rsqrt(epsilon = var_5814_epsilon_0, x = var_5813_cast_fp16)[name = tensor("op_5814_cast_fp16")]; tensor output_625_cast_fp16 = mul(x = x_623, y = var_5814_cast_fp16)[name = tensor("output_625_cast_fp16")]; tensor var_5818_to_fp16 = const()[name = tensor("op_5818_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940759360)))]; tensor output_627_cast_fp16 = mul(x = output_625_cast_fp16, y = var_5818_to_fp16)[name = tensor("output_627_cast_fp16")]; tensor var_5830 = linear(bias = linear_0_bias_0, weight = wrapped_model_language_model_layers_26_self_attn_q_proj_weight_palettized, x = output_627_cast_fp16)[name = tensor("linear_182")]; tensor var_5831 = const()[name = tensor("op_5831"), val = tensor([1, 256, -1, 256])]; tensor var_5832 = reshape(shape = var_5831, x = var_5830)[name = tensor("op_5832")]; tensor x_627_perm_0 = const()[name = tensor("x_627_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_5835 = linear(bias = linear_1_bias_0, weight = wrapped_model_language_model_layers_26_self_attn_k_proj_weight_palettized, x = output_627_cast_fp16)[name = tensor("linear_183")]; tensor var_5836 = const()[name = tensor("op_5836"), val = tensor([1, 256, -1, 256])]; tensor var_5837 = reshape(shape = var_5836, x = var_5835)[name = tensor("op_5837")]; tensor x_631_perm_0 = const()[name = tensor("x_631_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_5840 = linear(bias = linear_1_bias_0, weight = wrapped_model_language_model_layers_26_self_attn_v_proj_weight_palettized, x = output_627_cast_fp16)[name = tensor("linear_184")]; tensor var_5841 = const()[name = tensor("op_5841"), val = tensor([1, 256, -1, 256])]; tensor var_5842 = reshape(shape = var_5841, x = var_5840)[name = tensor("op_5842")]; tensor hidden_states_371_perm_0 = const()[name = tensor("hidden_states_371_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_22_promoted_157_to_fp16 = const()[name = tensor("op_22_promoted_157_to_fp16"), val = tensor(0x1p+1)]; tensor x_627 = transpose(perm = x_627_perm_0, x = var_5832)[name = tensor("transpose_31")]; tensor var_5846_cast_fp16 = pow(x = x_627, y = var_22_promoted_157_to_fp16)[name = tensor("op_5846_cast_fp16")]; tensor var_5848_axes_0 = const()[name = tensor("op_5848_axes_0"), val = tensor([-1])]; tensor var_5848_keep_dims_0 = const()[name = tensor("op_5848_keep_dims_0"), val = tensor(true)]; tensor var_5848_cast_fp16 = reduce_mean(axes = var_5848_axes_0, keep_dims = var_5848_keep_dims_0, x = var_5846_cast_fp16)[name = tensor("op_5848_cast_fp16")]; tensor var_5849_to_fp16 = const()[name = tensor("op_5849_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_5850_cast_fp16 = add(x = var_5848_cast_fp16, y = var_5849_to_fp16)[name = tensor("op_5850_cast_fp16")]; tensor var_5851_epsilon_0 = const()[name = tensor("op_5851_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_5851_cast_fp16 = rsqrt(epsilon = var_5851_epsilon_0, x = var_5850_cast_fp16)[name = tensor("op_5851_cast_fp16")]; tensor output_629_cast_fp16 = mul(x = x_627, y = var_5851_cast_fp16)[name = tensor("output_629_cast_fp16")]; tensor var_5855_to_fp16 = const()[name = tensor("op_5855_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940764544)))]; tensor output_631_cast_fp16 = mul(x = output_629_cast_fp16, y = var_5855_to_fp16)[name = tensor("output_631_cast_fp16")]; tensor var_22_promoted_158_to_fp16 = const()[name = tensor("op_22_promoted_158_to_fp16"), val = tensor(0x1p+1)]; tensor x_631 = transpose(perm = x_631_perm_0, x = var_5837)[name = tensor("transpose_30")]; tensor var_5860_cast_fp16 = pow(x = x_631, y = var_22_promoted_158_to_fp16)[name = tensor("op_5860_cast_fp16")]; tensor var_5862_axes_0 = const()[name = tensor("op_5862_axes_0"), val = tensor([-1])]; tensor var_5862_keep_dims_0 = const()[name = tensor("op_5862_keep_dims_0"), val = tensor(true)]; tensor var_5862_cast_fp16 = reduce_mean(axes = var_5862_axes_0, keep_dims = var_5862_keep_dims_0, x = var_5860_cast_fp16)[name = tensor("op_5862_cast_fp16")]; tensor var_5863_to_fp16 = const()[name = tensor("op_5863_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_5864_cast_fp16 = add(x = var_5862_cast_fp16, y = var_5863_to_fp16)[name = tensor("op_5864_cast_fp16")]; tensor var_5865_epsilon_0 = const()[name = tensor("op_5865_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_5865_cast_fp16 = rsqrt(epsilon = var_5865_epsilon_0, x = var_5864_cast_fp16)[name = tensor("op_5865_cast_fp16")]; tensor output_633_cast_fp16 = mul(x = x_631, y = var_5865_cast_fp16)[name = tensor("output_633_cast_fp16")]; tensor var_5869_to_fp16 = const()[name = tensor("op_5869_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940765120)))]; tensor output_635_cast_fp16 = mul(x = output_633_cast_fp16, y = var_5869_to_fp16)[name = tensor("output_635_cast_fp16")]; tensor var_5874 = mul(x = output_631_cast_fp16, y = cos_7_palettized)[name = tensor("op_5874")]; tensor x1_105_begin_0 = const()[name = tensor("x1_105_begin_0"), val = tensor([0, 0, 0, 0])]; tensor x1_105_end_0 = const()[name = tensor("x1_105_end_0"), val = tensor([1, 8, 256, 128])]; tensor x1_105_end_mask_0 = const()[name = tensor("x1_105_end_mask_0"), val = tensor([true, true, true, false])]; tensor x1_105 = slice_by_index(begin = x1_105_begin_0, end = x1_105_end_0, end_mask = x1_105_end_mask_0, x = output_631_cast_fp16)[name = tensor("x1_105")]; tensor x2_105_begin_0 = const()[name = tensor("x2_105_begin_0"), val = tensor([0, 0, 0, 128])]; tensor x2_105_end_0 = const()[name = tensor("x2_105_end_0"), val = tensor([1, 8, 256, 256])]; tensor x2_105_end_mask_0 = const()[name = tensor("x2_105_end_mask_0"), val = tensor([true, true, true, true])]; tensor x2_105 = slice_by_index(begin = x2_105_begin_0, end = x2_105_end_0, end_mask = x2_105_end_mask_0, x = output_631_cast_fp16)[name = tensor("x2_105")]; tensor const_633_promoted = const()[name = tensor("const_633_promoted"), val = tensor(-0x1p+0)]; tensor var_5885 = mul(x = x2_105, y = const_633_promoted)[name = tensor("op_5885")]; tensor var_5887_interleave_0 = const()[name = tensor("op_5887_interleave_0"), val = tensor(false)]; tensor var_5887 = concat(axis = var_24, interleave = var_5887_interleave_0, values = (var_5885, x1_105))[name = tensor("op_5887")]; tensor var_5888 = mul(x = var_5887, y = sin_7_palettized)[name = tensor("op_5888")]; tensor query_53 = add(x = var_5874, y = var_5888)[name = tensor("query_53")]; tensor var_5890 = mul(x = output_635_cast_fp16, y = cos_7_palettized)[name = tensor("op_5890")]; tensor x1_107_begin_0 = const()[name = tensor("x1_107_begin_0"), val = tensor([0, 0, 0, 0])]; tensor x1_107_end_0 = const()[name = tensor("x1_107_end_0"), val = tensor([1, 4, 256, 128])]; tensor x1_107_end_mask_0 = const()[name = tensor("x1_107_end_mask_0"), val = tensor([true, true, true, false])]; tensor x1_107 = slice_by_index(begin = x1_107_begin_0, end = x1_107_end_0, end_mask = x1_107_end_mask_0, x = output_635_cast_fp16)[name = tensor("x1_107")]; tensor x2_107_begin_0 = const()[name = tensor("x2_107_begin_0"), val = tensor([0, 0, 0, 128])]; tensor x2_107_end_0 = const()[name = tensor("x2_107_end_0"), val = tensor([1, 4, 256, 256])]; tensor x2_107_end_mask_0 = const()[name = tensor("x2_107_end_mask_0"), val = tensor([true, true, true, true])]; tensor x2_107 = slice_by_index(begin = x2_107_begin_0, end = x2_107_end_0, end_mask = x2_107_end_mask_0, x = output_635_cast_fp16)[name = tensor("x2_107")]; tensor const_636_promoted = const()[name = tensor("const_636_promoted"), val = tensor(-0x1p+0)]; tensor var_5901 = mul(x = x2_107, y = const_636_promoted)[name = tensor("op_5901")]; tensor var_5903_interleave_0 = const()[name = tensor("op_5903_interleave_0"), val = tensor(false)]; tensor var_5903 = concat(axis = var_24, interleave = var_5903_interleave_0, values = (var_5901, x1_107))[name = tensor("op_5903")]; tensor var_5904 = mul(x = var_5903, y = sin_7_palettized)[name = tensor("op_5904")]; tensor hidden_states_367 = add(x = var_5890, y = var_5904)[name = tensor("hidden_states_367")]; tensor var_5913_axes_0 = const()[name = tensor("op_5913_axes_0"), val = tensor([2])]; tensor var_5913 = expand_dims(axes = var_5913_axes_0, x = hidden_states_367)[name = tensor("op_5913")]; tensor hidden_states_369_reps_0 = const()[name = tensor("hidden_states_369_reps_0"), val = tensor([1, 1, 2, 1, 1])]; tensor hidden_states_369 = tile(reps = hidden_states_369_reps_0, x = var_5913)[name = tensor("hidden_states_369")]; tensor var_5921 = const()[name = tensor("op_5921"), val = tensor([1, 8, 256, 256])]; tensor key_states_53 = reshape(shape = var_5921, x = hidden_states_369)[name = tensor("key_states_53")]; tensor var_5930_axes_0 = const()[name = tensor("op_5930_axes_0"), val = tensor([2])]; tensor hidden_states_371 = transpose(perm = hidden_states_371_perm_0, x = var_5842)[name = tensor("transpose_29")]; tensor var_5930 = expand_dims(axes = var_5930_axes_0, x = hidden_states_371)[name = tensor("op_5930")]; tensor hidden_states_373_reps_0 = const()[name = tensor("hidden_states_373_reps_0"), val = tensor([1, 1, 2, 1, 1])]; tensor hidden_states_373 = tile(reps = hidden_states_373_reps_0, x = var_5930)[name = tensor("hidden_states_373")]; tensor var_5938 = const()[name = tensor("op_5938"), val = tensor([1, 8, 256, 256])]; tensor value_states_53 = reshape(shape = var_5938, x = hidden_states_373)[name = tensor("value_states_53")]; tensor var_5941_transpose_x_1 = const()[name = tensor("op_5941_transpose_x_1"), val = tensor(false)]; tensor var_5941_transpose_y_1 = const()[name = tensor("op_5941_transpose_y_1"), val = tensor(true)]; tensor var_5941 = matmul(transpose_x = var_5941_transpose_x_1, transpose_y = var_5941_transpose_y_1, x = query_53, y = key_states_53)[name = tensor("op_5941")]; tensor var_5942_to_fp16 = const()[name = tensor("op_5942_to_fp16"), val = tensor(0x1p-4)]; tensor attn_weights_105_cast_fp16 = mul(x = var_5941, y = var_5942_to_fp16)[name = tensor("attn_weights_105_cast_fp16")]; tensor input_313_cast_fp16 = add(x = attn_weights_105_cast_fp16, y = attention_mask_to_fp16_palettized)[name = tensor("input_313_cast_fp16")]; tensor var_5950_cast_fp16 = softmax(axis = var_24, x = input_313_cast_fp16)[name = tensor("op_5950_cast_fp16")]; tensor attn_output_105_transpose_x_0 = const()[name = tensor("attn_output_105_transpose_x_0"), val = tensor(false)]; tensor attn_output_105_transpose_y_0 = const()[name = tensor("attn_output_105_transpose_y_0"), val = tensor(false)]; tensor attn_output_105 = matmul(transpose_x = attn_output_105_transpose_x_0, transpose_y = attn_output_105_transpose_y_0, x = var_5950_cast_fp16, y = value_states_53)[name = tensor("attn_output_105")]; tensor var_5954_perm_0 = const()[name = tensor("op_5954_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_5956 = const()[name = tensor("op_5956"), val = tensor([1, 256, -1])]; tensor var_5954 = transpose(perm = var_5954_perm_0, x = attn_output_105)[name = tensor("transpose_28")]; tensor var_5957 = reshape(shape = var_5956, x = var_5954)[name = tensor("op_5957")]; tensor x_635 = linear(bias = linear_3_bias_0, weight = wrapped_model_language_model_layers_26_self_attn_o_proj_weight_palettized, x = var_5957)[name = tensor("linear_185")]; tensor var_22_promoted_159_to_fp16 = const()[name = tensor("op_22_promoted_159_to_fp16"), val = tensor(0x1p+1)]; tensor var_5963_cast_fp16 = pow(x = x_635, y = var_22_promoted_159_to_fp16)[name = tensor("op_5963_cast_fp16")]; tensor var_5965_axes_0 = const()[name = tensor("op_5965_axes_0"), val = tensor([-1])]; tensor var_5965_keep_dims_0 = const()[name = tensor("op_5965_keep_dims_0"), val = tensor(true)]; tensor var_5965_cast_fp16 = reduce_mean(axes = var_5965_axes_0, keep_dims = var_5965_keep_dims_0, x = var_5963_cast_fp16)[name = tensor("op_5965_cast_fp16")]; tensor var_5966_to_fp16 = const()[name = tensor("op_5966_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_5967_cast_fp16 = add(x = var_5965_cast_fp16, y = var_5966_to_fp16)[name = tensor("op_5967_cast_fp16")]; tensor var_5968_epsilon_0 = const()[name = tensor("op_5968_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_5968_cast_fp16 = rsqrt(epsilon = var_5968_epsilon_0, x = var_5967_cast_fp16)[name = tensor("op_5968_cast_fp16")]; tensor output_637_cast_fp16 = mul(x = x_635, y = var_5968_cast_fp16)[name = tensor("output_637_cast_fp16")]; tensor var_5972_to_fp16 = const()[name = tensor("op_5972_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940765696)))]; tensor output_639_cast_fp16 = mul(x = output_637_cast_fp16, y = var_5972_to_fp16)[name = tensor("output_639_cast_fp16")]; tensor x_639 = add(x = x_623, y = output_639_cast_fp16)[name = tensor("x_639")]; tensor var_22_promoted_160_to_fp16 = const()[name = tensor("op_22_promoted_160_to_fp16"), val = tensor(0x1p+1)]; tensor var_5978_cast_fp16 = pow(x = x_639, y = var_22_promoted_160_to_fp16)[name = tensor("op_5978_cast_fp16")]; tensor var_5980_axes_0 = const()[name = tensor("op_5980_axes_0"), val = tensor([-1])]; tensor var_5980_keep_dims_0 = const()[name = tensor("op_5980_keep_dims_0"), val = tensor(true)]; tensor var_5980_cast_fp16 = reduce_mean(axes = var_5980_axes_0, keep_dims = var_5980_keep_dims_0, x = var_5978_cast_fp16)[name = tensor("op_5980_cast_fp16")]; tensor var_5981_to_fp16 = const()[name = tensor("op_5981_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_5982_cast_fp16 = add(x = var_5980_cast_fp16, y = var_5981_to_fp16)[name = tensor("op_5982_cast_fp16")]; tensor var_5983_epsilon_0 = const()[name = tensor("op_5983_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_5983_cast_fp16 = rsqrt(epsilon = var_5983_epsilon_0, x = var_5982_cast_fp16)[name = tensor("op_5983_cast_fp16")]; tensor output_641_cast_fp16 = mul(x = x_639, y = var_5983_cast_fp16)[name = tensor("output_641_cast_fp16")]; tensor var_5987_to_fp16 = const()[name = tensor("op_5987_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940770880)))]; tensor output_643_cast_fp16 = mul(x = output_641_cast_fp16, y = var_5987_to_fp16)[name = tensor("output_643_cast_fp16")]; tensor input_321 = linear(bias = linear_4_bias_0, weight = wrapped_model_language_model_layers_26_mlp_gate_proj_weight_palettized, x = output_643_cast_fp16)[name = tensor("linear_186")]; tensor var_5995_mode_0 = const()[name = tensor("op_5995_mode_0"), val = tensor("TANH_APPROXIMATION")]; tensor var_5995 = gelu(mode = var_5995_mode_0, x = input_321)[name = tensor("op_5995")]; tensor var_5997 = linear(bias = linear_4_bias_0, weight = wrapped_model_language_model_layers_26_mlp_up_proj_weight_palettized, x = output_643_cast_fp16)[name = tensor("linear_187")]; tensor input_323 = mul(x = var_5995, y = var_5997)[name = tensor("input_323")]; tensor x_643 = linear(bias = linear_3_bias_0, weight = wrapped_model_language_model_layers_26_mlp_down_proj_weight_palettized, x = input_323)[name = tensor("linear_188")]; tensor var_22_promoted_161_to_fp16 = const()[name = tensor("op_22_promoted_161_to_fp16"), val = tensor(0x1p+1)]; tensor var_6003_cast_fp16 = pow(x = x_643, y = var_22_promoted_161_to_fp16)[name = tensor("op_6003_cast_fp16")]; tensor var_6005_axes_0 = const()[name = tensor("op_6005_axes_0"), val = tensor([-1])]; tensor var_6005_keep_dims_0 = const()[name = tensor("op_6005_keep_dims_0"), val = tensor(true)]; tensor var_6005_cast_fp16 = reduce_mean(axes = var_6005_axes_0, keep_dims = var_6005_keep_dims_0, x = var_6003_cast_fp16)[name = tensor("op_6005_cast_fp16")]; tensor var_6006_to_fp16 = const()[name = tensor("op_6006_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_6007_cast_fp16 = add(x = var_6005_cast_fp16, y = var_6006_to_fp16)[name = tensor("op_6007_cast_fp16")]; tensor var_6008_epsilon_0 = const()[name = tensor("op_6008_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_6008_cast_fp16 = rsqrt(epsilon = var_6008_epsilon_0, x = var_6007_cast_fp16)[name = tensor("op_6008_cast_fp16")]; tensor output_645_cast_fp16 = mul(x = x_643, y = var_6008_cast_fp16)[name = tensor("output_645_cast_fp16")]; tensor var_6012_to_fp16 = const()[name = tensor("op_6012_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940776064)))]; tensor output_647_cast_fp16 = mul(x = output_645_cast_fp16, y = var_6012_to_fp16)[name = tensor("output_647_cast_fp16")]; tensor x_647 = add(x = x_639, y = output_647_cast_fp16)[name = tensor("x_647")]; tensor var_22_promoted_162_to_fp16 = const()[name = tensor("op_22_promoted_162_to_fp16"), val = tensor(0x1p+1)]; tensor var_6024_cast_fp16 = pow(x = x_647, y = var_22_promoted_162_to_fp16)[name = tensor("op_6024_cast_fp16")]; tensor var_6026_axes_0 = const()[name = tensor("op_6026_axes_0"), val = tensor([-1])]; tensor var_6026_keep_dims_0 = const()[name = tensor("op_6026_keep_dims_0"), val = tensor(true)]; tensor var_6026_cast_fp16 = reduce_mean(axes = var_6026_axes_0, keep_dims = var_6026_keep_dims_0, x = var_6024_cast_fp16)[name = tensor("op_6026_cast_fp16")]; tensor var_6027_to_fp16 = const()[name = tensor("op_6027_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_6028_cast_fp16 = add(x = var_6026_cast_fp16, y = var_6027_to_fp16)[name = tensor("op_6028_cast_fp16")]; tensor var_6029_epsilon_0 = const()[name = tensor("op_6029_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_6029_cast_fp16 = rsqrt(epsilon = var_6029_epsilon_0, x = var_6028_cast_fp16)[name = tensor("op_6029_cast_fp16")]; tensor output_649_cast_fp16 = mul(x = x_647, y = var_6029_cast_fp16)[name = tensor("output_649_cast_fp16")]; tensor var_6033_to_fp16 = const()[name = tensor("op_6033_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940781248)))]; tensor output_651_cast_fp16 = mul(x = output_649_cast_fp16, y = var_6033_to_fp16)[name = tensor("output_651_cast_fp16")]; tensor var_6045 = linear(bias = linear_0_bias_0, weight = wrapped_model_language_model_layers_27_self_attn_q_proj_weight_palettized, x = output_651_cast_fp16)[name = tensor("linear_189")]; tensor var_6046 = const()[name = tensor("op_6046"), val = tensor([1, 256, -1, 256])]; tensor var_6047 = reshape(shape = var_6046, x = var_6045)[name = tensor("op_6047")]; tensor x_651_perm_0 = const()[name = tensor("x_651_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_6050 = linear(bias = linear_1_bias_0, weight = wrapped_model_language_model_layers_27_self_attn_k_proj_weight_palettized, x = output_651_cast_fp16)[name = tensor("linear_190")]; tensor var_6051 = const()[name = tensor("op_6051"), val = tensor([1, 256, -1, 256])]; tensor var_6052 = reshape(shape = var_6051, x = var_6050)[name = tensor("op_6052")]; tensor x_655_perm_0 = const()[name = tensor("x_655_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_6055 = linear(bias = linear_1_bias_0, weight = wrapped_model_language_model_layers_27_self_attn_v_proj_weight_palettized, x = output_651_cast_fp16)[name = tensor("linear_191")]; tensor var_6056 = const()[name = tensor("op_6056"), val = tensor([1, 256, -1, 256])]; tensor var_6057 = reshape(shape = var_6056, x = var_6055)[name = tensor("op_6057")]; tensor hidden_states_385_perm_0 = const()[name = tensor("hidden_states_385_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_22_promoted_163_to_fp16 = const()[name = tensor("op_22_promoted_163_to_fp16"), val = tensor(0x1p+1)]; tensor x_651 = transpose(perm = x_651_perm_0, x = var_6047)[name = tensor("transpose_27")]; tensor var_6061_cast_fp16 = pow(x = x_651, y = var_22_promoted_163_to_fp16)[name = tensor("op_6061_cast_fp16")]; tensor var_6063_axes_0 = const()[name = tensor("op_6063_axes_0"), val = tensor([-1])]; tensor var_6063_keep_dims_0 = const()[name = tensor("op_6063_keep_dims_0"), val = tensor(true)]; tensor var_6063_cast_fp16 = reduce_mean(axes = var_6063_axes_0, keep_dims = var_6063_keep_dims_0, x = var_6061_cast_fp16)[name = tensor("op_6063_cast_fp16")]; tensor var_6064_to_fp16 = const()[name = tensor("op_6064_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_6065_cast_fp16 = add(x = var_6063_cast_fp16, y = var_6064_to_fp16)[name = tensor("op_6065_cast_fp16")]; tensor var_6066_epsilon_0 = const()[name = tensor("op_6066_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_6066_cast_fp16 = rsqrt(epsilon = var_6066_epsilon_0, x = var_6065_cast_fp16)[name = tensor("op_6066_cast_fp16")]; tensor output_653_cast_fp16 = mul(x = x_651, y = var_6066_cast_fp16)[name = tensor("output_653_cast_fp16")]; tensor var_6070_to_fp16 = const()[name = tensor("op_6070_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940786432)))]; tensor output_655_cast_fp16 = mul(x = output_653_cast_fp16, y = var_6070_to_fp16)[name = tensor("output_655_cast_fp16")]; tensor var_22_promoted_164_to_fp16 = const()[name = tensor("op_22_promoted_164_to_fp16"), val = tensor(0x1p+1)]; tensor x_655 = transpose(perm = x_655_perm_0, x = var_6052)[name = tensor("transpose_26")]; tensor var_6075_cast_fp16 = pow(x = x_655, y = var_22_promoted_164_to_fp16)[name = tensor("op_6075_cast_fp16")]; tensor var_6077_axes_0 = const()[name = tensor("op_6077_axes_0"), val = tensor([-1])]; tensor var_6077_keep_dims_0 = const()[name = tensor("op_6077_keep_dims_0"), val = tensor(true)]; tensor var_6077_cast_fp16 = reduce_mean(axes = var_6077_axes_0, keep_dims = var_6077_keep_dims_0, x = var_6075_cast_fp16)[name = tensor("op_6077_cast_fp16")]; tensor var_6078_to_fp16 = const()[name = tensor("op_6078_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_6079_cast_fp16 = add(x = var_6077_cast_fp16, y = var_6078_to_fp16)[name = tensor("op_6079_cast_fp16")]; tensor var_6080_epsilon_0 = const()[name = tensor("op_6080_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_6080_cast_fp16 = rsqrt(epsilon = var_6080_epsilon_0, x = var_6079_cast_fp16)[name = tensor("op_6080_cast_fp16")]; tensor output_657_cast_fp16 = mul(x = x_655, y = var_6080_cast_fp16)[name = tensor("output_657_cast_fp16")]; tensor var_6084_to_fp16 = const()[name = tensor("op_6084_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940787008)))]; tensor output_659_cast_fp16 = mul(x = output_657_cast_fp16, y = var_6084_to_fp16)[name = tensor("output_659_cast_fp16")]; tensor var_6089 = mul(x = output_655_cast_fp16, y = cos_7_palettized)[name = tensor("op_6089")]; tensor x1_109_begin_0 = const()[name = tensor("x1_109_begin_0"), val = tensor([0, 0, 0, 0])]; tensor x1_109_end_0 = const()[name = tensor("x1_109_end_0"), val = tensor([1, 8, 256, 128])]; tensor x1_109_end_mask_0 = const()[name = tensor("x1_109_end_mask_0"), val = tensor([true, true, true, false])]; tensor x1_109 = slice_by_index(begin = x1_109_begin_0, end = x1_109_end_0, end_mask = x1_109_end_mask_0, x = output_655_cast_fp16)[name = tensor("x1_109")]; tensor x2_109_begin_0 = const()[name = tensor("x2_109_begin_0"), val = tensor([0, 0, 0, 128])]; tensor x2_109_end_0 = const()[name = tensor("x2_109_end_0"), val = tensor([1, 8, 256, 256])]; tensor x2_109_end_mask_0 = const()[name = tensor("x2_109_end_mask_0"), val = tensor([true, true, true, true])]; tensor x2_109 = slice_by_index(begin = x2_109_begin_0, end = x2_109_end_0, end_mask = x2_109_end_mask_0, x = output_655_cast_fp16)[name = tensor("x2_109")]; tensor const_656_promoted = const()[name = tensor("const_656_promoted"), val = tensor(-0x1p+0)]; tensor var_6100 = mul(x = x2_109, y = const_656_promoted)[name = tensor("op_6100")]; tensor var_6102_interleave_0 = const()[name = tensor("op_6102_interleave_0"), val = tensor(false)]; tensor var_6102 = concat(axis = var_24, interleave = var_6102_interleave_0, values = (var_6100, x1_109))[name = tensor("op_6102")]; tensor var_6103 = mul(x = var_6102, y = sin_7_palettized)[name = tensor("op_6103")]; tensor query_55 = add(x = var_6089, y = var_6103)[name = tensor("query_55")]; tensor var_6105 = mul(x = output_659_cast_fp16, y = cos_7_palettized)[name = tensor("op_6105")]; tensor x1_111_begin_0 = const()[name = tensor("x1_111_begin_0"), val = tensor([0, 0, 0, 0])]; tensor x1_111_end_0 = const()[name = tensor("x1_111_end_0"), val = tensor([1, 4, 256, 128])]; tensor x1_111_end_mask_0 = const()[name = tensor("x1_111_end_mask_0"), val = tensor([true, true, true, false])]; tensor x1_111 = slice_by_index(begin = x1_111_begin_0, end = x1_111_end_0, end_mask = x1_111_end_mask_0, x = output_659_cast_fp16)[name = tensor("x1_111")]; tensor x2_111_begin_0 = const()[name = tensor("x2_111_begin_0"), val = tensor([0, 0, 0, 128])]; tensor x2_111_end_0 = const()[name = tensor("x2_111_end_0"), val = tensor([1, 4, 256, 256])]; tensor x2_111_end_mask_0 = const()[name = tensor("x2_111_end_mask_0"), val = tensor([true, true, true, true])]; tensor x2_111 = slice_by_index(begin = x2_111_begin_0, end = x2_111_end_0, end_mask = x2_111_end_mask_0, x = output_659_cast_fp16)[name = tensor("x2_111")]; tensor const_659_promoted = const()[name = tensor("const_659_promoted"), val = tensor(-0x1p+0)]; tensor var_6116 = mul(x = x2_111, y = const_659_promoted)[name = tensor("op_6116")]; tensor var_6118_interleave_0 = const()[name = tensor("op_6118_interleave_0"), val = tensor(false)]; tensor var_6118 = concat(axis = var_24, interleave = var_6118_interleave_0, values = (var_6116, x1_111))[name = tensor("op_6118")]; tensor var_6119 = mul(x = var_6118, y = sin_7_palettized)[name = tensor("op_6119")]; tensor hidden_states_381 = add(x = var_6105, y = var_6119)[name = tensor("hidden_states_381")]; tensor var_6128_axes_0 = const()[name = tensor("op_6128_axes_0"), val = tensor([2])]; tensor var_6128 = expand_dims(axes = var_6128_axes_0, x = hidden_states_381)[name = tensor("op_6128")]; tensor hidden_states_383_reps_0 = const()[name = tensor("hidden_states_383_reps_0"), val = tensor([1, 1, 2, 1, 1])]; tensor hidden_states_383 = tile(reps = hidden_states_383_reps_0, x = var_6128)[name = tensor("hidden_states_383")]; tensor var_6136 = const()[name = tensor("op_6136"), val = tensor([1, 8, 256, 256])]; tensor key_states_55 = reshape(shape = var_6136, x = hidden_states_383)[name = tensor("key_states_55")]; tensor var_6145_axes_0 = const()[name = tensor("op_6145_axes_0"), val = tensor([2])]; tensor hidden_states_385 = transpose(perm = hidden_states_385_perm_0, x = var_6057)[name = tensor("transpose_25")]; tensor var_6145 = expand_dims(axes = var_6145_axes_0, x = hidden_states_385)[name = tensor("op_6145")]; tensor hidden_states_387_reps_0 = const()[name = tensor("hidden_states_387_reps_0"), val = tensor([1, 1, 2, 1, 1])]; tensor hidden_states_387 = tile(reps = hidden_states_387_reps_0, x = var_6145)[name = tensor("hidden_states_387")]; tensor var_6153 = const()[name = tensor("op_6153"), val = tensor([1, 8, 256, 256])]; tensor value_states_55 = reshape(shape = var_6153, x = hidden_states_387)[name = tensor("value_states_55")]; tensor var_6156_transpose_x_1 = const()[name = tensor("op_6156_transpose_x_1"), val = tensor(false)]; tensor var_6156_transpose_y_1 = const()[name = tensor("op_6156_transpose_y_1"), val = tensor(true)]; tensor var_6156 = matmul(transpose_x = var_6156_transpose_x_1, transpose_y = var_6156_transpose_y_1, x = query_55, y = key_states_55)[name = tensor("op_6156")]; tensor var_6157_to_fp16 = const()[name = tensor("op_6157_to_fp16"), val = tensor(0x1p-4)]; tensor attn_weights_109_cast_fp16 = mul(x = var_6156, y = var_6157_to_fp16)[name = tensor("attn_weights_109_cast_fp16")]; tensor input_325_cast_fp16 = add(x = attn_weights_109_cast_fp16, y = attention_mask_to_fp16_palettized)[name = tensor("input_325_cast_fp16")]; tensor var_6165_cast_fp16 = softmax(axis = var_24, x = input_325_cast_fp16)[name = tensor("op_6165_cast_fp16")]; tensor attn_output_109_transpose_x_0 = const()[name = tensor("attn_output_109_transpose_x_0"), val = tensor(false)]; tensor attn_output_109_transpose_y_0 = const()[name = tensor("attn_output_109_transpose_y_0"), val = tensor(false)]; tensor attn_output_109 = matmul(transpose_x = attn_output_109_transpose_x_0, transpose_y = attn_output_109_transpose_y_0, x = var_6165_cast_fp16, y = value_states_55)[name = tensor("attn_output_109")]; tensor var_6169_perm_0 = const()[name = tensor("op_6169_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_6171 = const()[name = tensor("op_6171"), val = tensor([1, 256, -1])]; tensor var_6169 = transpose(perm = var_6169_perm_0, x = attn_output_109)[name = tensor("transpose_24")]; tensor var_6172 = reshape(shape = var_6171, x = var_6169)[name = tensor("op_6172")]; tensor x_659 = linear(bias = linear_3_bias_0, weight = wrapped_model_language_model_layers_27_self_attn_o_proj_weight_palettized, x = var_6172)[name = tensor("linear_192")]; tensor var_22_promoted_165_to_fp16 = const()[name = tensor("op_22_promoted_165_to_fp16"), val = tensor(0x1p+1)]; tensor var_6178_cast_fp16 = pow(x = x_659, y = var_22_promoted_165_to_fp16)[name = tensor("op_6178_cast_fp16")]; tensor var_6180_axes_0 = const()[name = tensor("op_6180_axes_0"), val = tensor([-1])]; tensor var_6180_keep_dims_0 = const()[name = tensor("op_6180_keep_dims_0"), val = tensor(true)]; tensor var_6180_cast_fp16 = reduce_mean(axes = var_6180_axes_0, keep_dims = var_6180_keep_dims_0, x = var_6178_cast_fp16)[name = tensor("op_6180_cast_fp16")]; tensor var_6181_to_fp16 = const()[name = tensor("op_6181_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_6182_cast_fp16 = add(x = var_6180_cast_fp16, y = var_6181_to_fp16)[name = tensor("op_6182_cast_fp16")]; tensor var_6183_epsilon_0 = const()[name = tensor("op_6183_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_6183_cast_fp16 = rsqrt(epsilon = var_6183_epsilon_0, x = var_6182_cast_fp16)[name = tensor("op_6183_cast_fp16")]; tensor output_661_cast_fp16 = mul(x = x_659, y = var_6183_cast_fp16)[name = tensor("output_661_cast_fp16")]; tensor var_6187_to_fp16 = const()[name = tensor("op_6187_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940787584)))]; tensor output_663_cast_fp16 = mul(x = output_661_cast_fp16, y = var_6187_to_fp16)[name = tensor("output_663_cast_fp16")]; tensor x_663 = add(x = x_647, y = output_663_cast_fp16)[name = tensor("x_663")]; tensor var_22_promoted_166_to_fp16 = const()[name = tensor("op_22_promoted_166_to_fp16"), val = tensor(0x1p+1)]; tensor var_6193_cast_fp16 = pow(x = x_663, y = var_22_promoted_166_to_fp16)[name = tensor("op_6193_cast_fp16")]; tensor var_6195_axes_0 = const()[name = tensor("op_6195_axes_0"), val = tensor([-1])]; tensor var_6195_keep_dims_0 = const()[name = tensor("op_6195_keep_dims_0"), val = tensor(true)]; tensor var_6195_cast_fp16 = reduce_mean(axes = var_6195_axes_0, keep_dims = var_6195_keep_dims_0, x = var_6193_cast_fp16)[name = tensor("op_6195_cast_fp16")]; tensor var_6196_to_fp16 = const()[name = tensor("op_6196_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_6197_cast_fp16 = add(x = var_6195_cast_fp16, y = var_6196_to_fp16)[name = tensor("op_6197_cast_fp16")]; tensor var_6198_epsilon_0 = const()[name = tensor("op_6198_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_6198_cast_fp16 = rsqrt(epsilon = var_6198_epsilon_0, x = var_6197_cast_fp16)[name = tensor("op_6198_cast_fp16")]; tensor output_665_cast_fp16 = mul(x = x_663, y = var_6198_cast_fp16)[name = tensor("output_665_cast_fp16")]; tensor var_6202_to_fp16 = const()[name = tensor("op_6202_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940792768)))]; tensor output_667_cast_fp16 = mul(x = output_665_cast_fp16, y = var_6202_to_fp16)[name = tensor("output_667_cast_fp16")]; tensor input_333 = linear(bias = linear_4_bias_0, weight = wrapped_model_language_model_layers_27_mlp_gate_proj_weight_palettized, x = output_667_cast_fp16)[name = tensor("linear_193")]; tensor var_6210_mode_0 = const()[name = tensor("op_6210_mode_0"), val = tensor("TANH_APPROXIMATION")]; tensor var_6210 = gelu(mode = var_6210_mode_0, x = input_333)[name = tensor("op_6210")]; tensor var_6212 = linear(bias = linear_4_bias_0, weight = wrapped_model_language_model_layers_27_mlp_up_proj_weight_palettized, x = output_667_cast_fp16)[name = tensor("linear_194")]; tensor input_335 = mul(x = var_6210, y = var_6212)[name = tensor("input_335")]; tensor x_667 = linear(bias = linear_3_bias_0, weight = wrapped_model_language_model_layers_27_mlp_down_proj_weight_palettized, x = input_335)[name = tensor("linear_195")]; tensor var_22_promoted_167_to_fp16 = const()[name = tensor("op_22_promoted_167_to_fp16"), val = tensor(0x1p+1)]; tensor var_6218_cast_fp16 = pow(x = x_667, y = var_22_promoted_167_to_fp16)[name = tensor("op_6218_cast_fp16")]; tensor var_6220_axes_0 = const()[name = tensor("op_6220_axes_0"), val = tensor([-1])]; tensor var_6220_keep_dims_0 = const()[name = tensor("op_6220_keep_dims_0"), val = tensor(true)]; tensor var_6220_cast_fp16 = reduce_mean(axes = var_6220_axes_0, keep_dims = var_6220_keep_dims_0, x = var_6218_cast_fp16)[name = tensor("op_6220_cast_fp16")]; tensor var_6221_to_fp16 = const()[name = tensor("op_6221_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_6222_cast_fp16 = add(x = var_6220_cast_fp16, y = var_6221_to_fp16)[name = tensor("op_6222_cast_fp16")]; tensor var_6223_epsilon_0 = const()[name = tensor("op_6223_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_6223_cast_fp16 = rsqrt(epsilon = var_6223_epsilon_0, x = var_6222_cast_fp16)[name = tensor("op_6223_cast_fp16")]; tensor output_669_cast_fp16 = mul(x = x_667, y = var_6223_cast_fp16)[name = tensor("output_669_cast_fp16")]; tensor var_6227_to_fp16 = const()[name = tensor("op_6227_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940797952)))]; tensor output_671_cast_fp16 = mul(x = output_669_cast_fp16, y = var_6227_to_fp16)[name = tensor("output_671_cast_fp16")]; tensor x_671 = add(x = x_663, y = output_671_cast_fp16)[name = tensor("x_671")]; tensor var_22_promoted_168_to_fp16 = const()[name = tensor("op_22_promoted_168_to_fp16"), val = tensor(0x1p+1)]; tensor var_6239_cast_fp16 = pow(x = x_671, y = var_22_promoted_168_to_fp16)[name = tensor("op_6239_cast_fp16")]; tensor var_6241_axes_0 = const()[name = tensor("op_6241_axes_0"), val = tensor([-1])]; tensor var_6241_keep_dims_0 = const()[name = tensor("op_6241_keep_dims_0"), val = tensor(true)]; tensor var_6241_cast_fp16 = reduce_mean(axes = var_6241_axes_0, keep_dims = var_6241_keep_dims_0, x = var_6239_cast_fp16)[name = tensor("op_6241_cast_fp16")]; tensor var_6242_to_fp16 = const()[name = tensor("op_6242_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_6243_cast_fp16 = add(x = var_6241_cast_fp16, y = var_6242_to_fp16)[name = tensor("op_6243_cast_fp16")]; tensor var_6244_epsilon_0 = const()[name = tensor("op_6244_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_6244_cast_fp16 = rsqrt(epsilon = var_6244_epsilon_0, x = var_6243_cast_fp16)[name = tensor("op_6244_cast_fp16")]; tensor output_673_cast_fp16 = mul(x = x_671, y = var_6244_cast_fp16)[name = tensor("output_673_cast_fp16")]; tensor var_6248_to_fp16 = const()[name = tensor("op_6248_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940803136)))]; tensor output_675_cast_fp16 = mul(x = output_673_cast_fp16, y = var_6248_to_fp16)[name = tensor("output_675_cast_fp16")]; tensor var_6260 = linear(bias = linear_0_bias_0, weight = wrapped_model_language_model_layers_28_self_attn_q_proj_weight_palettized, x = output_675_cast_fp16)[name = tensor("linear_196")]; tensor var_6261 = const()[name = tensor("op_6261"), val = tensor([1, 256, -1, 256])]; tensor var_6262 = reshape(shape = var_6261, x = var_6260)[name = tensor("op_6262")]; tensor x_675_perm_0 = const()[name = tensor("x_675_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_6265 = linear(bias = linear_1_bias_0, weight = wrapped_model_language_model_layers_28_self_attn_k_proj_weight_palettized, x = output_675_cast_fp16)[name = tensor("linear_197")]; tensor var_6266 = const()[name = tensor("op_6266"), val = tensor([1, 256, -1, 256])]; tensor var_6267 = reshape(shape = var_6266, x = var_6265)[name = tensor("op_6267")]; tensor x_679_perm_0 = const()[name = tensor("x_679_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_6270 = linear(bias = linear_1_bias_0, weight = wrapped_model_language_model_layers_28_self_attn_v_proj_weight_palettized, x = output_675_cast_fp16)[name = tensor("linear_198")]; tensor var_6271 = const()[name = tensor("op_6271"), val = tensor([1, 256, -1, 256])]; tensor var_6272 = reshape(shape = var_6271, x = var_6270)[name = tensor("op_6272")]; tensor hidden_states_399_perm_0 = const()[name = tensor("hidden_states_399_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_22_promoted_169_to_fp16 = const()[name = tensor("op_22_promoted_169_to_fp16"), val = tensor(0x1p+1)]; tensor x_675 = transpose(perm = x_675_perm_0, x = var_6262)[name = tensor("transpose_23")]; tensor var_6276_cast_fp16 = pow(x = x_675, y = var_22_promoted_169_to_fp16)[name = tensor("op_6276_cast_fp16")]; tensor var_6278_axes_0 = const()[name = tensor("op_6278_axes_0"), val = tensor([-1])]; tensor var_6278_keep_dims_0 = const()[name = tensor("op_6278_keep_dims_0"), val = tensor(true)]; tensor var_6278_cast_fp16 = reduce_mean(axes = var_6278_axes_0, keep_dims = var_6278_keep_dims_0, x = var_6276_cast_fp16)[name = tensor("op_6278_cast_fp16")]; tensor var_6279_to_fp16 = const()[name = tensor("op_6279_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_6280_cast_fp16 = add(x = var_6278_cast_fp16, y = var_6279_to_fp16)[name = tensor("op_6280_cast_fp16")]; tensor var_6281_epsilon_0 = const()[name = tensor("op_6281_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_6281_cast_fp16 = rsqrt(epsilon = var_6281_epsilon_0, x = var_6280_cast_fp16)[name = tensor("op_6281_cast_fp16")]; tensor output_677_cast_fp16 = mul(x = x_675, y = var_6281_cast_fp16)[name = tensor("output_677_cast_fp16")]; tensor var_6285_to_fp16 = const()[name = tensor("op_6285_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940808320)))]; tensor output_679_cast_fp16 = mul(x = output_677_cast_fp16, y = var_6285_to_fp16)[name = tensor("output_679_cast_fp16")]; tensor var_22_promoted_170_to_fp16 = const()[name = tensor("op_22_promoted_170_to_fp16"), val = tensor(0x1p+1)]; tensor x_679 = transpose(perm = x_679_perm_0, x = var_6267)[name = tensor("transpose_22")]; tensor var_6290_cast_fp16 = pow(x = x_679, y = var_22_promoted_170_to_fp16)[name = tensor("op_6290_cast_fp16")]; tensor var_6292_axes_0 = const()[name = tensor("op_6292_axes_0"), val = tensor([-1])]; tensor var_6292_keep_dims_0 = const()[name = tensor("op_6292_keep_dims_0"), val = tensor(true)]; tensor var_6292_cast_fp16 = reduce_mean(axes = var_6292_axes_0, keep_dims = var_6292_keep_dims_0, x = var_6290_cast_fp16)[name = tensor("op_6292_cast_fp16")]; tensor var_6293_to_fp16 = const()[name = tensor("op_6293_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_6294_cast_fp16 = add(x = var_6292_cast_fp16, y = var_6293_to_fp16)[name = tensor("op_6294_cast_fp16")]; tensor var_6295_epsilon_0 = const()[name = tensor("op_6295_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_6295_cast_fp16 = rsqrt(epsilon = var_6295_epsilon_0, x = var_6294_cast_fp16)[name = tensor("op_6295_cast_fp16")]; tensor output_681_cast_fp16 = mul(x = x_679, y = var_6295_cast_fp16)[name = tensor("output_681_cast_fp16")]; tensor var_6299_to_fp16 = const()[name = tensor("op_6299_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940808896)))]; tensor output_683_cast_fp16 = mul(x = output_681_cast_fp16, y = var_6299_to_fp16)[name = tensor("output_683_cast_fp16")]; tensor var_6304 = mul(x = output_679_cast_fp16, y = cos_7_palettized)[name = tensor("op_6304")]; tensor x1_113_begin_0 = const()[name = tensor("x1_113_begin_0"), val = tensor([0, 0, 0, 0])]; tensor x1_113_end_0 = const()[name = tensor("x1_113_end_0"), val = tensor([1, 8, 256, 128])]; tensor x1_113_end_mask_0 = const()[name = tensor("x1_113_end_mask_0"), val = tensor([true, true, true, false])]; tensor x1_113 = slice_by_index(begin = x1_113_begin_0, end = x1_113_end_0, end_mask = x1_113_end_mask_0, x = output_679_cast_fp16)[name = tensor("x1_113")]; tensor x2_113_begin_0 = const()[name = tensor("x2_113_begin_0"), val = tensor([0, 0, 0, 128])]; tensor x2_113_end_0 = const()[name = tensor("x2_113_end_0"), val = tensor([1, 8, 256, 256])]; tensor x2_113_end_mask_0 = const()[name = tensor("x2_113_end_mask_0"), val = tensor([true, true, true, true])]; tensor x2_113 = slice_by_index(begin = x2_113_begin_0, end = x2_113_end_0, end_mask = x2_113_end_mask_0, x = output_679_cast_fp16)[name = tensor("x2_113")]; tensor const_679_promoted = const()[name = tensor("const_679_promoted"), val = tensor(-0x1p+0)]; tensor var_6315 = mul(x = x2_113, y = const_679_promoted)[name = tensor("op_6315")]; tensor var_6317_interleave_0 = const()[name = tensor("op_6317_interleave_0"), val = tensor(false)]; tensor var_6317 = concat(axis = var_24, interleave = var_6317_interleave_0, values = (var_6315, x1_113))[name = tensor("op_6317")]; tensor var_6318 = mul(x = var_6317, y = sin_7_palettized)[name = tensor("op_6318")]; tensor query_57 = add(x = var_6304, y = var_6318)[name = tensor("query_57")]; tensor var_6320 = mul(x = output_683_cast_fp16, y = cos_7_palettized)[name = tensor("op_6320")]; tensor x1_115_begin_0 = const()[name = tensor("x1_115_begin_0"), val = tensor([0, 0, 0, 0])]; tensor x1_115_end_0 = const()[name = tensor("x1_115_end_0"), val = tensor([1, 4, 256, 128])]; tensor x1_115_end_mask_0 = const()[name = tensor("x1_115_end_mask_0"), val = tensor([true, true, true, false])]; tensor x1_115 = slice_by_index(begin = x1_115_begin_0, end = x1_115_end_0, end_mask = x1_115_end_mask_0, x = output_683_cast_fp16)[name = tensor("x1_115")]; tensor x2_115_begin_0 = const()[name = tensor("x2_115_begin_0"), val = tensor([0, 0, 0, 128])]; tensor x2_115_end_0 = const()[name = tensor("x2_115_end_0"), val = tensor([1, 4, 256, 256])]; tensor x2_115_end_mask_0 = const()[name = tensor("x2_115_end_mask_0"), val = tensor([true, true, true, true])]; tensor x2_115 = slice_by_index(begin = x2_115_begin_0, end = x2_115_end_0, end_mask = x2_115_end_mask_0, x = output_683_cast_fp16)[name = tensor("x2_115")]; tensor const_682_promoted = const()[name = tensor("const_682_promoted"), val = tensor(-0x1p+0)]; tensor var_6331 = mul(x = x2_115, y = const_682_promoted)[name = tensor("op_6331")]; tensor var_6333_interleave_0 = const()[name = tensor("op_6333_interleave_0"), val = tensor(false)]; tensor var_6333 = concat(axis = var_24, interleave = var_6333_interleave_0, values = (var_6331, x1_115))[name = tensor("op_6333")]; tensor var_6334 = mul(x = var_6333, y = sin_7_palettized)[name = tensor("op_6334")]; tensor hidden_states_395 = add(x = var_6320, y = var_6334)[name = tensor("hidden_states_395")]; tensor var_6343_axes_0 = const()[name = tensor("op_6343_axes_0"), val = tensor([2])]; tensor var_6343 = expand_dims(axes = var_6343_axes_0, x = hidden_states_395)[name = tensor("op_6343")]; tensor hidden_states_397_reps_0 = const()[name = tensor("hidden_states_397_reps_0"), val = tensor([1, 1, 2, 1, 1])]; tensor hidden_states_397 = tile(reps = hidden_states_397_reps_0, x = var_6343)[name = tensor("hidden_states_397")]; tensor var_6351 = const()[name = tensor("op_6351"), val = tensor([1, 8, 256, 256])]; tensor key_states_57 = reshape(shape = var_6351, x = hidden_states_397)[name = tensor("key_states_57")]; tensor var_6360_axes_0 = const()[name = tensor("op_6360_axes_0"), val = tensor([2])]; tensor hidden_states_399 = transpose(perm = hidden_states_399_perm_0, x = var_6272)[name = tensor("transpose_21")]; tensor var_6360 = expand_dims(axes = var_6360_axes_0, x = hidden_states_399)[name = tensor("op_6360")]; tensor hidden_states_401_reps_0 = const()[name = tensor("hidden_states_401_reps_0"), val = tensor([1, 1, 2, 1, 1])]; tensor hidden_states_401 = tile(reps = hidden_states_401_reps_0, x = var_6360)[name = tensor("hidden_states_401")]; tensor var_6368 = const()[name = tensor("op_6368"), val = tensor([1, 8, 256, 256])]; tensor value_states_57 = reshape(shape = var_6368, x = hidden_states_401)[name = tensor("value_states_57")]; tensor var_6371_transpose_x_1 = const()[name = tensor("op_6371_transpose_x_1"), val = tensor(false)]; tensor var_6371_transpose_y_1 = const()[name = tensor("op_6371_transpose_y_1"), val = tensor(true)]; tensor var_6371 = matmul(transpose_x = var_6371_transpose_x_1, transpose_y = var_6371_transpose_y_1, x = query_57, y = key_states_57)[name = tensor("op_6371")]; tensor var_6372_to_fp16 = const()[name = tensor("op_6372_to_fp16"), val = tensor(0x1p-4)]; tensor attn_weights_113_cast_fp16 = mul(x = var_6371, y = var_6372_to_fp16)[name = tensor("attn_weights_113_cast_fp16")]; tensor input_337_cast_fp16 = add(x = attn_weights_113_cast_fp16, y = attention_mask_to_fp16_palettized)[name = tensor("input_337_cast_fp16")]; tensor var_6380_cast_fp16 = softmax(axis = var_24, x = input_337_cast_fp16)[name = tensor("op_6380_cast_fp16")]; tensor attn_output_113_transpose_x_0 = const()[name = tensor("attn_output_113_transpose_x_0"), val = tensor(false)]; tensor attn_output_113_transpose_y_0 = const()[name = tensor("attn_output_113_transpose_y_0"), val = tensor(false)]; tensor attn_output_113 = matmul(transpose_x = attn_output_113_transpose_x_0, transpose_y = attn_output_113_transpose_y_0, x = var_6380_cast_fp16, y = value_states_57)[name = tensor("attn_output_113")]; tensor var_6384_perm_0 = const()[name = tensor("op_6384_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_6386 = const()[name = tensor("op_6386"), val = tensor([1, 256, -1])]; tensor var_6384 = transpose(perm = var_6384_perm_0, x = attn_output_113)[name = tensor("transpose_20")]; tensor var_6387 = reshape(shape = var_6386, x = var_6384)[name = tensor("op_6387")]; tensor x_683 = linear(bias = linear_3_bias_0, weight = wrapped_model_language_model_layers_28_self_attn_o_proj_weight_palettized, x = var_6387)[name = tensor("linear_199")]; tensor var_22_promoted_171_to_fp16 = const()[name = tensor("op_22_promoted_171_to_fp16"), val = tensor(0x1p+1)]; tensor var_6393_cast_fp16 = pow(x = x_683, y = var_22_promoted_171_to_fp16)[name = tensor("op_6393_cast_fp16")]; tensor var_6395_axes_0 = const()[name = tensor("op_6395_axes_0"), val = tensor([-1])]; tensor var_6395_keep_dims_0 = const()[name = tensor("op_6395_keep_dims_0"), val = tensor(true)]; tensor var_6395_cast_fp16 = reduce_mean(axes = var_6395_axes_0, keep_dims = var_6395_keep_dims_0, x = var_6393_cast_fp16)[name = tensor("op_6395_cast_fp16")]; tensor var_6396_to_fp16 = const()[name = tensor("op_6396_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_6397_cast_fp16 = add(x = var_6395_cast_fp16, y = var_6396_to_fp16)[name = tensor("op_6397_cast_fp16")]; tensor var_6398_epsilon_0 = const()[name = tensor("op_6398_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_6398_cast_fp16 = rsqrt(epsilon = var_6398_epsilon_0, x = var_6397_cast_fp16)[name = tensor("op_6398_cast_fp16")]; tensor output_685_cast_fp16 = mul(x = x_683, y = var_6398_cast_fp16)[name = tensor("output_685_cast_fp16")]; tensor var_6402_to_fp16 = const()[name = tensor("op_6402_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940809472)))]; tensor output_687_cast_fp16 = mul(x = output_685_cast_fp16, y = var_6402_to_fp16)[name = tensor("output_687_cast_fp16")]; tensor x_687 = add(x = x_671, y = output_687_cast_fp16)[name = tensor("x_687")]; tensor var_22_promoted_172_to_fp16 = const()[name = tensor("op_22_promoted_172_to_fp16"), val = tensor(0x1p+1)]; tensor var_6408_cast_fp16 = pow(x = x_687, y = var_22_promoted_172_to_fp16)[name = tensor("op_6408_cast_fp16")]; tensor var_6410_axes_0 = const()[name = tensor("op_6410_axes_0"), val = tensor([-1])]; tensor var_6410_keep_dims_0 = const()[name = tensor("op_6410_keep_dims_0"), val = tensor(true)]; tensor var_6410_cast_fp16 = reduce_mean(axes = var_6410_axes_0, keep_dims = var_6410_keep_dims_0, x = var_6408_cast_fp16)[name = tensor("op_6410_cast_fp16")]; tensor var_6411_to_fp16 = const()[name = tensor("op_6411_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_6412_cast_fp16 = add(x = var_6410_cast_fp16, y = var_6411_to_fp16)[name = tensor("op_6412_cast_fp16")]; tensor var_6413_epsilon_0 = const()[name = tensor("op_6413_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_6413_cast_fp16 = rsqrt(epsilon = var_6413_epsilon_0, x = var_6412_cast_fp16)[name = tensor("op_6413_cast_fp16")]; tensor output_689_cast_fp16 = mul(x = x_687, y = var_6413_cast_fp16)[name = tensor("output_689_cast_fp16")]; tensor var_6417_to_fp16 = const()[name = tensor("op_6417_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940814656)))]; tensor output_691_cast_fp16 = mul(x = output_689_cast_fp16, y = var_6417_to_fp16)[name = tensor("output_691_cast_fp16")]; tensor input_345 = linear(bias = linear_4_bias_0, weight = wrapped_model_language_model_layers_28_mlp_gate_proj_weight_palettized, x = output_691_cast_fp16)[name = tensor("linear_200")]; tensor var_6425_mode_0 = const()[name = tensor("op_6425_mode_0"), val = tensor("TANH_APPROXIMATION")]; tensor var_6425 = gelu(mode = var_6425_mode_0, x = input_345)[name = tensor("op_6425")]; tensor var_6427 = linear(bias = linear_4_bias_0, weight = wrapped_model_language_model_layers_28_mlp_up_proj_weight_palettized, x = output_691_cast_fp16)[name = tensor("linear_201")]; tensor input_347 = mul(x = var_6425, y = var_6427)[name = tensor("input_347")]; tensor x_691 = linear(bias = linear_3_bias_0, weight = wrapped_model_language_model_layers_28_mlp_down_proj_weight_palettized, x = input_347)[name = tensor("linear_202")]; tensor var_22_promoted_173_to_fp16 = const()[name = tensor("op_22_promoted_173_to_fp16"), val = tensor(0x1p+1)]; tensor var_6433_cast_fp16 = pow(x = x_691, y = var_22_promoted_173_to_fp16)[name = tensor("op_6433_cast_fp16")]; tensor var_6435_axes_0 = const()[name = tensor("op_6435_axes_0"), val = tensor([-1])]; tensor var_6435_keep_dims_0 = const()[name = tensor("op_6435_keep_dims_0"), val = tensor(true)]; tensor var_6435_cast_fp16 = reduce_mean(axes = var_6435_axes_0, keep_dims = var_6435_keep_dims_0, x = var_6433_cast_fp16)[name = tensor("op_6435_cast_fp16")]; tensor var_6436_to_fp16 = const()[name = tensor("op_6436_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_6437_cast_fp16 = add(x = var_6435_cast_fp16, y = var_6436_to_fp16)[name = tensor("op_6437_cast_fp16")]; tensor var_6438_epsilon_0 = const()[name = tensor("op_6438_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_6438_cast_fp16 = rsqrt(epsilon = var_6438_epsilon_0, x = var_6437_cast_fp16)[name = tensor("op_6438_cast_fp16")]; tensor output_693_cast_fp16 = mul(x = x_691, y = var_6438_cast_fp16)[name = tensor("output_693_cast_fp16")]; tensor var_6442_to_fp16 = const()[name = tensor("op_6442_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940819840)))]; tensor output_695_cast_fp16 = mul(x = output_693_cast_fp16, y = var_6442_to_fp16)[name = tensor("output_695_cast_fp16")]; tensor x_695 = add(x = x_687, y = output_695_cast_fp16)[name = tensor("x_695")]; tensor var_22_promoted_174_to_fp16 = const()[name = tensor("op_22_promoted_174_to_fp16"), val = tensor(0x1p+1)]; tensor var_6454_cast_fp16 = pow(x = x_695, y = var_22_promoted_174_to_fp16)[name = tensor("op_6454_cast_fp16")]; tensor var_6456_axes_0 = const()[name = tensor("op_6456_axes_0"), val = tensor([-1])]; tensor var_6456_keep_dims_0 = const()[name = tensor("op_6456_keep_dims_0"), val = tensor(true)]; tensor var_6456_cast_fp16 = reduce_mean(axes = var_6456_axes_0, keep_dims = var_6456_keep_dims_0, x = var_6454_cast_fp16)[name = tensor("op_6456_cast_fp16")]; tensor var_6457_to_fp16 = const()[name = tensor("op_6457_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_6458_cast_fp16 = add(x = var_6456_cast_fp16, y = var_6457_to_fp16)[name = tensor("op_6458_cast_fp16")]; tensor var_6459_epsilon_0 = const()[name = tensor("op_6459_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_6459_cast_fp16 = rsqrt(epsilon = var_6459_epsilon_0, x = var_6458_cast_fp16)[name = tensor("op_6459_cast_fp16")]; tensor output_697_cast_fp16 = mul(x = x_695, y = var_6459_cast_fp16)[name = tensor("output_697_cast_fp16")]; tensor var_6463_to_fp16 = const()[name = tensor("op_6463_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940825024)))]; tensor output_699_cast_fp16 = mul(x = output_697_cast_fp16, y = var_6463_to_fp16)[name = tensor("output_699_cast_fp16")]; tensor var_6475 = linear(bias = linear_0_bias_0, weight = wrapped_model_language_model_layers_29_self_attn_q_proj_weight_palettized, x = output_699_cast_fp16)[name = tensor("linear_203")]; tensor var_6476 = const()[name = tensor("op_6476"), val = tensor([1, 256, -1, 256])]; tensor var_6477 = reshape(shape = var_6476, x = var_6475)[name = tensor("op_6477")]; tensor x_699_perm_0 = const()[name = tensor("x_699_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_6480 = linear(bias = linear_1_bias_0, weight = wrapped_model_language_model_layers_29_self_attn_k_proj_weight_palettized, x = output_699_cast_fp16)[name = tensor("linear_204")]; tensor var_6481 = const()[name = tensor("op_6481"), val = tensor([1, 256, -1, 256])]; tensor var_6482 = reshape(shape = var_6481, x = var_6480)[name = tensor("op_6482")]; tensor x_703_perm_0 = const()[name = tensor("x_703_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_6485 = linear(bias = linear_1_bias_0, weight = wrapped_model_language_model_layers_29_self_attn_v_proj_weight_palettized, x = output_699_cast_fp16)[name = tensor("linear_205")]; tensor var_6486 = const()[name = tensor("op_6486"), val = tensor([1, 256, -1, 256])]; tensor var_6487 = reshape(shape = var_6486, x = var_6485)[name = tensor("op_6487")]; tensor hidden_states_413_perm_0 = const()[name = tensor("hidden_states_413_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_22_promoted_175_to_fp16 = const()[name = tensor("op_22_promoted_175_to_fp16"), val = tensor(0x1p+1)]; tensor x_699 = transpose(perm = x_699_perm_0, x = var_6477)[name = tensor("transpose_19")]; tensor var_6491_cast_fp16 = pow(x = x_699, y = var_22_promoted_175_to_fp16)[name = tensor("op_6491_cast_fp16")]; tensor var_6493_axes_0 = const()[name = tensor("op_6493_axes_0"), val = tensor([-1])]; tensor var_6493_keep_dims_0 = const()[name = tensor("op_6493_keep_dims_0"), val = tensor(true)]; tensor var_6493_cast_fp16 = reduce_mean(axes = var_6493_axes_0, keep_dims = var_6493_keep_dims_0, x = var_6491_cast_fp16)[name = tensor("op_6493_cast_fp16")]; tensor var_6494_to_fp16 = const()[name = tensor("op_6494_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_6495_cast_fp16 = add(x = var_6493_cast_fp16, y = var_6494_to_fp16)[name = tensor("op_6495_cast_fp16")]; tensor var_6496_epsilon_0 = const()[name = tensor("op_6496_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_6496_cast_fp16 = rsqrt(epsilon = var_6496_epsilon_0, x = var_6495_cast_fp16)[name = tensor("op_6496_cast_fp16")]; tensor output_701_cast_fp16 = mul(x = x_699, y = var_6496_cast_fp16)[name = tensor("output_701_cast_fp16")]; tensor var_6500_to_fp16 = const()[name = tensor("op_6500_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940830208)))]; tensor output_703_cast_fp16 = mul(x = output_701_cast_fp16, y = var_6500_to_fp16)[name = tensor("output_703_cast_fp16")]; tensor var_22_promoted_176_to_fp16 = const()[name = tensor("op_22_promoted_176_to_fp16"), val = tensor(0x1p+1)]; tensor x_703 = transpose(perm = x_703_perm_0, x = var_6482)[name = tensor("transpose_18")]; tensor var_6505_cast_fp16 = pow(x = x_703, y = var_22_promoted_176_to_fp16)[name = tensor("op_6505_cast_fp16")]; tensor var_6507_axes_0 = const()[name = tensor("op_6507_axes_0"), val = tensor([-1])]; tensor var_6507_keep_dims_0 = const()[name = tensor("op_6507_keep_dims_0"), val = tensor(true)]; tensor var_6507_cast_fp16 = reduce_mean(axes = var_6507_axes_0, keep_dims = var_6507_keep_dims_0, x = var_6505_cast_fp16)[name = tensor("op_6507_cast_fp16")]; tensor var_6508_to_fp16 = const()[name = tensor("op_6508_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_6509_cast_fp16 = add(x = var_6507_cast_fp16, y = var_6508_to_fp16)[name = tensor("op_6509_cast_fp16")]; tensor var_6510_epsilon_0 = const()[name = tensor("op_6510_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_6510_cast_fp16 = rsqrt(epsilon = var_6510_epsilon_0, x = var_6509_cast_fp16)[name = tensor("op_6510_cast_fp16")]; tensor output_705_cast_fp16 = mul(x = x_703, y = var_6510_cast_fp16)[name = tensor("output_705_cast_fp16")]; tensor var_6514_to_fp16 = const()[name = tensor("op_6514_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940830784)))]; tensor output_707_cast_fp16 = mul(x = output_705_cast_fp16, y = var_6514_to_fp16)[name = tensor("output_707_cast_fp16")]; tensor var_6519 = mul(x = output_703_cast_fp16, y = cos_19_palettized)[name = tensor("op_6519")]; tensor x1_117_begin_0 = const()[name = tensor("x1_117_begin_0"), val = tensor([0, 0, 0, 0])]; tensor x1_117_end_0 = const()[name = tensor("x1_117_end_0"), val = tensor([1, 8, 256, 128])]; tensor x1_117_end_mask_0 = const()[name = tensor("x1_117_end_mask_0"), val = tensor([true, true, true, false])]; tensor x1_117 = slice_by_index(begin = x1_117_begin_0, end = x1_117_end_0, end_mask = x1_117_end_mask_0, x = output_703_cast_fp16)[name = tensor("x1_117")]; tensor x2_117_begin_0 = const()[name = tensor("x2_117_begin_0"), val = tensor([0, 0, 0, 128])]; tensor x2_117_end_0 = const()[name = tensor("x2_117_end_0"), val = tensor([1, 8, 256, 256])]; tensor x2_117_end_mask_0 = const()[name = tensor("x2_117_end_mask_0"), val = tensor([true, true, true, true])]; tensor x2_117 = slice_by_index(begin = x2_117_begin_0, end = x2_117_end_0, end_mask = x2_117_end_mask_0, x = output_703_cast_fp16)[name = tensor("x2_117")]; tensor const_702_promoted = const()[name = tensor("const_702_promoted"), val = tensor(-0x1p+0)]; tensor var_6530 = mul(x = x2_117, y = const_702_promoted)[name = tensor("op_6530")]; tensor var_6532_interleave_0 = const()[name = tensor("op_6532_interleave_0"), val = tensor(false)]; tensor var_6532 = concat(axis = var_24, interleave = var_6532_interleave_0, values = (var_6530, x1_117))[name = tensor("op_6532")]; tensor var_6533 = mul(x = var_6532, y = sin_19_palettized)[name = tensor("op_6533")]; tensor query_59 = add(x = var_6519, y = var_6533)[name = tensor("query_59")]; tensor var_6535 = mul(x = output_707_cast_fp16, y = cos_19_palettized)[name = tensor("op_6535")]; tensor x1_119_begin_0 = const()[name = tensor("x1_119_begin_0"), val = tensor([0, 0, 0, 0])]; tensor x1_119_end_0 = const()[name = tensor("x1_119_end_0"), val = tensor([1, 4, 256, 128])]; tensor x1_119_end_mask_0 = const()[name = tensor("x1_119_end_mask_0"), val = tensor([true, true, true, false])]; tensor x1_119 = slice_by_index(begin = x1_119_begin_0, end = x1_119_end_0, end_mask = x1_119_end_mask_0, x = output_707_cast_fp16)[name = tensor("x1_119")]; tensor x2_119_begin_0 = const()[name = tensor("x2_119_begin_0"), val = tensor([0, 0, 0, 128])]; tensor x2_119_end_0 = const()[name = tensor("x2_119_end_0"), val = tensor([1, 4, 256, 256])]; tensor x2_119_end_mask_0 = const()[name = tensor("x2_119_end_mask_0"), val = tensor([true, true, true, true])]; tensor x2_119 = slice_by_index(begin = x2_119_begin_0, end = x2_119_end_0, end_mask = x2_119_end_mask_0, x = output_707_cast_fp16)[name = tensor("x2_119")]; tensor const_705_promoted = const()[name = tensor("const_705_promoted"), val = tensor(-0x1p+0)]; tensor var_6546 = mul(x = x2_119, y = const_705_promoted)[name = tensor("op_6546")]; tensor var_6548_interleave_0 = const()[name = tensor("op_6548_interleave_0"), val = tensor(false)]; tensor var_6548 = concat(axis = var_24, interleave = var_6548_interleave_0, values = (var_6546, x1_119))[name = tensor("op_6548")]; tensor var_6549 = mul(x = var_6548, y = sin_19_palettized)[name = tensor("op_6549")]; tensor hidden_states_409 = add(x = var_6535, y = var_6549)[name = tensor("hidden_states_409")]; tensor var_6558_axes_0 = const()[name = tensor("op_6558_axes_0"), val = tensor([2])]; tensor var_6558 = expand_dims(axes = var_6558_axes_0, x = hidden_states_409)[name = tensor("op_6558")]; tensor hidden_states_411_reps_0 = const()[name = tensor("hidden_states_411_reps_0"), val = tensor([1, 1, 2, 1, 1])]; tensor hidden_states_411 = tile(reps = hidden_states_411_reps_0, x = var_6558)[name = tensor("hidden_states_411")]; tensor var_6566 = const()[name = tensor("op_6566"), val = tensor([1, 8, 256, 256])]; tensor key_states_59 = reshape(shape = var_6566, x = hidden_states_411)[name = tensor("key_states_59")]; tensor var_6575_axes_0 = const()[name = tensor("op_6575_axes_0"), val = tensor([2])]; tensor hidden_states_413 = transpose(perm = hidden_states_413_perm_0, x = var_6487)[name = tensor("transpose_17")]; tensor var_6575 = expand_dims(axes = var_6575_axes_0, x = hidden_states_413)[name = tensor("op_6575")]; tensor hidden_states_415_reps_0 = const()[name = tensor("hidden_states_415_reps_0"), val = tensor([1, 1, 2, 1, 1])]; tensor hidden_states_415 = tile(reps = hidden_states_415_reps_0, x = var_6575)[name = tensor("hidden_states_415")]; tensor var_6583 = const()[name = tensor("op_6583"), val = tensor([1, 8, 256, 256])]; tensor value_states_59 = reshape(shape = var_6583, x = hidden_states_415)[name = tensor("value_states_59")]; tensor var_6586_transpose_x_1 = const()[name = tensor("op_6586_transpose_x_1"), val = tensor(false)]; tensor var_6586_transpose_y_1 = const()[name = tensor("op_6586_transpose_y_1"), val = tensor(true)]; tensor var_6586 = matmul(transpose_x = var_6586_transpose_x_1, transpose_y = var_6586_transpose_y_1, x = query_59, y = key_states_59)[name = tensor("op_6586")]; tensor var_6587_to_fp16 = const()[name = tensor("op_6587_to_fp16"), val = tensor(0x1p-4)]; tensor attn_weights_117_cast_fp16 = mul(x = var_6586, y = var_6587_to_fp16)[name = tensor("attn_weights_117_cast_fp16")]; tensor input_349_cast_fp16 = add(x = attn_weights_117_cast_fp16, y = attention_mask_to_fp16_palettized)[name = tensor("input_349_cast_fp16")]; tensor var_6595_cast_fp16 = softmax(axis = var_24, x = input_349_cast_fp16)[name = tensor("op_6595_cast_fp16")]; tensor attn_output_117_transpose_x_0 = const()[name = tensor("attn_output_117_transpose_x_0"), val = tensor(false)]; tensor attn_output_117_transpose_y_0 = const()[name = tensor("attn_output_117_transpose_y_0"), val = tensor(false)]; tensor attn_output_117 = matmul(transpose_x = attn_output_117_transpose_x_0, transpose_y = attn_output_117_transpose_y_0, x = var_6595_cast_fp16, y = value_states_59)[name = tensor("attn_output_117")]; tensor var_6599_perm_0 = const()[name = tensor("op_6599_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_6601 = const()[name = tensor("op_6601"), val = tensor([1, 256, -1])]; tensor var_6599 = transpose(perm = var_6599_perm_0, x = attn_output_117)[name = tensor("transpose_16")]; tensor var_6602 = reshape(shape = var_6601, x = var_6599)[name = tensor("op_6602")]; tensor x_707 = linear(bias = linear_3_bias_0, weight = wrapped_model_language_model_layers_29_self_attn_o_proj_weight_palettized, x = var_6602)[name = tensor("linear_206")]; tensor var_22_promoted_177_to_fp16 = const()[name = tensor("op_22_promoted_177_to_fp16"), val = tensor(0x1p+1)]; tensor var_6608_cast_fp16 = pow(x = x_707, y = var_22_promoted_177_to_fp16)[name = tensor("op_6608_cast_fp16")]; tensor var_6610_axes_0 = const()[name = tensor("op_6610_axes_0"), val = tensor([-1])]; tensor var_6610_keep_dims_0 = const()[name = tensor("op_6610_keep_dims_0"), val = tensor(true)]; tensor var_6610_cast_fp16 = reduce_mean(axes = var_6610_axes_0, keep_dims = var_6610_keep_dims_0, x = var_6608_cast_fp16)[name = tensor("op_6610_cast_fp16")]; tensor var_6611_to_fp16 = const()[name = tensor("op_6611_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_6612_cast_fp16 = add(x = var_6610_cast_fp16, y = var_6611_to_fp16)[name = tensor("op_6612_cast_fp16")]; tensor var_6613_epsilon_0 = const()[name = tensor("op_6613_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_6613_cast_fp16 = rsqrt(epsilon = var_6613_epsilon_0, x = var_6612_cast_fp16)[name = tensor("op_6613_cast_fp16")]; tensor output_709_cast_fp16 = mul(x = x_707, y = var_6613_cast_fp16)[name = tensor("output_709_cast_fp16")]; tensor var_6617_to_fp16 = const()[name = tensor("op_6617_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940831360)))]; tensor output_711_cast_fp16 = mul(x = output_709_cast_fp16, y = var_6617_to_fp16)[name = tensor("output_711_cast_fp16")]; tensor x_711 = add(x = x_695, y = output_711_cast_fp16)[name = tensor("x_711")]; tensor var_22_promoted_178_to_fp16 = const()[name = tensor("op_22_promoted_178_to_fp16"), val = tensor(0x1p+1)]; tensor var_6623_cast_fp16 = pow(x = x_711, y = var_22_promoted_178_to_fp16)[name = tensor("op_6623_cast_fp16")]; tensor var_6625_axes_0 = const()[name = tensor("op_6625_axes_0"), val = tensor([-1])]; tensor var_6625_keep_dims_0 = const()[name = tensor("op_6625_keep_dims_0"), val = tensor(true)]; tensor var_6625_cast_fp16 = reduce_mean(axes = var_6625_axes_0, keep_dims = var_6625_keep_dims_0, x = var_6623_cast_fp16)[name = tensor("op_6625_cast_fp16")]; tensor var_6626_to_fp16 = const()[name = tensor("op_6626_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_6627_cast_fp16 = add(x = var_6625_cast_fp16, y = var_6626_to_fp16)[name = tensor("op_6627_cast_fp16")]; tensor var_6628_epsilon_0 = const()[name = tensor("op_6628_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_6628_cast_fp16 = rsqrt(epsilon = var_6628_epsilon_0, x = var_6627_cast_fp16)[name = tensor("op_6628_cast_fp16")]; tensor output_713_cast_fp16 = mul(x = x_711, y = var_6628_cast_fp16)[name = tensor("output_713_cast_fp16")]; tensor var_6632_to_fp16 = const()[name = tensor("op_6632_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940836544)))]; tensor output_715_cast_fp16 = mul(x = output_713_cast_fp16, y = var_6632_to_fp16)[name = tensor("output_715_cast_fp16")]; tensor input_357 = linear(bias = linear_4_bias_0, weight = wrapped_model_language_model_layers_29_mlp_gate_proj_weight_palettized, x = output_715_cast_fp16)[name = tensor("linear_207")]; tensor var_6640_mode_0 = const()[name = tensor("op_6640_mode_0"), val = tensor("TANH_APPROXIMATION")]; tensor var_6640 = gelu(mode = var_6640_mode_0, x = input_357)[name = tensor("op_6640")]; tensor var_6642 = linear(bias = linear_4_bias_0, weight = wrapped_model_language_model_layers_29_mlp_up_proj_weight_palettized, x = output_715_cast_fp16)[name = tensor("linear_208")]; tensor input_359 = mul(x = var_6640, y = var_6642)[name = tensor("input_359")]; tensor x_715 = linear(bias = linear_3_bias_0, weight = wrapped_model_language_model_layers_29_mlp_down_proj_weight_palettized, x = input_359)[name = tensor("linear_209")]; tensor var_22_promoted_179_to_fp16 = const()[name = tensor("op_22_promoted_179_to_fp16"), val = tensor(0x1p+1)]; tensor var_6648_cast_fp16 = pow(x = x_715, y = var_22_promoted_179_to_fp16)[name = tensor("op_6648_cast_fp16")]; tensor var_6650_axes_0 = const()[name = tensor("op_6650_axes_0"), val = tensor([-1])]; tensor var_6650_keep_dims_0 = const()[name = tensor("op_6650_keep_dims_0"), val = tensor(true)]; tensor var_6650_cast_fp16 = reduce_mean(axes = var_6650_axes_0, keep_dims = var_6650_keep_dims_0, x = var_6648_cast_fp16)[name = tensor("op_6650_cast_fp16")]; tensor var_6651_to_fp16 = const()[name = tensor("op_6651_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_6652_cast_fp16 = add(x = var_6650_cast_fp16, y = var_6651_to_fp16)[name = tensor("op_6652_cast_fp16")]; tensor var_6653_epsilon_0 = const()[name = tensor("op_6653_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_6653_cast_fp16 = rsqrt(epsilon = var_6653_epsilon_0, x = var_6652_cast_fp16)[name = tensor("op_6653_cast_fp16")]; tensor output_717_cast_fp16 = mul(x = x_715, y = var_6653_cast_fp16)[name = tensor("output_717_cast_fp16")]; tensor var_6657_to_fp16 = const()[name = tensor("op_6657_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940841728)))]; tensor output_719_cast_fp16 = mul(x = output_717_cast_fp16, y = var_6657_to_fp16)[name = tensor("output_719_cast_fp16")]; tensor x_719 = add(x = x_711, y = output_719_cast_fp16)[name = tensor("x_719")]; tensor var_22_promoted_180_to_fp16 = const()[name = tensor("op_22_promoted_180_to_fp16"), val = tensor(0x1p+1)]; tensor var_6669_cast_fp16 = pow(x = x_719, y = var_22_promoted_180_to_fp16)[name = tensor("op_6669_cast_fp16")]; tensor var_6671_axes_0 = const()[name = tensor("op_6671_axes_0"), val = tensor([-1])]; tensor var_6671_keep_dims_0 = const()[name = tensor("op_6671_keep_dims_0"), val = tensor(true)]; tensor var_6671_cast_fp16 = reduce_mean(axes = var_6671_axes_0, keep_dims = var_6671_keep_dims_0, x = var_6669_cast_fp16)[name = tensor("op_6671_cast_fp16")]; tensor var_6672_to_fp16 = const()[name = tensor("op_6672_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_6673_cast_fp16 = add(x = var_6671_cast_fp16, y = var_6672_to_fp16)[name = tensor("op_6673_cast_fp16")]; tensor var_6674_epsilon_0 = const()[name = tensor("op_6674_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_6674_cast_fp16 = rsqrt(epsilon = var_6674_epsilon_0, x = var_6673_cast_fp16)[name = tensor("op_6674_cast_fp16")]; tensor output_721_cast_fp16 = mul(x = x_719, y = var_6674_cast_fp16)[name = tensor("output_721_cast_fp16")]; tensor var_6678_to_fp16 = const()[name = tensor("op_6678_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940846912)))]; tensor output_723_cast_fp16 = mul(x = output_721_cast_fp16, y = var_6678_to_fp16)[name = tensor("output_723_cast_fp16")]; tensor var_6690 = linear(bias = linear_0_bias_0, weight = wrapped_model_language_model_layers_30_self_attn_q_proj_weight_palettized, x = output_723_cast_fp16)[name = tensor("linear_210")]; tensor var_6691 = const()[name = tensor("op_6691"), val = tensor([1, 256, -1, 256])]; tensor var_6692 = reshape(shape = var_6691, x = var_6690)[name = tensor("op_6692")]; tensor x_723_perm_0 = const()[name = tensor("x_723_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_6695 = linear(bias = linear_1_bias_0, weight = wrapped_model_language_model_layers_30_self_attn_k_proj_weight_palettized, x = output_723_cast_fp16)[name = tensor("linear_211")]; tensor var_6696 = const()[name = tensor("op_6696"), val = tensor([1, 256, -1, 256])]; tensor var_6697 = reshape(shape = var_6696, x = var_6695)[name = tensor("op_6697")]; tensor x_727_perm_0 = const()[name = tensor("x_727_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_6700 = linear(bias = linear_1_bias_0, weight = wrapped_model_language_model_layers_30_self_attn_v_proj_weight_palettized, x = output_723_cast_fp16)[name = tensor("linear_212")]; tensor var_6701 = const()[name = tensor("op_6701"), val = tensor([1, 256, -1, 256])]; tensor var_6702 = reshape(shape = var_6701, x = var_6700)[name = tensor("op_6702")]; tensor hidden_states_427_perm_0 = const()[name = tensor("hidden_states_427_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_22_promoted_181_to_fp16 = const()[name = tensor("op_22_promoted_181_to_fp16"), val = tensor(0x1p+1)]; tensor x_723 = transpose(perm = x_723_perm_0, x = var_6692)[name = tensor("transpose_15")]; tensor var_6706_cast_fp16 = pow(x = x_723, y = var_22_promoted_181_to_fp16)[name = tensor("op_6706_cast_fp16")]; tensor var_6708_axes_0 = const()[name = tensor("op_6708_axes_0"), val = tensor([-1])]; tensor var_6708_keep_dims_0 = const()[name = tensor("op_6708_keep_dims_0"), val = tensor(true)]; tensor var_6708_cast_fp16 = reduce_mean(axes = var_6708_axes_0, keep_dims = var_6708_keep_dims_0, x = var_6706_cast_fp16)[name = tensor("op_6708_cast_fp16")]; tensor var_6709_to_fp16 = const()[name = tensor("op_6709_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_6710_cast_fp16 = add(x = var_6708_cast_fp16, y = var_6709_to_fp16)[name = tensor("op_6710_cast_fp16")]; tensor var_6711_epsilon_0 = const()[name = tensor("op_6711_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_6711_cast_fp16 = rsqrt(epsilon = var_6711_epsilon_0, x = var_6710_cast_fp16)[name = tensor("op_6711_cast_fp16")]; tensor output_725_cast_fp16 = mul(x = x_723, y = var_6711_cast_fp16)[name = tensor("output_725_cast_fp16")]; tensor var_6715_to_fp16 = const()[name = tensor("op_6715_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940852096)))]; tensor output_727_cast_fp16 = mul(x = output_725_cast_fp16, y = var_6715_to_fp16)[name = tensor("output_727_cast_fp16")]; tensor var_22_promoted_182_to_fp16 = const()[name = tensor("op_22_promoted_182_to_fp16"), val = tensor(0x1p+1)]; tensor x_727 = transpose(perm = x_727_perm_0, x = var_6697)[name = tensor("transpose_14")]; tensor var_6720_cast_fp16 = pow(x = x_727, y = var_22_promoted_182_to_fp16)[name = tensor("op_6720_cast_fp16")]; tensor var_6722_axes_0 = const()[name = tensor("op_6722_axes_0"), val = tensor([-1])]; tensor var_6722_keep_dims_0 = const()[name = tensor("op_6722_keep_dims_0"), val = tensor(true)]; tensor var_6722_cast_fp16 = reduce_mean(axes = var_6722_axes_0, keep_dims = var_6722_keep_dims_0, x = var_6720_cast_fp16)[name = tensor("op_6722_cast_fp16")]; tensor var_6723_to_fp16 = const()[name = tensor("op_6723_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_6724_cast_fp16 = add(x = var_6722_cast_fp16, y = var_6723_to_fp16)[name = tensor("op_6724_cast_fp16")]; tensor var_6725_epsilon_0 = const()[name = tensor("op_6725_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_6725_cast_fp16 = rsqrt(epsilon = var_6725_epsilon_0, x = var_6724_cast_fp16)[name = tensor("op_6725_cast_fp16")]; tensor output_729_cast_fp16 = mul(x = x_727, y = var_6725_cast_fp16)[name = tensor("output_729_cast_fp16")]; tensor var_6729_to_fp16 = const()[name = tensor("op_6729_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940852672)))]; tensor output_731_cast_fp16 = mul(x = output_729_cast_fp16, y = var_6729_to_fp16)[name = tensor("output_731_cast_fp16")]; tensor var_6734 = mul(x = output_727_cast_fp16, y = cos_7_palettized)[name = tensor("op_6734")]; tensor x1_121_begin_0 = const()[name = tensor("x1_121_begin_0"), val = tensor([0, 0, 0, 0])]; tensor x1_121_end_0 = const()[name = tensor("x1_121_end_0"), val = tensor([1, 8, 256, 128])]; tensor x1_121_end_mask_0 = const()[name = tensor("x1_121_end_mask_0"), val = tensor([true, true, true, false])]; tensor x1_121 = slice_by_index(begin = x1_121_begin_0, end = x1_121_end_0, end_mask = x1_121_end_mask_0, x = output_727_cast_fp16)[name = tensor("x1_121")]; tensor x2_121_begin_0 = const()[name = tensor("x2_121_begin_0"), val = tensor([0, 0, 0, 128])]; tensor x2_121_end_0 = const()[name = tensor("x2_121_end_0"), val = tensor([1, 8, 256, 256])]; tensor x2_121_end_mask_0 = const()[name = tensor("x2_121_end_mask_0"), val = tensor([true, true, true, true])]; tensor x2_121 = slice_by_index(begin = x2_121_begin_0, end = x2_121_end_0, end_mask = x2_121_end_mask_0, x = output_727_cast_fp16)[name = tensor("x2_121")]; tensor const_725_promoted = const()[name = tensor("const_725_promoted"), val = tensor(-0x1p+0)]; tensor var_6745 = mul(x = x2_121, y = const_725_promoted)[name = tensor("op_6745")]; tensor var_6747_interleave_0 = const()[name = tensor("op_6747_interleave_0"), val = tensor(false)]; tensor var_6747 = concat(axis = var_24, interleave = var_6747_interleave_0, values = (var_6745, x1_121))[name = tensor("op_6747")]; tensor var_6748 = mul(x = var_6747, y = sin_7_palettized)[name = tensor("op_6748")]; tensor query_61 = add(x = var_6734, y = var_6748)[name = tensor("query_61")]; tensor var_6750 = mul(x = output_731_cast_fp16, y = cos_7_palettized)[name = tensor("op_6750")]; tensor x1_123_begin_0 = const()[name = tensor("x1_123_begin_0"), val = tensor([0, 0, 0, 0])]; tensor x1_123_end_0 = const()[name = tensor("x1_123_end_0"), val = tensor([1, 4, 256, 128])]; tensor x1_123_end_mask_0 = const()[name = tensor("x1_123_end_mask_0"), val = tensor([true, true, true, false])]; tensor x1_123 = slice_by_index(begin = x1_123_begin_0, end = x1_123_end_0, end_mask = x1_123_end_mask_0, x = output_731_cast_fp16)[name = tensor("x1_123")]; tensor x2_123_begin_0 = const()[name = tensor("x2_123_begin_0"), val = tensor([0, 0, 0, 128])]; tensor x2_123_end_0 = const()[name = tensor("x2_123_end_0"), val = tensor([1, 4, 256, 256])]; tensor x2_123_end_mask_0 = const()[name = tensor("x2_123_end_mask_0"), val = tensor([true, true, true, true])]; tensor x2_123 = slice_by_index(begin = x2_123_begin_0, end = x2_123_end_0, end_mask = x2_123_end_mask_0, x = output_731_cast_fp16)[name = tensor("x2_123")]; tensor const_728_promoted = const()[name = tensor("const_728_promoted"), val = tensor(-0x1p+0)]; tensor var_6761 = mul(x = x2_123, y = const_728_promoted)[name = tensor("op_6761")]; tensor var_6763_interleave_0 = const()[name = tensor("op_6763_interleave_0"), val = tensor(false)]; tensor var_6763 = concat(axis = var_24, interleave = var_6763_interleave_0, values = (var_6761, x1_123))[name = tensor("op_6763")]; tensor var_6764 = mul(x = var_6763, y = sin_7_palettized)[name = tensor("op_6764")]; tensor hidden_states_423 = add(x = var_6750, y = var_6764)[name = tensor("hidden_states_423")]; tensor var_6773_axes_0 = const()[name = tensor("op_6773_axes_0"), val = tensor([2])]; tensor var_6773 = expand_dims(axes = var_6773_axes_0, x = hidden_states_423)[name = tensor("op_6773")]; tensor hidden_states_425_reps_0 = const()[name = tensor("hidden_states_425_reps_0"), val = tensor([1, 1, 2, 1, 1])]; tensor hidden_states_425 = tile(reps = hidden_states_425_reps_0, x = var_6773)[name = tensor("hidden_states_425")]; tensor var_6781 = const()[name = tensor("op_6781"), val = tensor([1, 8, 256, 256])]; tensor key_states_61 = reshape(shape = var_6781, x = hidden_states_425)[name = tensor("key_states_61")]; tensor var_6790_axes_0 = const()[name = tensor("op_6790_axes_0"), val = tensor([2])]; tensor hidden_states_427 = transpose(perm = hidden_states_427_perm_0, x = var_6702)[name = tensor("transpose_13")]; tensor var_6790 = expand_dims(axes = var_6790_axes_0, x = hidden_states_427)[name = tensor("op_6790")]; tensor hidden_states_429_reps_0 = const()[name = tensor("hidden_states_429_reps_0"), val = tensor([1, 1, 2, 1, 1])]; tensor hidden_states_429 = tile(reps = hidden_states_429_reps_0, x = var_6790)[name = tensor("hidden_states_429")]; tensor var_6798 = const()[name = tensor("op_6798"), val = tensor([1, 8, 256, 256])]; tensor value_states_61 = reshape(shape = var_6798, x = hidden_states_429)[name = tensor("value_states_61")]; tensor var_6801_transpose_x_1 = const()[name = tensor("op_6801_transpose_x_1"), val = tensor(false)]; tensor var_6801_transpose_y_1 = const()[name = tensor("op_6801_transpose_y_1"), val = tensor(true)]; tensor var_6801 = matmul(transpose_x = var_6801_transpose_x_1, transpose_y = var_6801_transpose_y_1, x = query_61, y = key_states_61)[name = tensor("op_6801")]; tensor var_6802_to_fp16 = const()[name = tensor("op_6802_to_fp16"), val = tensor(0x1p-4)]; tensor attn_weights_121_cast_fp16 = mul(x = var_6801, y = var_6802_to_fp16)[name = tensor("attn_weights_121_cast_fp16")]; tensor input_361_cast_fp16 = add(x = attn_weights_121_cast_fp16, y = attention_mask_to_fp16_palettized)[name = tensor("input_361_cast_fp16")]; tensor var_6810_cast_fp16 = softmax(axis = var_24, x = input_361_cast_fp16)[name = tensor("op_6810_cast_fp16")]; tensor attn_output_121_transpose_x_0 = const()[name = tensor("attn_output_121_transpose_x_0"), val = tensor(false)]; tensor attn_output_121_transpose_y_0 = const()[name = tensor("attn_output_121_transpose_y_0"), val = tensor(false)]; tensor attn_output_121 = matmul(transpose_x = attn_output_121_transpose_x_0, transpose_y = attn_output_121_transpose_y_0, x = var_6810_cast_fp16, y = value_states_61)[name = tensor("attn_output_121")]; tensor var_6814_perm_0 = const()[name = tensor("op_6814_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_6816 = const()[name = tensor("op_6816"), val = tensor([1, 256, -1])]; tensor var_6814 = transpose(perm = var_6814_perm_0, x = attn_output_121)[name = tensor("transpose_12")]; tensor var_6817 = reshape(shape = var_6816, x = var_6814)[name = tensor("op_6817")]; tensor x_731 = linear(bias = linear_3_bias_0, weight = wrapped_model_language_model_layers_30_self_attn_o_proj_weight_palettized, x = var_6817)[name = tensor("linear_213")]; tensor var_22_promoted_183_to_fp16 = const()[name = tensor("op_22_promoted_183_to_fp16"), val = tensor(0x1p+1)]; tensor var_6823_cast_fp16 = pow(x = x_731, y = var_22_promoted_183_to_fp16)[name = tensor("op_6823_cast_fp16")]; tensor var_6825_axes_0 = const()[name = tensor("op_6825_axes_0"), val = tensor([-1])]; tensor var_6825_keep_dims_0 = const()[name = tensor("op_6825_keep_dims_0"), val = tensor(true)]; tensor var_6825_cast_fp16 = reduce_mean(axes = var_6825_axes_0, keep_dims = var_6825_keep_dims_0, x = var_6823_cast_fp16)[name = tensor("op_6825_cast_fp16")]; tensor var_6826_to_fp16 = const()[name = tensor("op_6826_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_6827_cast_fp16 = add(x = var_6825_cast_fp16, y = var_6826_to_fp16)[name = tensor("op_6827_cast_fp16")]; tensor var_6828_epsilon_0 = const()[name = tensor("op_6828_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_6828_cast_fp16 = rsqrt(epsilon = var_6828_epsilon_0, x = var_6827_cast_fp16)[name = tensor("op_6828_cast_fp16")]; tensor output_733_cast_fp16 = mul(x = x_731, y = var_6828_cast_fp16)[name = tensor("output_733_cast_fp16")]; tensor var_6832_to_fp16 = const()[name = tensor("op_6832_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940853248)))]; tensor output_735_cast_fp16 = mul(x = output_733_cast_fp16, y = var_6832_to_fp16)[name = tensor("output_735_cast_fp16")]; tensor x_735 = add(x = x_719, y = output_735_cast_fp16)[name = tensor("x_735")]; tensor var_22_promoted_184_to_fp16 = const()[name = tensor("op_22_promoted_184_to_fp16"), val = tensor(0x1p+1)]; tensor var_6838_cast_fp16 = pow(x = x_735, y = var_22_promoted_184_to_fp16)[name = tensor("op_6838_cast_fp16")]; tensor var_6840_axes_0 = const()[name = tensor("op_6840_axes_0"), val = tensor([-1])]; tensor var_6840_keep_dims_0 = const()[name = tensor("op_6840_keep_dims_0"), val = tensor(true)]; tensor var_6840_cast_fp16 = reduce_mean(axes = var_6840_axes_0, keep_dims = var_6840_keep_dims_0, x = var_6838_cast_fp16)[name = tensor("op_6840_cast_fp16")]; tensor var_6841_to_fp16 = const()[name = tensor("op_6841_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_6842_cast_fp16 = add(x = var_6840_cast_fp16, y = var_6841_to_fp16)[name = tensor("op_6842_cast_fp16")]; tensor var_6843_epsilon_0 = const()[name = tensor("op_6843_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_6843_cast_fp16 = rsqrt(epsilon = var_6843_epsilon_0, x = var_6842_cast_fp16)[name = tensor("op_6843_cast_fp16")]; tensor output_737_cast_fp16 = mul(x = x_735, y = var_6843_cast_fp16)[name = tensor("output_737_cast_fp16")]; tensor var_6847_to_fp16 = const()[name = tensor("op_6847_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940858432)))]; tensor output_739_cast_fp16 = mul(x = output_737_cast_fp16, y = var_6847_to_fp16)[name = tensor("output_739_cast_fp16")]; tensor input_369 = linear(bias = linear_4_bias_0, weight = wrapped_model_language_model_layers_30_mlp_gate_proj_weight_palettized, x = output_739_cast_fp16)[name = tensor("linear_214")]; tensor var_6855_mode_0 = const()[name = tensor("op_6855_mode_0"), val = tensor("TANH_APPROXIMATION")]; tensor var_6855 = gelu(mode = var_6855_mode_0, x = input_369)[name = tensor("op_6855")]; tensor var_6857 = linear(bias = linear_4_bias_0, weight = wrapped_model_language_model_layers_30_mlp_up_proj_weight_palettized, x = output_739_cast_fp16)[name = tensor("linear_215")]; tensor input_371 = mul(x = var_6855, y = var_6857)[name = tensor("input_371")]; tensor x_739 = linear(bias = linear_3_bias_0, weight = wrapped_model_language_model_layers_30_mlp_down_proj_weight_palettized, x = input_371)[name = tensor("linear_216")]; tensor var_22_promoted_185_to_fp16 = const()[name = tensor("op_22_promoted_185_to_fp16"), val = tensor(0x1p+1)]; tensor var_6863_cast_fp16 = pow(x = x_739, y = var_22_promoted_185_to_fp16)[name = tensor("op_6863_cast_fp16")]; tensor var_6865_axes_0 = const()[name = tensor("op_6865_axes_0"), val = tensor([-1])]; tensor var_6865_keep_dims_0 = const()[name = tensor("op_6865_keep_dims_0"), val = tensor(true)]; tensor var_6865_cast_fp16 = reduce_mean(axes = var_6865_axes_0, keep_dims = var_6865_keep_dims_0, x = var_6863_cast_fp16)[name = tensor("op_6865_cast_fp16")]; tensor var_6866_to_fp16 = const()[name = tensor("op_6866_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_6867_cast_fp16 = add(x = var_6865_cast_fp16, y = var_6866_to_fp16)[name = tensor("op_6867_cast_fp16")]; tensor var_6868_epsilon_0 = const()[name = tensor("op_6868_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_6868_cast_fp16 = rsqrt(epsilon = var_6868_epsilon_0, x = var_6867_cast_fp16)[name = tensor("op_6868_cast_fp16")]; tensor output_741_cast_fp16 = mul(x = x_739, y = var_6868_cast_fp16)[name = tensor("output_741_cast_fp16")]; tensor var_6872_to_fp16 = const()[name = tensor("op_6872_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940863616)))]; tensor output_743_cast_fp16 = mul(x = output_741_cast_fp16, y = var_6872_to_fp16)[name = tensor("output_743_cast_fp16")]; tensor x_743 = add(x = x_735, y = output_743_cast_fp16)[name = tensor("x_743")]; tensor var_22_promoted_186_to_fp16 = const()[name = tensor("op_22_promoted_186_to_fp16"), val = tensor(0x1p+1)]; tensor var_6884_cast_fp16 = pow(x = x_743, y = var_22_promoted_186_to_fp16)[name = tensor("op_6884_cast_fp16")]; tensor var_6886_axes_0 = const()[name = tensor("op_6886_axes_0"), val = tensor([-1])]; tensor var_6886_keep_dims_0 = const()[name = tensor("op_6886_keep_dims_0"), val = tensor(true)]; tensor var_6886_cast_fp16 = reduce_mean(axes = var_6886_axes_0, keep_dims = var_6886_keep_dims_0, x = var_6884_cast_fp16)[name = tensor("op_6886_cast_fp16")]; tensor var_6887_to_fp16 = const()[name = tensor("op_6887_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_6888_cast_fp16 = add(x = var_6886_cast_fp16, y = var_6887_to_fp16)[name = tensor("op_6888_cast_fp16")]; tensor var_6889_epsilon_0 = const()[name = tensor("op_6889_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_6889_cast_fp16 = rsqrt(epsilon = var_6889_epsilon_0, x = var_6888_cast_fp16)[name = tensor("op_6889_cast_fp16")]; tensor output_745_cast_fp16 = mul(x = x_743, y = var_6889_cast_fp16)[name = tensor("output_745_cast_fp16")]; tensor var_6893_to_fp16 = const()[name = tensor("op_6893_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940868800)))]; tensor output_747_cast_fp16 = mul(x = output_745_cast_fp16, y = var_6893_to_fp16)[name = tensor("output_747_cast_fp16")]; tensor var_6905 = linear(bias = linear_0_bias_0, weight = wrapped_model_language_model_layers_31_self_attn_q_proj_weight_palettized, x = output_747_cast_fp16)[name = tensor("linear_217")]; tensor var_6906 = const()[name = tensor("op_6906"), val = tensor([1, 256, -1, 256])]; tensor var_6907 = reshape(shape = var_6906, x = var_6905)[name = tensor("op_6907")]; tensor x_747_perm_0 = const()[name = tensor("x_747_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_6910 = linear(bias = linear_1_bias_0, weight = wrapped_model_language_model_layers_31_self_attn_k_proj_weight_palettized, x = output_747_cast_fp16)[name = tensor("linear_218")]; tensor var_6911 = const()[name = tensor("op_6911"), val = tensor([1, 256, -1, 256])]; tensor var_6912 = reshape(shape = var_6911, x = var_6910)[name = tensor("op_6912")]; tensor x_751_perm_0 = const()[name = tensor("x_751_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_6915 = linear(bias = linear_1_bias_0, weight = wrapped_model_language_model_layers_31_self_attn_v_proj_weight_palettized, x = output_747_cast_fp16)[name = tensor("linear_219")]; tensor var_6916 = const()[name = tensor("op_6916"), val = tensor([1, 256, -1, 256])]; tensor var_6917 = reshape(shape = var_6916, x = var_6915)[name = tensor("op_6917")]; tensor hidden_states_441_perm_0 = const()[name = tensor("hidden_states_441_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_22_promoted_187_to_fp16 = const()[name = tensor("op_22_promoted_187_to_fp16"), val = tensor(0x1p+1)]; tensor x_747 = transpose(perm = x_747_perm_0, x = var_6907)[name = tensor("transpose_11")]; tensor var_6921_cast_fp16 = pow(x = x_747, y = var_22_promoted_187_to_fp16)[name = tensor("op_6921_cast_fp16")]; tensor var_6923_axes_0 = const()[name = tensor("op_6923_axes_0"), val = tensor([-1])]; tensor var_6923_keep_dims_0 = const()[name = tensor("op_6923_keep_dims_0"), val = tensor(true)]; tensor var_6923_cast_fp16 = reduce_mean(axes = var_6923_axes_0, keep_dims = var_6923_keep_dims_0, x = var_6921_cast_fp16)[name = tensor("op_6923_cast_fp16")]; tensor var_6924_to_fp16 = const()[name = tensor("op_6924_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_6925_cast_fp16 = add(x = var_6923_cast_fp16, y = var_6924_to_fp16)[name = tensor("op_6925_cast_fp16")]; tensor var_6926_epsilon_0 = const()[name = tensor("op_6926_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_6926_cast_fp16 = rsqrt(epsilon = var_6926_epsilon_0, x = var_6925_cast_fp16)[name = tensor("op_6926_cast_fp16")]; tensor output_749_cast_fp16 = mul(x = x_747, y = var_6926_cast_fp16)[name = tensor("output_749_cast_fp16")]; tensor var_6930_to_fp16 = const()[name = tensor("op_6930_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940873984)))]; tensor output_751_cast_fp16 = mul(x = output_749_cast_fp16, y = var_6930_to_fp16)[name = tensor("output_751_cast_fp16")]; tensor var_22_promoted_188_to_fp16 = const()[name = tensor("op_22_promoted_188_to_fp16"), val = tensor(0x1p+1)]; tensor x_751 = transpose(perm = x_751_perm_0, x = var_6912)[name = tensor("transpose_10")]; tensor var_6935_cast_fp16 = pow(x = x_751, y = var_22_promoted_188_to_fp16)[name = tensor("op_6935_cast_fp16")]; tensor var_6937_axes_0 = const()[name = tensor("op_6937_axes_0"), val = tensor([-1])]; tensor var_6937_keep_dims_0 = const()[name = tensor("op_6937_keep_dims_0"), val = tensor(true)]; tensor var_6937_cast_fp16 = reduce_mean(axes = var_6937_axes_0, keep_dims = var_6937_keep_dims_0, x = var_6935_cast_fp16)[name = tensor("op_6937_cast_fp16")]; tensor var_6938_to_fp16 = const()[name = tensor("op_6938_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_6939_cast_fp16 = add(x = var_6937_cast_fp16, y = var_6938_to_fp16)[name = tensor("op_6939_cast_fp16")]; tensor var_6940_epsilon_0 = const()[name = tensor("op_6940_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_6940_cast_fp16 = rsqrt(epsilon = var_6940_epsilon_0, x = var_6939_cast_fp16)[name = tensor("op_6940_cast_fp16")]; tensor output_753_cast_fp16 = mul(x = x_751, y = var_6940_cast_fp16)[name = tensor("output_753_cast_fp16")]; tensor var_6944_to_fp16 = const()[name = tensor("op_6944_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940874560)))]; tensor output_755_cast_fp16 = mul(x = output_753_cast_fp16, y = var_6944_to_fp16)[name = tensor("output_755_cast_fp16")]; tensor var_6949 = mul(x = output_751_cast_fp16, y = cos_7_palettized)[name = tensor("op_6949")]; tensor x1_125_begin_0 = const()[name = tensor("x1_125_begin_0"), val = tensor([0, 0, 0, 0])]; tensor x1_125_end_0 = const()[name = tensor("x1_125_end_0"), val = tensor([1, 8, 256, 128])]; tensor x1_125_end_mask_0 = const()[name = tensor("x1_125_end_mask_0"), val = tensor([true, true, true, false])]; tensor x1_125 = slice_by_index(begin = x1_125_begin_0, end = x1_125_end_0, end_mask = x1_125_end_mask_0, x = output_751_cast_fp16)[name = tensor("x1_125")]; tensor x2_125_begin_0 = const()[name = tensor("x2_125_begin_0"), val = tensor([0, 0, 0, 128])]; tensor x2_125_end_0 = const()[name = tensor("x2_125_end_0"), val = tensor([1, 8, 256, 256])]; tensor x2_125_end_mask_0 = const()[name = tensor("x2_125_end_mask_0"), val = tensor([true, true, true, true])]; tensor x2_125 = slice_by_index(begin = x2_125_begin_0, end = x2_125_end_0, end_mask = x2_125_end_mask_0, x = output_751_cast_fp16)[name = tensor("x2_125")]; tensor const_748_promoted = const()[name = tensor("const_748_promoted"), val = tensor(-0x1p+0)]; tensor var_6960 = mul(x = x2_125, y = const_748_promoted)[name = tensor("op_6960")]; tensor var_6962_interleave_0 = const()[name = tensor("op_6962_interleave_0"), val = tensor(false)]; tensor var_6962 = concat(axis = var_24, interleave = var_6962_interleave_0, values = (var_6960, x1_125))[name = tensor("op_6962")]; tensor var_6963 = mul(x = var_6962, y = sin_7_palettized)[name = tensor("op_6963")]; tensor query_63 = add(x = var_6949, y = var_6963)[name = tensor("query_63")]; tensor var_6965 = mul(x = output_755_cast_fp16, y = cos_7_palettized)[name = tensor("op_6965")]; tensor x1_127_begin_0 = const()[name = tensor("x1_127_begin_0"), val = tensor([0, 0, 0, 0])]; tensor x1_127_end_0 = const()[name = tensor("x1_127_end_0"), val = tensor([1, 4, 256, 128])]; tensor x1_127_end_mask_0 = const()[name = tensor("x1_127_end_mask_0"), val = tensor([true, true, true, false])]; tensor x1_127 = slice_by_index(begin = x1_127_begin_0, end = x1_127_end_0, end_mask = x1_127_end_mask_0, x = output_755_cast_fp16)[name = tensor("x1_127")]; tensor x2_127_begin_0 = const()[name = tensor("x2_127_begin_0"), val = tensor([0, 0, 0, 128])]; tensor x2_127_end_0 = const()[name = tensor("x2_127_end_0"), val = tensor([1, 4, 256, 256])]; tensor x2_127_end_mask_0 = const()[name = tensor("x2_127_end_mask_0"), val = tensor([true, true, true, true])]; tensor x2_127 = slice_by_index(begin = x2_127_begin_0, end = x2_127_end_0, end_mask = x2_127_end_mask_0, x = output_755_cast_fp16)[name = tensor("x2_127")]; tensor const_751_promoted = const()[name = tensor("const_751_promoted"), val = tensor(-0x1p+0)]; tensor var_6976 = mul(x = x2_127, y = const_751_promoted)[name = tensor("op_6976")]; tensor var_6978_interleave_0 = const()[name = tensor("op_6978_interleave_0"), val = tensor(false)]; tensor var_6978 = concat(axis = var_24, interleave = var_6978_interleave_0, values = (var_6976, x1_127))[name = tensor("op_6978")]; tensor var_6979 = mul(x = var_6978, y = sin_7_palettized)[name = tensor("op_6979")]; tensor hidden_states_437 = add(x = var_6965, y = var_6979)[name = tensor("hidden_states_437")]; tensor var_6988_axes_0 = const()[name = tensor("op_6988_axes_0"), val = tensor([2])]; tensor var_6988 = expand_dims(axes = var_6988_axes_0, x = hidden_states_437)[name = tensor("op_6988")]; tensor hidden_states_439_reps_0 = const()[name = tensor("hidden_states_439_reps_0"), val = tensor([1, 1, 2, 1, 1])]; tensor hidden_states_439 = tile(reps = hidden_states_439_reps_0, x = var_6988)[name = tensor("hidden_states_439")]; tensor var_6996 = const()[name = tensor("op_6996"), val = tensor([1, 8, 256, 256])]; tensor key_states_63 = reshape(shape = var_6996, x = hidden_states_439)[name = tensor("key_states_63")]; tensor var_7005_axes_0 = const()[name = tensor("op_7005_axes_0"), val = tensor([2])]; tensor hidden_states_441 = transpose(perm = hidden_states_441_perm_0, x = var_6917)[name = tensor("transpose_9")]; tensor var_7005 = expand_dims(axes = var_7005_axes_0, x = hidden_states_441)[name = tensor("op_7005")]; tensor hidden_states_443_reps_0 = const()[name = tensor("hidden_states_443_reps_0"), val = tensor([1, 1, 2, 1, 1])]; tensor hidden_states_443 = tile(reps = hidden_states_443_reps_0, x = var_7005)[name = tensor("hidden_states_443")]; tensor var_7013 = const()[name = tensor("op_7013"), val = tensor([1, 8, 256, 256])]; tensor value_states_63 = reshape(shape = var_7013, x = hidden_states_443)[name = tensor("value_states_63")]; tensor var_7016_transpose_x_1 = const()[name = tensor("op_7016_transpose_x_1"), val = tensor(false)]; tensor var_7016_transpose_y_1 = const()[name = tensor("op_7016_transpose_y_1"), val = tensor(true)]; tensor var_7016 = matmul(transpose_x = var_7016_transpose_x_1, transpose_y = var_7016_transpose_y_1, x = query_63, y = key_states_63)[name = tensor("op_7016")]; tensor var_7017_to_fp16 = const()[name = tensor("op_7017_to_fp16"), val = tensor(0x1p-4)]; tensor attn_weights_125_cast_fp16 = mul(x = var_7016, y = var_7017_to_fp16)[name = tensor("attn_weights_125_cast_fp16")]; tensor input_373_cast_fp16 = add(x = attn_weights_125_cast_fp16, y = attention_mask_to_fp16_palettized)[name = tensor("input_373_cast_fp16")]; tensor var_7025_cast_fp16 = softmax(axis = var_24, x = input_373_cast_fp16)[name = tensor("op_7025_cast_fp16")]; tensor attn_output_125_transpose_x_0 = const()[name = tensor("attn_output_125_transpose_x_0"), val = tensor(false)]; tensor attn_output_125_transpose_y_0 = const()[name = tensor("attn_output_125_transpose_y_0"), val = tensor(false)]; tensor attn_output_125 = matmul(transpose_x = attn_output_125_transpose_x_0, transpose_y = attn_output_125_transpose_y_0, x = var_7025_cast_fp16, y = value_states_63)[name = tensor("attn_output_125")]; tensor var_7029_perm_0 = const()[name = tensor("op_7029_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_7031 = const()[name = tensor("op_7031"), val = tensor([1, 256, -1])]; tensor var_7029 = transpose(perm = var_7029_perm_0, x = attn_output_125)[name = tensor("transpose_8")]; tensor var_7032 = reshape(shape = var_7031, x = var_7029)[name = tensor("op_7032")]; tensor x_755 = linear(bias = linear_3_bias_0, weight = wrapped_model_language_model_layers_31_self_attn_o_proj_weight_palettized, x = var_7032)[name = tensor("linear_220")]; tensor var_22_promoted_189_to_fp16 = const()[name = tensor("op_22_promoted_189_to_fp16"), val = tensor(0x1p+1)]; tensor var_7038_cast_fp16 = pow(x = x_755, y = var_22_promoted_189_to_fp16)[name = tensor("op_7038_cast_fp16")]; tensor var_7040_axes_0 = const()[name = tensor("op_7040_axes_0"), val = tensor([-1])]; tensor var_7040_keep_dims_0 = const()[name = tensor("op_7040_keep_dims_0"), val = tensor(true)]; tensor var_7040_cast_fp16 = reduce_mean(axes = var_7040_axes_0, keep_dims = var_7040_keep_dims_0, x = var_7038_cast_fp16)[name = tensor("op_7040_cast_fp16")]; tensor var_7041_to_fp16 = const()[name = tensor("op_7041_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_7042_cast_fp16 = add(x = var_7040_cast_fp16, y = var_7041_to_fp16)[name = tensor("op_7042_cast_fp16")]; tensor var_7043_epsilon_0 = const()[name = tensor("op_7043_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_7043_cast_fp16 = rsqrt(epsilon = var_7043_epsilon_0, x = var_7042_cast_fp16)[name = tensor("op_7043_cast_fp16")]; tensor output_757_cast_fp16 = mul(x = x_755, y = var_7043_cast_fp16)[name = tensor("output_757_cast_fp16")]; tensor var_7047_to_fp16 = const()[name = tensor("op_7047_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940875136)))]; tensor output_759_cast_fp16 = mul(x = output_757_cast_fp16, y = var_7047_to_fp16)[name = tensor("output_759_cast_fp16")]; tensor x_759 = add(x = x_743, y = output_759_cast_fp16)[name = tensor("x_759")]; tensor var_22_promoted_190_to_fp16 = const()[name = tensor("op_22_promoted_190_to_fp16"), val = tensor(0x1p+1)]; tensor var_7053_cast_fp16 = pow(x = x_759, y = var_22_promoted_190_to_fp16)[name = tensor("op_7053_cast_fp16")]; tensor var_7055_axes_0 = const()[name = tensor("op_7055_axes_0"), val = tensor([-1])]; tensor var_7055_keep_dims_0 = const()[name = tensor("op_7055_keep_dims_0"), val = tensor(true)]; tensor var_7055_cast_fp16 = reduce_mean(axes = var_7055_axes_0, keep_dims = var_7055_keep_dims_0, x = var_7053_cast_fp16)[name = tensor("op_7055_cast_fp16")]; tensor var_7056_to_fp16 = const()[name = tensor("op_7056_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_7057_cast_fp16 = add(x = var_7055_cast_fp16, y = var_7056_to_fp16)[name = tensor("op_7057_cast_fp16")]; tensor var_7058_epsilon_0 = const()[name = tensor("op_7058_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_7058_cast_fp16 = rsqrt(epsilon = var_7058_epsilon_0, x = var_7057_cast_fp16)[name = tensor("op_7058_cast_fp16")]; tensor output_761_cast_fp16 = mul(x = x_759, y = var_7058_cast_fp16)[name = tensor("output_761_cast_fp16")]; tensor var_7062_to_fp16 = const()[name = tensor("op_7062_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940880320)))]; tensor output_763_cast_fp16 = mul(x = output_761_cast_fp16, y = var_7062_to_fp16)[name = tensor("output_763_cast_fp16")]; tensor input_381 = linear(bias = linear_4_bias_0, weight = wrapped_model_language_model_layers_31_mlp_gate_proj_weight_palettized, x = output_763_cast_fp16)[name = tensor("linear_221")]; tensor var_7070_mode_0 = const()[name = tensor("op_7070_mode_0"), val = tensor("TANH_APPROXIMATION")]; tensor var_7070 = gelu(mode = var_7070_mode_0, x = input_381)[name = tensor("op_7070")]; tensor var_7072 = linear(bias = linear_4_bias_0, weight = wrapped_model_language_model_layers_31_mlp_up_proj_weight_palettized, x = output_763_cast_fp16)[name = tensor("linear_222")]; tensor input_383 = mul(x = var_7070, y = var_7072)[name = tensor("input_383")]; tensor x_763 = linear(bias = linear_3_bias_0, weight = wrapped_model_language_model_layers_31_mlp_down_proj_weight_palettized, x = input_383)[name = tensor("linear_223")]; tensor var_22_promoted_191_to_fp16 = const()[name = tensor("op_22_promoted_191_to_fp16"), val = tensor(0x1p+1)]; tensor var_7078_cast_fp16 = pow(x = x_763, y = var_22_promoted_191_to_fp16)[name = tensor("op_7078_cast_fp16")]; tensor var_7080_axes_0 = const()[name = tensor("op_7080_axes_0"), val = tensor([-1])]; tensor var_7080_keep_dims_0 = const()[name = tensor("op_7080_keep_dims_0"), val = tensor(true)]; tensor var_7080_cast_fp16 = reduce_mean(axes = var_7080_axes_0, keep_dims = var_7080_keep_dims_0, x = var_7078_cast_fp16)[name = tensor("op_7080_cast_fp16")]; tensor var_7081_to_fp16 = const()[name = tensor("op_7081_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_7082_cast_fp16 = add(x = var_7080_cast_fp16, y = var_7081_to_fp16)[name = tensor("op_7082_cast_fp16")]; tensor var_7083_epsilon_0 = const()[name = tensor("op_7083_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_7083_cast_fp16 = rsqrt(epsilon = var_7083_epsilon_0, x = var_7082_cast_fp16)[name = tensor("op_7083_cast_fp16")]; tensor output_765_cast_fp16 = mul(x = x_763, y = var_7083_cast_fp16)[name = tensor("output_765_cast_fp16")]; tensor var_7087_to_fp16 = const()[name = tensor("op_7087_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940885504)))]; tensor output_767_cast_fp16 = mul(x = output_765_cast_fp16, y = var_7087_to_fp16)[name = tensor("output_767_cast_fp16")]; tensor x_767 = add(x = x_759, y = output_767_cast_fp16)[name = tensor("x_767")]; tensor var_22_promoted_192_to_fp16 = const()[name = tensor("op_22_promoted_192_to_fp16"), val = tensor(0x1p+1)]; tensor var_7099_cast_fp16 = pow(x = x_767, y = var_22_promoted_192_to_fp16)[name = tensor("op_7099_cast_fp16")]; tensor var_7101_axes_0 = const()[name = tensor("op_7101_axes_0"), val = tensor([-1])]; tensor var_7101_keep_dims_0 = const()[name = tensor("op_7101_keep_dims_0"), val = tensor(true)]; tensor var_7101_cast_fp16 = reduce_mean(axes = var_7101_axes_0, keep_dims = var_7101_keep_dims_0, x = var_7099_cast_fp16)[name = tensor("op_7101_cast_fp16")]; tensor var_7102_to_fp16 = const()[name = tensor("op_7102_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_7103_cast_fp16 = add(x = var_7101_cast_fp16, y = var_7102_to_fp16)[name = tensor("op_7103_cast_fp16")]; tensor var_7104_epsilon_0 = const()[name = tensor("op_7104_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_7104_cast_fp16 = rsqrt(epsilon = var_7104_epsilon_0, x = var_7103_cast_fp16)[name = tensor("op_7104_cast_fp16")]; tensor output_769_cast_fp16 = mul(x = x_767, y = var_7104_cast_fp16)[name = tensor("output_769_cast_fp16")]; tensor var_7108_to_fp16 = const()[name = tensor("op_7108_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940890688)))]; tensor output_771_cast_fp16 = mul(x = output_769_cast_fp16, y = var_7108_to_fp16)[name = tensor("output_771_cast_fp16")]; tensor var_7120 = linear(bias = linear_0_bias_0, weight = wrapped_model_language_model_layers_32_self_attn_q_proj_weight_palettized, x = output_771_cast_fp16)[name = tensor("linear_224")]; tensor var_7121 = const()[name = tensor("op_7121"), val = tensor([1, 256, -1, 256])]; tensor var_7122 = reshape(shape = var_7121, x = var_7120)[name = tensor("op_7122")]; tensor x_771_perm_0 = const()[name = tensor("x_771_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_7125 = linear(bias = linear_1_bias_0, weight = wrapped_model_language_model_layers_32_self_attn_k_proj_weight_palettized, x = output_771_cast_fp16)[name = tensor("linear_225")]; tensor var_7126 = const()[name = tensor("op_7126"), val = tensor([1, 256, -1, 256])]; tensor var_7127 = reshape(shape = var_7126, x = var_7125)[name = tensor("op_7127")]; tensor x_775_perm_0 = const()[name = tensor("x_775_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_7130 = linear(bias = linear_1_bias_0, weight = wrapped_model_language_model_layers_32_self_attn_v_proj_weight_palettized, x = output_771_cast_fp16)[name = tensor("linear_226")]; tensor var_7131 = const()[name = tensor("op_7131"), val = tensor([1, 256, -1, 256])]; tensor var_7132 = reshape(shape = var_7131, x = var_7130)[name = tensor("op_7132")]; tensor hidden_states_455_perm_0 = const()[name = tensor("hidden_states_455_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_22_promoted_193_to_fp16 = const()[name = tensor("op_22_promoted_193_to_fp16"), val = tensor(0x1p+1)]; tensor x_771 = transpose(perm = x_771_perm_0, x = var_7122)[name = tensor("transpose_7")]; tensor var_7136_cast_fp16 = pow(x = x_771, y = var_22_promoted_193_to_fp16)[name = tensor("op_7136_cast_fp16")]; tensor var_7138_axes_0 = const()[name = tensor("op_7138_axes_0"), val = tensor([-1])]; tensor var_7138_keep_dims_0 = const()[name = tensor("op_7138_keep_dims_0"), val = tensor(true)]; tensor var_7138_cast_fp16 = reduce_mean(axes = var_7138_axes_0, keep_dims = var_7138_keep_dims_0, x = var_7136_cast_fp16)[name = tensor("op_7138_cast_fp16")]; tensor var_7139_to_fp16 = const()[name = tensor("op_7139_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_7140_cast_fp16 = add(x = var_7138_cast_fp16, y = var_7139_to_fp16)[name = tensor("op_7140_cast_fp16")]; tensor var_7141_epsilon_0 = const()[name = tensor("op_7141_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_7141_cast_fp16 = rsqrt(epsilon = var_7141_epsilon_0, x = var_7140_cast_fp16)[name = tensor("op_7141_cast_fp16")]; tensor output_773_cast_fp16 = mul(x = x_771, y = var_7141_cast_fp16)[name = tensor("output_773_cast_fp16")]; tensor var_7145_to_fp16 = const()[name = tensor("op_7145_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940895872)))]; tensor output_775_cast_fp16 = mul(x = output_773_cast_fp16, y = var_7145_to_fp16)[name = tensor("output_775_cast_fp16")]; tensor var_22_promoted_194_to_fp16 = const()[name = tensor("op_22_promoted_194_to_fp16"), val = tensor(0x1p+1)]; tensor x_775 = transpose(perm = x_775_perm_0, x = var_7127)[name = tensor("transpose_6")]; tensor var_7150_cast_fp16 = pow(x = x_775, y = var_22_promoted_194_to_fp16)[name = tensor("op_7150_cast_fp16")]; tensor var_7152_axes_0 = const()[name = tensor("op_7152_axes_0"), val = tensor([-1])]; tensor var_7152_keep_dims_0 = const()[name = tensor("op_7152_keep_dims_0"), val = tensor(true)]; tensor var_7152_cast_fp16 = reduce_mean(axes = var_7152_axes_0, keep_dims = var_7152_keep_dims_0, x = var_7150_cast_fp16)[name = tensor("op_7152_cast_fp16")]; tensor var_7153_to_fp16 = const()[name = tensor("op_7153_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_7154_cast_fp16 = add(x = var_7152_cast_fp16, y = var_7153_to_fp16)[name = tensor("op_7154_cast_fp16")]; tensor var_7155_epsilon_0 = const()[name = tensor("op_7155_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_7155_cast_fp16 = rsqrt(epsilon = var_7155_epsilon_0, x = var_7154_cast_fp16)[name = tensor("op_7155_cast_fp16")]; tensor output_777_cast_fp16 = mul(x = x_775, y = var_7155_cast_fp16)[name = tensor("output_777_cast_fp16")]; tensor var_7159_to_fp16 = const()[name = tensor("op_7159_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940896448)))]; tensor output_779_cast_fp16 = mul(x = output_777_cast_fp16, y = var_7159_to_fp16)[name = tensor("output_779_cast_fp16")]; tensor var_7164 = mul(x = output_775_cast_fp16, y = cos_7_palettized)[name = tensor("op_7164")]; tensor x1_129_begin_0 = const()[name = tensor("x1_129_begin_0"), val = tensor([0, 0, 0, 0])]; tensor x1_129_end_0 = const()[name = tensor("x1_129_end_0"), val = tensor([1, 8, 256, 128])]; tensor x1_129_end_mask_0 = const()[name = tensor("x1_129_end_mask_0"), val = tensor([true, true, true, false])]; tensor x1_129 = slice_by_index(begin = x1_129_begin_0, end = x1_129_end_0, end_mask = x1_129_end_mask_0, x = output_775_cast_fp16)[name = tensor("x1_129")]; tensor x2_129_begin_0 = const()[name = tensor("x2_129_begin_0"), val = tensor([0, 0, 0, 128])]; tensor x2_129_end_0 = const()[name = tensor("x2_129_end_0"), val = tensor([1, 8, 256, 256])]; tensor x2_129_end_mask_0 = const()[name = tensor("x2_129_end_mask_0"), val = tensor([true, true, true, true])]; tensor x2_129 = slice_by_index(begin = x2_129_begin_0, end = x2_129_end_0, end_mask = x2_129_end_mask_0, x = output_775_cast_fp16)[name = tensor("x2_129")]; tensor const_771_promoted = const()[name = tensor("const_771_promoted"), val = tensor(-0x1p+0)]; tensor var_7175 = mul(x = x2_129, y = const_771_promoted)[name = tensor("op_7175")]; tensor var_7177_interleave_0 = const()[name = tensor("op_7177_interleave_0"), val = tensor(false)]; tensor var_7177 = concat(axis = var_24, interleave = var_7177_interleave_0, values = (var_7175, x1_129))[name = tensor("op_7177")]; tensor var_7178 = mul(x = var_7177, y = sin_7_palettized)[name = tensor("op_7178")]; tensor query_65 = add(x = var_7164, y = var_7178)[name = tensor("query_65")]; tensor var_7180 = mul(x = output_779_cast_fp16, y = cos_7_palettized)[name = tensor("op_7180")]; tensor x1_131_begin_0 = const()[name = tensor("x1_131_begin_0"), val = tensor([0, 0, 0, 0])]; tensor x1_131_end_0 = const()[name = tensor("x1_131_end_0"), val = tensor([1, 4, 256, 128])]; tensor x1_131_end_mask_0 = const()[name = tensor("x1_131_end_mask_0"), val = tensor([true, true, true, false])]; tensor x1_131 = slice_by_index(begin = x1_131_begin_0, end = x1_131_end_0, end_mask = x1_131_end_mask_0, x = output_779_cast_fp16)[name = tensor("x1_131")]; tensor x2_131_begin_0 = const()[name = tensor("x2_131_begin_0"), val = tensor([0, 0, 0, 128])]; tensor x2_131_end_0 = const()[name = tensor("x2_131_end_0"), val = tensor([1, 4, 256, 256])]; tensor x2_131_end_mask_0 = const()[name = tensor("x2_131_end_mask_0"), val = tensor([true, true, true, true])]; tensor x2_131 = slice_by_index(begin = x2_131_begin_0, end = x2_131_end_0, end_mask = x2_131_end_mask_0, x = output_779_cast_fp16)[name = tensor("x2_131")]; tensor const_774_promoted = const()[name = tensor("const_774_promoted"), val = tensor(-0x1p+0)]; tensor var_7191 = mul(x = x2_131, y = const_774_promoted)[name = tensor("op_7191")]; tensor var_7193_interleave_0 = const()[name = tensor("op_7193_interleave_0"), val = tensor(false)]; tensor var_7193 = concat(axis = var_24, interleave = var_7193_interleave_0, values = (var_7191, x1_131))[name = tensor("op_7193")]; tensor var_7194 = mul(x = var_7193, y = sin_7_palettized)[name = tensor("op_7194")]; tensor hidden_states_451 = add(x = var_7180, y = var_7194)[name = tensor("hidden_states_451")]; tensor var_7203_axes_0 = const()[name = tensor("op_7203_axes_0"), val = tensor([2])]; tensor var_7203 = expand_dims(axes = var_7203_axes_0, x = hidden_states_451)[name = tensor("op_7203")]; tensor hidden_states_453_reps_0 = const()[name = tensor("hidden_states_453_reps_0"), val = tensor([1, 1, 2, 1, 1])]; tensor hidden_states_453 = tile(reps = hidden_states_453_reps_0, x = var_7203)[name = tensor("hidden_states_453")]; tensor var_7211 = const()[name = tensor("op_7211"), val = tensor([1, 8, 256, 256])]; tensor key_states_65 = reshape(shape = var_7211, x = hidden_states_453)[name = tensor("key_states_65")]; tensor var_7220_axes_0 = const()[name = tensor("op_7220_axes_0"), val = tensor([2])]; tensor hidden_states_455 = transpose(perm = hidden_states_455_perm_0, x = var_7132)[name = tensor("transpose_5")]; tensor var_7220 = expand_dims(axes = var_7220_axes_0, x = hidden_states_455)[name = tensor("op_7220")]; tensor hidden_states_457_reps_0 = const()[name = tensor("hidden_states_457_reps_0"), val = tensor([1, 1, 2, 1, 1])]; tensor hidden_states_457 = tile(reps = hidden_states_457_reps_0, x = var_7220)[name = tensor("hidden_states_457")]; tensor var_7228 = const()[name = tensor("op_7228"), val = tensor([1, 8, 256, 256])]; tensor value_states_65 = reshape(shape = var_7228, x = hidden_states_457)[name = tensor("value_states_65")]; tensor var_7231_transpose_x_1 = const()[name = tensor("op_7231_transpose_x_1"), val = tensor(false)]; tensor var_7231_transpose_y_1 = const()[name = tensor("op_7231_transpose_y_1"), val = tensor(true)]; tensor var_7231 = matmul(transpose_x = var_7231_transpose_x_1, transpose_y = var_7231_transpose_y_1, x = query_65, y = key_states_65)[name = tensor("op_7231")]; tensor var_7232_to_fp16 = const()[name = tensor("op_7232_to_fp16"), val = tensor(0x1p-4)]; tensor attn_weights_129_cast_fp16 = mul(x = var_7231, y = var_7232_to_fp16)[name = tensor("attn_weights_129_cast_fp16")]; tensor input_385_cast_fp16 = add(x = attn_weights_129_cast_fp16, y = attention_mask_to_fp16_palettized)[name = tensor("input_385_cast_fp16")]; tensor var_7240_cast_fp16 = softmax(axis = var_24, x = input_385_cast_fp16)[name = tensor("op_7240_cast_fp16")]; tensor attn_output_129_transpose_x_0 = const()[name = tensor("attn_output_129_transpose_x_0"), val = tensor(false)]; tensor attn_output_129_transpose_y_0 = const()[name = tensor("attn_output_129_transpose_y_0"), val = tensor(false)]; tensor attn_output_129 = matmul(transpose_x = attn_output_129_transpose_x_0, transpose_y = attn_output_129_transpose_y_0, x = var_7240_cast_fp16, y = value_states_65)[name = tensor("attn_output_129")]; tensor var_7244_perm_0 = const()[name = tensor("op_7244_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_7246 = const()[name = tensor("op_7246"), val = tensor([1, 256, -1])]; tensor var_7244 = transpose(perm = var_7244_perm_0, x = attn_output_129)[name = tensor("transpose_4")]; tensor var_7247 = reshape(shape = var_7246, x = var_7244)[name = tensor("op_7247")]; tensor x_779 = linear(bias = linear_3_bias_0, weight = wrapped_model_language_model_layers_32_self_attn_o_proj_weight_palettized, x = var_7247)[name = tensor("linear_227")]; tensor var_22_promoted_195_to_fp16 = const()[name = tensor("op_22_promoted_195_to_fp16"), val = tensor(0x1p+1)]; tensor var_7253_cast_fp16 = pow(x = x_779, y = var_22_promoted_195_to_fp16)[name = tensor("op_7253_cast_fp16")]; tensor var_7255_axes_0 = const()[name = tensor("op_7255_axes_0"), val = tensor([-1])]; tensor var_7255_keep_dims_0 = const()[name = tensor("op_7255_keep_dims_0"), val = tensor(true)]; tensor var_7255_cast_fp16 = reduce_mean(axes = var_7255_axes_0, keep_dims = var_7255_keep_dims_0, x = var_7253_cast_fp16)[name = tensor("op_7255_cast_fp16")]; tensor var_7256_to_fp16 = const()[name = tensor("op_7256_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_7257_cast_fp16 = add(x = var_7255_cast_fp16, y = var_7256_to_fp16)[name = tensor("op_7257_cast_fp16")]; tensor var_7258_epsilon_0 = const()[name = tensor("op_7258_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_7258_cast_fp16 = rsqrt(epsilon = var_7258_epsilon_0, x = var_7257_cast_fp16)[name = tensor("op_7258_cast_fp16")]; tensor output_781_cast_fp16 = mul(x = x_779, y = var_7258_cast_fp16)[name = tensor("output_781_cast_fp16")]; tensor var_7262_to_fp16 = const()[name = tensor("op_7262_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940897024)))]; tensor output_783_cast_fp16 = mul(x = output_781_cast_fp16, y = var_7262_to_fp16)[name = tensor("output_783_cast_fp16")]; tensor x_783 = add(x = x_767, y = output_783_cast_fp16)[name = tensor("x_783")]; tensor var_22_promoted_196_to_fp16 = const()[name = tensor("op_22_promoted_196_to_fp16"), val = tensor(0x1p+1)]; tensor var_7268_cast_fp16 = pow(x = x_783, y = var_22_promoted_196_to_fp16)[name = tensor("op_7268_cast_fp16")]; tensor var_7270_axes_0 = const()[name = tensor("op_7270_axes_0"), val = tensor([-1])]; tensor var_7270_keep_dims_0 = const()[name = tensor("op_7270_keep_dims_0"), val = tensor(true)]; tensor var_7270_cast_fp16 = reduce_mean(axes = var_7270_axes_0, keep_dims = var_7270_keep_dims_0, x = var_7268_cast_fp16)[name = tensor("op_7270_cast_fp16")]; tensor var_7271_to_fp16 = const()[name = tensor("op_7271_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_7272_cast_fp16 = add(x = var_7270_cast_fp16, y = var_7271_to_fp16)[name = tensor("op_7272_cast_fp16")]; tensor var_7273_epsilon_0 = const()[name = tensor("op_7273_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_7273_cast_fp16 = rsqrt(epsilon = var_7273_epsilon_0, x = var_7272_cast_fp16)[name = tensor("op_7273_cast_fp16")]; tensor output_785_cast_fp16 = mul(x = x_783, y = var_7273_cast_fp16)[name = tensor("output_785_cast_fp16")]; tensor var_7277_to_fp16 = const()[name = tensor("op_7277_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940902208)))]; tensor output_787_cast_fp16 = mul(x = output_785_cast_fp16, y = var_7277_to_fp16)[name = tensor("output_787_cast_fp16")]; tensor input_393 = linear(bias = linear_4_bias_0, weight = wrapped_model_language_model_layers_32_mlp_gate_proj_weight_palettized, x = output_787_cast_fp16)[name = tensor("linear_228")]; tensor var_7285_mode_0 = const()[name = tensor("op_7285_mode_0"), val = tensor("TANH_APPROXIMATION")]; tensor var_7285 = gelu(mode = var_7285_mode_0, x = input_393)[name = tensor("op_7285")]; tensor var_7287 = linear(bias = linear_4_bias_0, weight = wrapped_model_language_model_layers_32_mlp_up_proj_weight_palettized, x = output_787_cast_fp16)[name = tensor("linear_229")]; tensor input_395 = mul(x = var_7285, y = var_7287)[name = tensor("input_395")]; tensor x_787 = linear(bias = linear_3_bias_0, weight = wrapped_model_language_model_layers_32_mlp_down_proj_weight_palettized, x = input_395)[name = tensor("linear_230")]; tensor var_22_promoted_197_to_fp16 = const()[name = tensor("op_22_promoted_197_to_fp16"), val = tensor(0x1p+1)]; tensor var_7293_cast_fp16 = pow(x = x_787, y = var_22_promoted_197_to_fp16)[name = tensor("op_7293_cast_fp16")]; tensor var_7295_axes_0 = const()[name = tensor("op_7295_axes_0"), val = tensor([-1])]; tensor var_7295_keep_dims_0 = const()[name = tensor("op_7295_keep_dims_0"), val = tensor(true)]; tensor var_7295_cast_fp16 = reduce_mean(axes = var_7295_axes_0, keep_dims = var_7295_keep_dims_0, x = var_7293_cast_fp16)[name = tensor("op_7295_cast_fp16")]; tensor var_7296_to_fp16 = const()[name = tensor("op_7296_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_7297_cast_fp16 = add(x = var_7295_cast_fp16, y = var_7296_to_fp16)[name = tensor("op_7297_cast_fp16")]; tensor var_7298_epsilon_0 = const()[name = tensor("op_7298_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_7298_cast_fp16 = rsqrt(epsilon = var_7298_epsilon_0, x = var_7297_cast_fp16)[name = tensor("op_7298_cast_fp16")]; tensor output_789_cast_fp16 = mul(x = x_787, y = var_7298_cast_fp16)[name = tensor("output_789_cast_fp16")]; tensor var_7302_to_fp16 = const()[name = tensor("op_7302_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940907392)))]; tensor output_791_cast_fp16 = mul(x = output_789_cast_fp16, y = var_7302_to_fp16)[name = tensor("output_791_cast_fp16")]; tensor x_791 = add(x = x_783, y = output_791_cast_fp16)[name = tensor("x_791")]; tensor var_22_promoted_198_to_fp16 = const()[name = tensor("op_22_promoted_198_to_fp16"), val = tensor(0x1p+1)]; tensor var_7314_cast_fp16 = pow(x = x_791, y = var_22_promoted_198_to_fp16)[name = tensor("op_7314_cast_fp16")]; tensor var_7316_axes_0 = const()[name = tensor("op_7316_axes_0"), val = tensor([-1])]; tensor var_7316_keep_dims_0 = const()[name = tensor("op_7316_keep_dims_0"), val = tensor(true)]; tensor var_7316_cast_fp16 = reduce_mean(axes = var_7316_axes_0, keep_dims = var_7316_keep_dims_0, x = var_7314_cast_fp16)[name = tensor("op_7316_cast_fp16")]; tensor var_7317_to_fp16 = const()[name = tensor("op_7317_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_7318_cast_fp16 = add(x = var_7316_cast_fp16, y = var_7317_to_fp16)[name = tensor("op_7318_cast_fp16")]; tensor var_7319_epsilon_0 = const()[name = tensor("op_7319_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_7319_cast_fp16 = rsqrt(epsilon = var_7319_epsilon_0, x = var_7318_cast_fp16)[name = tensor("op_7319_cast_fp16")]; tensor output_793_cast_fp16 = mul(x = x_791, y = var_7319_cast_fp16)[name = tensor("output_793_cast_fp16")]; tensor var_7323_to_fp16 = const()[name = tensor("op_7323_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940912576)))]; tensor output_795_cast_fp16 = mul(x = output_793_cast_fp16, y = var_7323_to_fp16)[name = tensor("output_795_cast_fp16")]; tensor var_7335 = linear(bias = linear_0_bias_0, weight = wrapped_model_language_model_layers_33_self_attn_q_proj_weight_palettized, x = output_795_cast_fp16)[name = tensor("linear_231")]; tensor var_7336 = const()[name = tensor("op_7336"), val = tensor([1, 256, -1, 256])]; tensor var_7337 = reshape(shape = var_7336, x = var_7335)[name = tensor("op_7337")]; tensor x_795_perm_0 = const()[name = tensor("x_795_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_7340 = linear(bias = linear_1_bias_0, weight = wrapped_model_language_model_layers_33_self_attn_k_proj_weight_palettized, x = output_795_cast_fp16)[name = tensor("linear_232")]; tensor var_7341 = const()[name = tensor("op_7341"), val = tensor([1, 256, -1, 256])]; tensor var_7342 = reshape(shape = var_7341, x = var_7340)[name = tensor("op_7342")]; tensor x_799_perm_0 = const()[name = tensor("x_799_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_7345 = linear(bias = linear_1_bias_0, weight = wrapped_model_language_model_layers_33_self_attn_v_proj_weight_palettized, x = output_795_cast_fp16)[name = tensor("linear_233")]; tensor var_7346 = const()[name = tensor("op_7346"), val = tensor([1, 256, -1, 256])]; tensor var_7347 = reshape(shape = var_7346, x = var_7345)[name = tensor("op_7347")]; tensor hidden_states_469_perm_0 = const()[name = tensor("hidden_states_469_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_22_promoted_199_to_fp16 = const()[name = tensor("op_22_promoted_199_to_fp16"), val = tensor(0x1p+1)]; tensor x_795 = transpose(perm = x_795_perm_0, x = var_7337)[name = tensor("transpose_3")]; tensor var_7351_cast_fp16 = pow(x = x_795, y = var_22_promoted_199_to_fp16)[name = tensor("op_7351_cast_fp16")]; tensor var_7353_axes_0 = const()[name = tensor("op_7353_axes_0"), val = tensor([-1])]; tensor var_7353_keep_dims_0 = const()[name = tensor("op_7353_keep_dims_0"), val = tensor(true)]; tensor var_7353_cast_fp16 = reduce_mean(axes = var_7353_axes_0, keep_dims = var_7353_keep_dims_0, x = var_7351_cast_fp16)[name = tensor("op_7353_cast_fp16")]; tensor var_7354_to_fp16 = const()[name = tensor("op_7354_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_7355_cast_fp16 = add(x = var_7353_cast_fp16, y = var_7354_to_fp16)[name = tensor("op_7355_cast_fp16")]; tensor var_7356_epsilon_0 = const()[name = tensor("op_7356_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_7356_cast_fp16 = rsqrt(epsilon = var_7356_epsilon_0, x = var_7355_cast_fp16)[name = tensor("op_7356_cast_fp16")]; tensor output_797_cast_fp16 = mul(x = x_795, y = var_7356_cast_fp16)[name = tensor("output_797_cast_fp16")]; tensor var_7360_to_fp16 = const()[name = tensor("op_7360_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940917760)))]; tensor output_799_cast_fp16 = mul(x = output_797_cast_fp16, y = var_7360_to_fp16)[name = tensor("output_799_cast_fp16")]; tensor var_22_promoted_200_to_fp16 = const()[name = tensor("op_22_promoted_200_to_fp16"), val = tensor(0x1p+1)]; tensor x_799 = transpose(perm = x_799_perm_0, x = var_7342)[name = tensor("transpose_2")]; tensor var_7365_cast_fp16 = pow(x = x_799, y = var_22_promoted_200_to_fp16)[name = tensor("op_7365_cast_fp16")]; tensor var_7367_axes_0 = const()[name = tensor("op_7367_axes_0"), val = tensor([-1])]; tensor var_7367_keep_dims_0 = const()[name = tensor("op_7367_keep_dims_0"), val = tensor(true)]; tensor var_7367_cast_fp16 = reduce_mean(axes = var_7367_axes_0, keep_dims = var_7367_keep_dims_0, x = var_7365_cast_fp16)[name = tensor("op_7367_cast_fp16")]; tensor var_7368_to_fp16 = const()[name = tensor("op_7368_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_7369_cast_fp16 = add(x = var_7367_cast_fp16, y = var_7368_to_fp16)[name = tensor("op_7369_cast_fp16")]; tensor var_7370_epsilon_0 = const()[name = tensor("op_7370_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_7370_cast_fp16 = rsqrt(epsilon = var_7370_epsilon_0, x = var_7369_cast_fp16)[name = tensor("op_7370_cast_fp16")]; tensor output_801_cast_fp16 = mul(x = x_799, y = var_7370_cast_fp16)[name = tensor("output_801_cast_fp16")]; tensor var_7374_to_fp16 = const()[name = tensor("op_7374_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940918336)))]; tensor output_803_cast_fp16 = mul(x = output_801_cast_fp16, y = var_7374_to_fp16)[name = tensor("output_803_cast_fp16")]; tensor var_7379 = mul(x = output_799_cast_fp16, y = cos_7_palettized)[name = tensor("op_7379")]; tensor x1_133_begin_0 = const()[name = tensor("x1_133_begin_0"), val = tensor([0, 0, 0, 0])]; tensor x1_133_end_0 = const()[name = tensor("x1_133_end_0"), val = tensor([1, 8, 256, 128])]; tensor x1_133_end_mask_0 = const()[name = tensor("x1_133_end_mask_0"), val = tensor([true, true, true, false])]; tensor x1_133 = slice_by_index(begin = x1_133_begin_0, end = x1_133_end_0, end_mask = x1_133_end_mask_0, x = output_799_cast_fp16)[name = tensor("x1_133")]; tensor x2_133_begin_0 = const()[name = tensor("x2_133_begin_0"), val = tensor([0, 0, 0, 128])]; tensor x2_133_end_0 = const()[name = tensor("x2_133_end_0"), val = tensor([1, 8, 256, 256])]; tensor x2_133_end_mask_0 = const()[name = tensor("x2_133_end_mask_0"), val = tensor([true, true, true, true])]; tensor x2_133 = slice_by_index(begin = x2_133_begin_0, end = x2_133_end_0, end_mask = x2_133_end_mask_0, x = output_799_cast_fp16)[name = tensor("x2_133")]; tensor const_794_promoted = const()[name = tensor("const_794_promoted"), val = tensor(-0x1p+0)]; tensor var_7390 = mul(x = x2_133, y = const_794_promoted)[name = tensor("op_7390")]; tensor var_7392_interleave_0 = const()[name = tensor("op_7392_interleave_0"), val = tensor(false)]; tensor var_7392 = concat(axis = var_24, interleave = var_7392_interleave_0, values = (var_7390, x1_133))[name = tensor("op_7392")]; tensor var_7393 = mul(x = var_7392, y = sin_7_palettized)[name = tensor("op_7393")]; tensor query = add(x = var_7379, y = var_7393)[name = tensor("query")]; tensor var_7395 = mul(x = output_803_cast_fp16, y = cos_7_palettized)[name = tensor("op_7395")]; tensor x1_begin_0 = const()[name = tensor("x1_begin_0"), val = tensor([0, 0, 0, 0])]; tensor x1_end_0 = const()[name = tensor("x1_end_0"), val = tensor([1, 4, 256, 128])]; tensor x1_end_mask_0 = const()[name = tensor("x1_end_mask_0"), val = tensor([true, true, true, false])]; tensor x1 = slice_by_index(begin = x1_begin_0, end = x1_end_0, end_mask = x1_end_mask_0, x = output_803_cast_fp16)[name = tensor("x1")]; tensor x2_begin_0 = const()[name = tensor("x2_begin_0"), val = tensor([0, 0, 0, 128])]; tensor x2_end_0 = const()[name = tensor("x2_end_0"), val = tensor([1, 4, 256, 256])]; tensor x2_end_mask_0 = const()[name = tensor("x2_end_mask_0"), val = tensor([true, true, true, true])]; tensor x2 = slice_by_index(begin = x2_begin_0, end = x2_end_0, end_mask = x2_end_mask_0, x = output_803_cast_fp16)[name = tensor("x2")]; tensor const_797_promoted = const()[name = tensor("const_797_promoted"), val = tensor(-0x1p+0)]; tensor var_7406 = mul(x = x2, y = const_797_promoted)[name = tensor("op_7406")]; tensor var_7408_interleave_0 = const()[name = tensor("op_7408_interleave_0"), val = tensor(false)]; tensor var_7408 = concat(axis = var_24, interleave = var_7408_interleave_0, values = (var_7406, x1))[name = tensor("op_7408")]; tensor var_7409 = mul(x = var_7408, y = sin_7_palettized)[name = tensor("op_7409")]; tensor hidden_states_465 = add(x = var_7395, y = var_7409)[name = tensor("hidden_states_465")]; tensor var_7418_axes_0 = const()[name = tensor("op_7418_axes_0"), val = tensor([2])]; tensor var_7418 = expand_dims(axes = var_7418_axes_0, x = hidden_states_465)[name = tensor("op_7418")]; tensor hidden_states_467_reps_0 = const()[name = tensor("hidden_states_467_reps_0"), val = tensor([1, 1, 2, 1, 1])]; tensor hidden_states_467 = tile(reps = hidden_states_467_reps_0, x = var_7418)[name = tensor("hidden_states_467")]; tensor var_7426 = const()[name = tensor("op_7426"), val = tensor([1, 8, 256, 256])]; tensor key_states = reshape(shape = var_7426, x = hidden_states_467)[name = tensor("key_states")]; tensor var_7435_axes_0 = const()[name = tensor("op_7435_axes_0"), val = tensor([2])]; tensor hidden_states_469 = transpose(perm = hidden_states_469_perm_0, x = var_7347)[name = tensor("transpose_1")]; tensor var_7435 = expand_dims(axes = var_7435_axes_0, x = hidden_states_469)[name = tensor("op_7435")]; tensor hidden_states_471_reps_0 = const()[name = tensor("hidden_states_471_reps_0"), val = tensor([1, 1, 2, 1, 1])]; tensor hidden_states_471 = tile(reps = hidden_states_471_reps_0, x = var_7435)[name = tensor("hidden_states_471")]; tensor var_7443 = const()[name = tensor("op_7443"), val = tensor([1, 8, 256, 256])]; tensor value_states = reshape(shape = var_7443, x = hidden_states_471)[name = tensor("value_states")]; tensor var_7446_transpose_x_1 = const()[name = tensor("op_7446_transpose_x_1"), val = tensor(false)]; tensor var_7446_transpose_y_1 = const()[name = tensor("op_7446_transpose_y_1"), val = tensor(true)]; tensor var_7446 = matmul(transpose_x = var_7446_transpose_x_1, transpose_y = var_7446_transpose_y_1, x = query, y = key_states)[name = tensor("op_7446")]; tensor var_7447_to_fp16 = const()[name = tensor("op_7447_to_fp16"), val = tensor(0x1p-4)]; tensor attn_weights_133_cast_fp16 = mul(x = var_7446, y = var_7447_to_fp16)[name = tensor("attn_weights_133_cast_fp16")]; tensor input_397_cast_fp16 = add(x = attn_weights_133_cast_fp16, y = attention_mask_to_fp16_palettized)[name = tensor("input_397_cast_fp16")]; tensor var_7455_cast_fp16 = softmax(axis = var_24, x = input_397_cast_fp16)[name = tensor("op_7455_cast_fp16")]; tensor attn_output_133_transpose_x_0 = const()[name = tensor("attn_output_133_transpose_x_0"), val = tensor(false)]; tensor attn_output_133_transpose_y_0 = const()[name = tensor("attn_output_133_transpose_y_0"), val = tensor(false)]; tensor attn_output_133 = matmul(transpose_x = attn_output_133_transpose_x_0, transpose_y = attn_output_133_transpose_y_0, x = var_7455_cast_fp16, y = value_states)[name = tensor("attn_output_133")]; tensor var_7459_perm_0 = const()[name = tensor("op_7459_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_7461 = const()[name = tensor("op_7461"), val = tensor([1, 256, -1])]; tensor var_7459 = transpose(perm = var_7459_perm_0, x = attn_output_133)[name = tensor("transpose_0")]; tensor var_7462 = reshape(shape = var_7461, x = var_7459)[name = tensor("op_7462")]; tensor x_803 = linear(bias = linear_3_bias_0, weight = wrapped_model_language_model_layers_33_self_attn_o_proj_weight_palettized, x = var_7462)[name = tensor("linear_234")]; tensor var_22_promoted_201_to_fp16 = const()[name = tensor("op_22_promoted_201_to_fp16"), val = tensor(0x1p+1)]; tensor var_7468_cast_fp16 = pow(x = x_803, y = var_22_promoted_201_to_fp16)[name = tensor("op_7468_cast_fp16")]; tensor var_7470_axes_0 = const()[name = tensor("op_7470_axes_0"), val = tensor([-1])]; tensor var_7470_keep_dims_0 = const()[name = tensor("op_7470_keep_dims_0"), val = tensor(true)]; tensor var_7470_cast_fp16 = reduce_mean(axes = var_7470_axes_0, keep_dims = var_7470_keep_dims_0, x = var_7468_cast_fp16)[name = tensor("op_7470_cast_fp16")]; tensor var_7471_to_fp16 = const()[name = tensor("op_7471_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_7472_cast_fp16 = add(x = var_7470_cast_fp16, y = var_7471_to_fp16)[name = tensor("op_7472_cast_fp16")]; tensor var_7473_epsilon_0 = const()[name = tensor("op_7473_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_7473_cast_fp16 = rsqrt(epsilon = var_7473_epsilon_0, x = var_7472_cast_fp16)[name = tensor("op_7473_cast_fp16")]; tensor output_805_cast_fp16 = mul(x = x_803, y = var_7473_cast_fp16)[name = tensor("output_805_cast_fp16")]; tensor var_7477_to_fp16 = const()[name = tensor("op_7477_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940918912)))]; tensor output_807_cast_fp16 = mul(x = output_805_cast_fp16, y = var_7477_to_fp16)[name = tensor("output_807_cast_fp16")]; tensor x_807 = add(x = x_791, y = output_807_cast_fp16)[name = tensor("x_807")]; tensor var_22_promoted_202_to_fp16 = const()[name = tensor("op_22_promoted_202_to_fp16"), val = tensor(0x1p+1)]; tensor var_7483_cast_fp16 = pow(x = x_807, y = var_22_promoted_202_to_fp16)[name = tensor("op_7483_cast_fp16")]; tensor var_7485_axes_0 = const()[name = tensor("op_7485_axes_0"), val = tensor([-1])]; tensor var_7485_keep_dims_0 = const()[name = tensor("op_7485_keep_dims_0"), val = tensor(true)]; tensor var_7485_cast_fp16 = reduce_mean(axes = var_7485_axes_0, keep_dims = var_7485_keep_dims_0, x = var_7483_cast_fp16)[name = tensor("op_7485_cast_fp16")]; tensor var_7486_to_fp16 = const()[name = tensor("op_7486_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_7487_cast_fp16 = add(x = var_7485_cast_fp16, y = var_7486_to_fp16)[name = tensor("op_7487_cast_fp16")]; tensor var_7488_epsilon_0 = const()[name = tensor("op_7488_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_7488_cast_fp16 = rsqrt(epsilon = var_7488_epsilon_0, x = var_7487_cast_fp16)[name = tensor("op_7488_cast_fp16")]; tensor output_809_cast_fp16 = mul(x = x_807, y = var_7488_cast_fp16)[name = tensor("output_809_cast_fp16")]; tensor var_7492_to_fp16 = const()[name = tensor("op_7492_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940924096)))]; tensor output_811_cast_fp16 = mul(x = output_809_cast_fp16, y = var_7492_to_fp16)[name = tensor("output_811_cast_fp16")]; tensor input_405 = linear(bias = linear_4_bias_0, weight = wrapped_model_language_model_layers_33_mlp_gate_proj_weight_palettized, x = output_811_cast_fp16)[name = tensor("linear_235")]; tensor var_7500_mode_0 = const()[name = tensor("op_7500_mode_0"), val = tensor("TANH_APPROXIMATION")]; tensor var_7500 = gelu(mode = var_7500_mode_0, x = input_405)[name = tensor("op_7500")]; tensor var_7502 = linear(bias = linear_4_bias_0, weight = wrapped_model_language_model_layers_33_mlp_up_proj_weight_palettized, x = output_811_cast_fp16)[name = tensor("linear_236")]; tensor input_407 = mul(x = var_7500, y = var_7502)[name = tensor("input_407")]; tensor x_811 = linear(bias = linear_3_bias_0, weight = wrapped_model_language_model_layers_33_mlp_down_proj_weight_palettized, x = input_407)[name = tensor("linear_237")]; tensor var_22_promoted_203_to_fp16 = const()[name = tensor("op_22_promoted_203_to_fp16"), val = tensor(0x1p+1)]; tensor var_7508_cast_fp16 = pow(x = x_811, y = var_22_promoted_203_to_fp16)[name = tensor("op_7508_cast_fp16")]; tensor var_7510_axes_0 = const()[name = tensor("op_7510_axes_0"), val = tensor([-1])]; tensor var_7510_keep_dims_0 = const()[name = tensor("op_7510_keep_dims_0"), val = tensor(true)]; tensor var_7510_cast_fp16 = reduce_mean(axes = var_7510_axes_0, keep_dims = var_7510_keep_dims_0, x = var_7508_cast_fp16)[name = tensor("op_7510_cast_fp16")]; tensor var_7511_to_fp16 = const()[name = tensor("op_7511_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_7512_cast_fp16 = add(x = var_7510_cast_fp16, y = var_7511_to_fp16)[name = tensor("op_7512_cast_fp16")]; tensor var_7513_epsilon_0 = const()[name = tensor("op_7513_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_7513_cast_fp16 = rsqrt(epsilon = var_7513_epsilon_0, x = var_7512_cast_fp16)[name = tensor("op_7513_cast_fp16")]; tensor output_813_cast_fp16 = mul(x = x_811, y = var_7513_cast_fp16)[name = tensor("output_813_cast_fp16")]; tensor var_7517_to_fp16 = const()[name = tensor("op_7517_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940929280)))]; tensor output_815_cast_fp16 = mul(x = output_813_cast_fp16, y = var_7517_to_fp16)[name = tensor("output_815_cast_fp16")]; tensor x_815 = add(x = x_807, y = output_815_cast_fp16)[name = tensor("x_815")]; tensor var_22_promoted_204_to_fp16 = const()[name = tensor("op_22_promoted_204_to_fp16"), val = tensor(0x1p+1)]; tensor var_7523_cast_fp16 = pow(x = x_815, y = var_22_promoted_204_to_fp16)[name = tensor("op_7523_cast_fp16")]; tensor var_7525_axes_0 = const()[name = tensor("op_7525_axes_0"), val = tensor([-1])]; tensor var_7525_keep_dims_0 = const()[name = tensor("op_7525_keep_dims_0"), val = tensor(true)]; tensor var_7525_cast_fp16 = reduce_mean(axes = var_7525_axes_0, keep_dims = var_7525_keep_dims_0, x = var_7523_cast_fp16)[name = tensor("op_7525_cast_fp16")]; tensor var_7526_to_fp16 = const()[name = tensor("op_7526_to_fp16"), val = tensor(0x1.1p-20)]; tensor var_7527_cast_fp16 = add(x = var_7525_cast_fp16, y = var_7526_to_fp16)[name = tensor("op_7527_cast_fp16")]; tensor var_7528_epsilon_0 = const()[name = tensor("op_7528_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor var_7528_cast_fp16 = rsqrt(epsilon = var_7528_epsilon_0, x = var_7527_cast_fp16)[name = tensor("op_7528_cast_fp16")]; tensor output_817_cast_fp16 = mul(x = x_815, y = var_7528_cast_fp16)[name = tensor("output_817_cast_fp16")]; tensor var_7532_to_fp16 = const()[name = tensor("op_7532_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940934464)))]; tensor output_cast_fp16 = mul(x = output_817_cast_fp16, y = var_7532_to_fp16)[name = tensor("output_cast_fp16")]; tensor linear_238_bias_0 = const()[name = tensor("linear_238_bias_0"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1940939648)))]; tensor logits = linear(bias = linear_238_bias_0, weight = wrapped_model_language_model_embed_tokens_weight_palettized, x = output_cast_fp16)[name = tensor("linear_238")]; } -> (logits); }