| { | |
| "transformer.context_embedder.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 4096 | |
| ], | |
| "data_offsets": [ | |
| 0, | |
| 1048576 | |
| ] | |
| }, | |
| "transformer.context_embedder.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1048576, | |
| 1835008 | |
| ] | |
| }, | |
| "transformer.norm_out.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1835008, | |
| 2621440 | |
| ] | |
| }, | |
| "transformer.norm_out.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 6144, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 2621440, | |
| 4194304 | |
| ] | |
| }, | |
| "transformer.proj_out.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 4194304, | |
| 4980736 | |
| ] | |
| }, | |
| "transformer.proj_out.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 4980736, | |
| 4997120 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.0.attn.to_k.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 4997120, | |
| 5783552 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.0.attn.to_k.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 5783552, | |
| 6569984 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.0.attn.to_q.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 6569984, | |
| 7356416 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.0.attn.to_q.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 7356416, | |
| 8142848 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.0.attn.to_v.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 8142848, | |
| 8929280 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.0.attn.to_v.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 8929280, | |
| 9715712 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.0.norm.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 9715712, | |
| 10502144 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.0.norm.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 9216, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 10502144, | |
| 12861440 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.0.proj_mlp.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 12861440, | |
| 13647872 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.0.proj_mlp.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 12288, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 13647872, | |
| 16793600 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.0.proj_out.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 15360 | |
| ], | |
| "data_offsets": [ | |
| 16793600, | |
| 20725760 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.0.proj_out.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 20725760, | |
| 21512192 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.1.attn.to_k.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 21512192, | |
| 22298624 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.1.attn.to_k.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 22298624, | |
| 23085056 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.1.attn.to_q.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 23085056, | |
| 23871488 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.1.attn.to_q.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 23871488, | |
| 24657920 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.1.attn.to_v.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 24657920, | |
| 25444352 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.1.attn.to_v.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 25444352, | |
| 26230784 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.1.norm.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 26230784, | |
| 27017216 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.1.norm.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 9216, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 27017216, | |
| 29376512 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.1.proj_mlp.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 29376512, | |
| 30162944 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.1.proj_mlp.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 12288, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 30162944, | |
| 33308672 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.1.proj_out.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 15360 | |
| ], | |
| "data_offsets": [ | |
| 33308672, | |
| 37240832 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.1.proj_out.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 37240832, | |
| 38027264 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.10.attn.to_k.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 38027264, | |
| 38813696 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.10.attn.to_k.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 38813696, | |
| 39600128 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.10.attn.to_q.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 39600128, | |
| 40386560 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.10.attn.to_q.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 40386560, | |
| 41172992 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.10.attn.to_v.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 41172992, | |
| 41959424 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.10.attn.to_v.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 41959424, | |
| 42745856 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.10.norm.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 42745856, | |
| 43532288 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.10.norm.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 9216, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 43532288, | |
| 45891584 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.10.proj_mlp.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 45891584, | |
| 46678016 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.10.proj_mlp.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 12288, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 46678016, | |
| 49823744 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.10.proj_out.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 15360 | |
| ], | |
| "data_offsets": [ | |
| 49823744, | |
| 53755904 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.10.proj_out.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 53755904, | |
| 54542336 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.11.attn.to_k.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 54542336, | |
| 55328768 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.11.attn.to_k.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 55328768, | |
| 56115200 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.11.attn.to_q.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 56115200, | |
| 56901632 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.11.attn.to_q.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 56901632, | |
| 57688064 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.11.attn.to_v.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 57688064, | |
| 58474496 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.11.attn.to_v.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 58474496, | |
| 59260928 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.11.norm.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 59260928, | |
| 60047360 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.11.norm.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 9216, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 60047360, | |
| 62406656 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.11.proj_mlp.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 62406656, | |
| 63193088 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.11.proj_mlp.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 12288, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 63193088, | |
| 66338816 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.11.proj_out.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 15360 | |
| ], | |
| "data_offsets": [ | |
| 66338816, | |
| 70270976 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.11.proj_out.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 70270976, | |
| 71057408 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.12.attn.to_k.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 71057408, | |
| 71843840 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.12.attn.to_k.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 71843840, | |
| 72630272 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.12.attn.to_q.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 72630272, | |
| 73416704 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.12.attn.to_q.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 73416704, | |
| 74203136 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.12.attn.to_v.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 74203136, | |
| 74989568 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.12.attn.to_v.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 74989568, | |
| 75776000 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.12.norm.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 75776000, | |
| 76562432 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.12.norm.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 9216, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 76562432, | |
| 78921728 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.12.proj_mlp.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 78921728, | |
| 79708160 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.12.proj_mlp.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 12288, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 79708160, | |
| 82853888 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.12.proj_out.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 15360 | |
| ], | |
| "data_offsets": [ | |
| 82853888, | |
| 86786048 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.12.proj_out.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 86786048, | |
| 87572480 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.13.attn.to_k.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 87572480, | |
| 88358912 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.13.attn.to_k.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 88358912, | |
| 89145344 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.13.attn.to_q.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 89145344, | |
| 89931776 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.13.attn.to_q.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 89931776, | |
| 90718208 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.13.attn.to_v.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 90718208, | |
| 91504640 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.13.attn.to_v.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 91504640, | |
| 92291072 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.13.norm.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 92291072, | |
| 93077504 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.13.norm.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 9216, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 93077504, | |
| 95436800 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.13.proj_mlp.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 95436800, | |
| 96223232 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.13.proj_mlp.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 12288, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 96223232, | |
| 99368960 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.13.proj_out.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 15360 | |
| ], | |
| "data_offsets": [ | |
| 99368960, | |
| 103301120 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.13.proj_out.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 103301120, | |
| 104087552 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.14.attn.to_k.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 104087552, | |
| 104873984 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.14.attn.to_k.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 104873984, | |
| 105660416 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.14.attn.to_q.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 105660416, | |
| 106446848 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.14.attn.to_q.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 106446848, | |
| 107233280 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.14.attn.to_v.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 107233280, | |
| 108019712 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.14.attn.to_v.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 108019712, | |
| 108806144 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.14.norm.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 108806144, | |
| 109592576 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.14.norm.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 9216, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 109592576, | |
| 111951872 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.14.proj_mlp.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 111951872, | |
| 112738304 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.14.proj_mlp.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 12288, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 112738304, | |
| 115884032 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.14.proj_out.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 15360 | |
| ], | |
| "data_offsets": [ | |
| 115884032, | |
| 119816192 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.14.proj_out.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 119816192, | |
| 120602624 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.15.attn.to_k.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 120602624, | |
| 121389056 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.15.attn.to_k.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 121389056, | |
| 122175488 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.15.attn.to_q.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 122175488, | |
| 122961920 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.15.attn.to_q.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 122961920, | |
| 123748352 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.15.attn.to_v.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 123748352, | |
| 124534784 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.15.attn.to_v.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 124534784, | |
| 125321216 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.15.norm.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 125321216, | |
| 126107648 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.15.norm.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 9216, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 126107648, | |
| 128466944 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.15.proj_mlp.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 128466944, | |
| 129253376 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.15.proj_mlp.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 12288, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 129253376, | |
| 132399104 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.15.proj_out.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 15360 | |
| ], | |
| "data_offsets": [ | |
| 132399104, | |
| 136331264 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.15.proj_out.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 136331264, | |
| 137117696 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.16.attn.to_k.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 137117696, | |
| 137904128 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.16.attn.to_k.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 137904128, | |
| 138690560 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.16.attn.to_q.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 138690560, | |
| 139476992 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.16.attn.to_q.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 139476992, | |
| 140263424 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.16.attn.to_v.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 140263424, | |
| 141049856 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.16.attn.to_v.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 141049856, | |
| 141836288 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.16.norm.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 141836288, | |
| 142622720 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.16.norm.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 9216, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 142622720, | |
| 144982016 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.16.proj_mlp.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 144982016, | |
| 145768448 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.16.proj_mlp.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 12288, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 145768448, | |
| 148914176 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.16.proj_out.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 15360 | |
| ], | |
| "data_offsets": [ | |
| 148914176, | |
| 152846336 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.16.proj_out.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 152846336, | |
| 153632768 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.17.attn.to_k.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 153632768, | |
| 154419200 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.17.attn.to_k.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 154419200, | |
| 155205632 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.17.attn.to_q.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 155205632, | |
| 155992064 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.17.attn.to_q.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 155992064, | |
| 156778496 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.17.attn.to_v.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 156778496, | |
| 157564928 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.17.attn.to_v.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 157564928, | |
| 158351360 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.17.norm.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 158351360, | |
| 159137792 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.17.norm.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 9216, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 159137792, | |
| 161497088 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.17.proj_mlp.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 161497088, | |
| 162283520 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.17.proj_mlp.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 12288, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 162283520, | |
| 165429248 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.17.proj_out.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 15360 | |
| ], | |
| "data_offsets": [ | |
| 165429248, | |
| 169361408 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.17.proj_out.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 169361408, | |
| 170147840 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.18.attn.to_k.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 170147840, | |
| 170934272 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.18.attn.to_k.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 170934272, | |
| 171720704 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.18.attn.to_q.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 171720704, | |
| 172507136 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.18.attn.to_q.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 172507136, | |
| 173293568 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.18.attn.to_v.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 173293568, | |
| 174080000 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.18.attn.to_v.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 174080000, | |
| 174866432 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.18.norm.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 174866432, | |
| 175652864 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.18.norm.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 9216, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 175652864, | |
| 178012160 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.18.proj_mlp.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 178012160, | |
| 178798592 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.18.proj_mlp.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 12288, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 178798592, | |
| 181944320 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.18.proj_out.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 15360 | |
| ], | |
| "data_offsets": [ | |
| 181944320, | |
| 185876480 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.18.proj_out.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 185876480, | |
| 186662912 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.19.attn.to_k.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 186662912, | |
| 187449344 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.19.attn.to_k.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 187449344, | |
| 188235776 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.19.attn.to_q.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 188235776, | |
| 189022208 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.19.attn.to_q.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 189022208, | |
| 189808640 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.19.attn.to_v.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 189808640, | |
| 190595072 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.19.attn.to_v.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 190595072, | |
| 191381504 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.19.norm.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 191381504, | |
| 192167936 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.19.norm.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 9216, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 192167936, | |
| 194527232 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.19.proj_mlp.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 194527232, | |
| 195313664 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.19.proj_mlp.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 12288, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 195313664, | |
| 198459392 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.19.proj_out.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 15360 | |
| ], | |
| "data_offsets": [ | |
| 198459392, | |
| 202391552 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.19.proj_out.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 202391552, | |
| 203177984 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.2.attn.to_k.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 203177984, | |
| 203964416 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.2.attn.to_k.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 203964416, | |
| 204750848 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.2.attn.to_q.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 204750848, | |
| 205537280 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.2.attn.to_q.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 205537280, | |
| 206323712 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.2.attn.to_v.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 206323712, | |
| 207110144 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.2.attn.to_v.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 207110144, | |
| 207896576 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.2.norm.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 207896576, | |
| 208683008 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.2.norm.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 9216, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 208683008, | |
| 211042304 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.2.proj_mlp.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 211042304, | |
| 211828736 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.2.proj_mlp.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 12288, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 211828736, | |
| 214974464 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.2.proj_out.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 15360 | |
| ], | |
| "data_offsets": [ | |
| 214974464, | |
| 218906624 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.2.proj_out.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 218906624, | |
| 219693056 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.20.attn.to_k.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 219693056, | |
| 220479488 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.20.attn.to_k.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 220479488, | |
| 221265920 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.20.attn.to_q.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 221265920, | |
| 222052352 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.20.attn.to_q.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 222052352, | |
| 222838784 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.20.attn.to_v.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 222838784, | |
| 223625216 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.20.attn.to_v.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 223625216, | |
| 224411648 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.20.norm.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 224411648, | |
| 225198080 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.20.norm.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 9216, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 225198080, | |
| 227557376 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.20.proj_mlp.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 227557376, | |
| 228343808 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.20.proj_mlp.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 12288, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 228343808, | |
| 231489536 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.20.proj_out.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 15360 | |
| ], | |
| "data_offsets": [ | |
| 231489536, | |
| 235421696 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.20.proj_out.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 235421696, | |
| 236208128 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.21.attn.to_k.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 236208128, | |
| 236994560 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.21.attn.to_k.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 236994560, | |
| 237780992 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.21.attn.to_q.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 237780992, | |
| 238567424 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.21.attn.to_q.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 238567424, | |
| 239353856 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.21.attn.to_v.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 239353856, | |
| 240140288 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.21.attn.to_v.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 240140288, | |
| 240926720 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.21.norm.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 240926720, | |
| 241713152 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.21.norm.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 9216, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 241713152, | |
| 244072448 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.21.proj_mlp.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 244072448, | |
| 244858880 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.21.proj_mlp.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 12288, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 244858880, | |
| 248004608 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.21.proj_out.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 15360 | |
| ], | |
| "data_offsets": [ | |
| 248004608, | |
| 251936768 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.21.proj_out.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 251936768, | |
| 252723200 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.22.attn.to_k.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 252723200, | |
| 253509632 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.22.attn.to_k.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 253509632, | |
| 254296064 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.22.attn.to_q.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 254296064, | |
| 255082496 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.22.attn.to_q.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 255082496, | |
| 255868928 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.22.attn.to_v.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 255868928, | |
| 256655360 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.22.attn.to_v.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 256655360, | |
| 257441792 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.22.norm.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 257441792, | |
| 258228224 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.22.norm.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 9216, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 258228224, | |
| 260587520 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.22.proj_mlp.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 260587520, | |
| 261373952 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.22.proj_mlp.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 12288, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 261373952, | |
| 264519680 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.22.proj_out.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 15360 | |
| ], | |
| "data_offsets": [ | |
| 264519680, | |
| 268451840 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.22.proj_out.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 268451840, | |
| 269238272 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.23.attn.to_k.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 269238272, | |
| 270024704 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.23.attn.to_k.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 270024704, | |
| 270811136 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.23.attn.to_q.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 270811136, | |
| 271597568 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.23.attn.to_q.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 271597568, | |
| 272384000 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.23.attn.to_v.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 272384000, | |
| 273170432 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.23.attn.to_v.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 273170432, | |
| 273956864 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.23.norm.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 273956864, | |
| 274743296 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.23.norm.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 9216, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 274743296, | |
| 277102592 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.23.proj_mlp.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 277102592, | |
| 277889024 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.23.proj_mlp.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 12288, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 277889024, | |
| 281034752 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.23.proj_out.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 15360 | |
| ], | |
| "data_offsets": [ | |
| 281034752, | |
| 284966912 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.23.proj_out.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 284966912, | |
| 285753344 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.24.attn.to_k.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 285753344, | |
| 286539776 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.24.attn.to_k.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 286539776, | |
| 287326208 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.24.attn.to_q.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 287326208, | |
| 288112640 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.24.attn.to_q.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 288112640, | |
| 288899072 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.24.attn.to_v.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 288899072, | |
| 289685504 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.24.attn.to_v.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 289685504, | |
| 290471936 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.24.norm.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 290471936, | |
| 291258368 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.24.norm.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 9216, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 291258368, | |
| 293617664 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.24.proj_mlp.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 293617664, | |
| 294404096 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.24.proj_mlp.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 12288, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 294404096, | |
| 297549824 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.24.proj_out.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 15360 | |
| ], | |
| "data_offsets": [ | |
| 297549824, | |
| 301481984 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.24.proj_out.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 301481984, | |
| 302268416 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.25.attn.to_k.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 302268416, | |
| 303054848 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.25.attn.to_k.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 303054848, | |
| 303841280 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.25.attn.to_q.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 303841280, | |
| 304627712 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.25.attn.to_q.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 304627712, | |
| 305414144 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.25.attn.to_v.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 305414144, | |
| 306200576 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.25.attn.to_v.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 306200576, | |
| 306987008 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.25.norm.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 306987008, | |
| 307773440 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.25.norm.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 9216, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 307773440, | |
| 310132736 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.25.proj_mlp.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 310132736, | |
| 310919168 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.25.proj_mlp.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 12288, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 310919168, | |
| 314064896 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.25.proj_out.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 15360 | |
| ], | |
| "data_offsets": [ | |
| 314064896, | |
| 317997056 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.25.proj_out.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 317997056, | |
| 318783488 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.26.attn.to_k.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 318783488, | |
| 319569920 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.26.attn.to_k.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 319569920, | |
| 320356352 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.26.attn.to_q.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 320356352, | |
| 321142784 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.26.attn.to_q.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 321142784, | |
| 321929216 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.26.attn.to_v.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 321929216, | |
| 322715648 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.26.attn.to_v.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 322715648, | |
| 323502080 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.26.norm.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 323502080, | |
| 324288512 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.26.norm.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 9216, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 324288512, | |
| 326647808 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.26.proj_mlp.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 326647808, | |
| 327434240 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.26.proj_mlp.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 12288, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 327434240, | |
| 330579968 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.26.proj_out.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 15360 | |
| ], | |
| "data_offsets": [ | |
| 330579968, | |
| 334512128 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.26.proj_out.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 334512128, | |
| 335298560 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.27.attn.to_k.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 335298560, | |
| 336084992 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.27.attn.to_k.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 336084992, | |
| 336871424 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.27.attn.to_q.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 336871424, | |
| 337657856 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.27.attn.to_q.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 337657856, | |
| 338444288 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.27.attn.to_v.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 338444288, | |
| 339230720 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.27.attn.to_v.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 339230720, | |
| 340017152 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.27.norm.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 340017152, | |
| 340803584 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.27.norm.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 9216, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 340803584, | |
| 343162880 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.27.proj_mlp.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 343162880, | |
| 343949312 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.27.proj_mlp.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 12288, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 343949312, | |
| 347095040 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.27.proj_out.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 15360 | |
| ], | |
| "data_offsets": [ | |
| 347095040, | |
| 351027200 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.27.proj_out.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 351027200, | |
| 351813632 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.28.attn.to_k.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 351813632, | |
| 352600064 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.28.attn.to_k.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 352600064, | |
| 353386496 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.28.attn.to_q.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 353386496, | |
| 354172928 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.28.attn.to_q.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 354172928, | |
| 354959360 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.28.attn.to_v.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 354959360, | |
| 355745792 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.28.attn.to_v.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 355745792, | |
| 356532224 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.28.norm.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 356532224, | |
| 357318656 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.28.norm.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 9216, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 357318656, | |
| 359677952 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.28.proj_mlp.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 359677952, | |
| 360464384 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.28.proj_mlp.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 12288, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 360464384, | |
| 363610112 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.28.proj_out.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 15360 | |
| ], | |
| "data_offsets": [ | |
| 363610112, | |
| 367542272 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.28.proj_out.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 367542272, | |
| 368328704 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.29.attn.to_k.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 368328704, | |
| 369115136 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.29.attn.to_k.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 369115136, | |
| 369901568 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.29.attn.to_q.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 369901568, | |
| 370688000 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.29.attn.to_q.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 370688000, | |
| 371474432 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.29.attn.to_v.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 371474432, | |
| 372260864 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.29.attn.to_v.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 372260864, | |
| 373047296 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.29.norm.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 373047296, | |
| 373833728 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.29.norm.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 9216, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 373833728, | |
| 376193024 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.29.proj_mlp.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 376193024, | |
| 376979456 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.29.proj_mlp.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 12288, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 376979456, | |
| 380125184 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.29.proj_out.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 15360 | |
| ], | |
| "data_offsets": [ | |
| 380125184, | |
| 384057344 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.29.proj_out.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 384057344, | |
| 384843776 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.3.attn.to_k.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 384843776, | |
| 385630208 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.3.attn.to_k.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 385630208, | |
| 386416640 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.3.attn.to_q.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 386416640, | |
| 387203072 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.3.attn.to_q.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 387203072, | |
| 387989504 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.3.attn.to_v.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 387989504, | |
| 388775936 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.3.attn.to_v.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 388775936, | |
| 389562368 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.3.norm.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 389562368, | |
| 390348800 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.3.norm.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 9216, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 390348800, | |
| 392708096 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.3.proj_mlp.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 392708096, | |
| 393494528 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.3.proj_mlp.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 12288, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 393494528, | |
| 396640256 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.3.proj_out.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 15360 | |
| ], | |
| "data_offsets": [ | |
| 396640256, | |
| 400572416 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.3.proj_out.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 400572416, | |
| 401358848 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.30.attn.to_k.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 401358848, | |
| 402145280 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.30.attn.to_k.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 402145280, | |
| 402931712 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.30.attn.to_q.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 402931712, | |
| 403718144 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.30.attn.to_q.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 403718144, | |
| 404504576 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.30.attn.to_v.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 404504576, | |
| 405291008 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.30.attn.to_v.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 405291008, | |
| 406077440 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.30.norm.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 406077440, | |
| 406863872 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.30.norm.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 9216, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 406863872, | |
| 409223168 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.30.proj_mlp.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 409223168, | |
| 410009600 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.30.proj_mlp.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 12288, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 410009600, | |
| 413155328 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.30.proj_out.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 15360 | |
| ], | |
| "data_offsets": [ | |
| 413155328, | |
| 417087488 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.30.proj_out.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 417087488, | |
| 417873920 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.31.attn.to_k.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 417873920, | |
| 418660352 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.31.attn.to_k.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 418660352, | |
| 419446784 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.31.attn.to_q.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 419446784, | |
| 420233216 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.31.attn.to_q.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 420233216, | |
| 421019648 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.31.attn.to_v.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 421019648, | |
| 421806080 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.31.attn.to_v.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 421806080, | |
| 422592512 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.31.norm.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 422592512, | |
| 423378944 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.31.norm.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 9216, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 423378944, | |
| 425738240 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.31.proj_mlp.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 425738240, | |
| 426524672 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.31.proj_mlp.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 12288, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 426524672, | |
| 429670400 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.31.proj_out.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 15360 | |
| ], | |
| "data_offsets": [ | |
| 429670400, | |
| 433602560 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.31.proj_out.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 433602560, | |
| 434388992 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.32.attn.to_k.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 434388992, | |
| 435175424 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.32.attn.to_k.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 435175424, | |
| 435961856 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.32.attn.to_q.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 435961856, | |
| 436748288 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.32.attn.to_q.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 436748288, | |
| 437534720 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.32.attn.to_v.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 437534720, | |
| 438321152 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.32.attn.to_v.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 438321152, | |
| 439107584 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.32.norm.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 439107584, | |
| 439894016 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.32.norm.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 9216, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 439894016, | |
| 442253312 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.32.proj_mlp.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 442253312, | |
| 443039744 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.32.proj_mlp.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 12288, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 443039744, | |
| 446185472 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.32.proj_out.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 15360 | |
| ], | |
| "data_offsets": [ | |
| 446185472, | |
| 450117632 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.32.proj_out.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 450117632, | |
| 450904064 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.33.attn.to_k.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 450904064, | |
| 451690496 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.33.attn.to_k.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 451690496, | |
| 452476928 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.33.attn.to_q.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 452476928, | |
| 453263360 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.33.attn.to_q.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 453263360, | |
| 454049792 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.33.attn.to_v.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 454049792, | |
| 454836224 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.33.attn.to_v.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 454836224, | |
| 455622656 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.33.norm.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 455622656, | |
| 456409088 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.33.norm.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 9216, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 456409088, | |
| 458768384 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.33.proj_mlp.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 458768384, | |
| 459554816 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.33.proj_mlp.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 12288, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 459554816, | |
| 462700544 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.33.proj_out.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 15360 | |
| ], | |
| "data_offsets": [ | |
| 462700544, | |
| 466632704 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.33.proj_out.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 466632704, | |
| 467419136 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.34.attn.to_k.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 467419136, | |
| 468205568 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.34.attn.to_k.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 468205568, | |
| 468992000 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.34.attn.to_q.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 468992000, | |
| 469778432 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.34.attn.to_q.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 469778432, | |
| 470564864 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.34.attn.to_v.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 470564864, | |
| 471351296 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.34.attn.to_v.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 471351296, | |
| 472137728 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.34.norm.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 472137728, | |
| 472924160 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.34.norm.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 9216, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 472924160, | |
| 475283456 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.34.proj_mlp.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 475283456, | |
| 476069888 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.34.proj_mlp.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 12288, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 476069888, | |
| 479215616 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.34.proj_out.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 15360 | |
| ], | |
| "data_offsets": [ | |
| 479215616, | |
| 483147776 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.34.proj_out.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 483147776, | |
| 483934208 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.35.attn.to_k.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 483934208, | |
| 484720640 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.35.attn.to_k.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 484720640, | |
| 485507072 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.35.attn.to_q.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 485507072, | |
| 486293504 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.35.attn.to_q.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 486293504, | |
| 487079936 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.35.attn.to_v.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 487079936, | |
| 487866368 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.35.attn.to_v.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 487866368, | |
| 488652800 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.35.norm.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 488652800, | |
| 489439232 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.35.norm.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 9216, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 489439232, | |
| 491798528 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.35.proj_mlp.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 491798528, | |
| 492584960 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.35.proj_mlp.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 12288, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 492584960, | |
| 495730688 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.35.proj_out.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 15360 | |
| ], | |
| "data_offsets": [ | |
| 495730688, | |
| 499662848 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.35.proj_out.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 499662848, | |
| 500449280 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.36.attn.to_k.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 500449280, | |
| 501235712 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.36.attn.to_k.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 501235712, | |
| 502022144 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.36.attn.to_q.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 502022144, | |
| 502808576 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.36.attn.to_q.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 502808576, | |
| 503595008 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.36.attn.to_v.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 503595008, | |
| 504381440 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.36.attn.to_v.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 504381440, | |
| 505167872 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.36.norm.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 505167872, | |
| 505954304 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.36.norm.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 9216, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 505954304, | |
| 508313600 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.36.proj_mlp.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 508313600, | |
| 509100032 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.36.proj_mlp.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 12288, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 509100032, | |
| 512245760 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.36.proj_out.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 15360 | |
| ], | |
| "data_offsets": [ | |
| 512245760, | |
| 516177920 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.36.proj_out.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 516177920, | |
| 516964352 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.37.attn.to_k.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 516964352, | |
| 517750784 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.37.attn.to_k.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 517750784, | |
| 518537216 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.37.attn.to_q.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 518537216, | |
| 519323648 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.37.attn.to_q.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 519323648, | |
| 520110080 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.37.attn.to_v.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 520110080, | |
| 520896512 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.37.attn.to_v.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 520896512, | |
| 521682944 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.37.norm.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 521682944, | |
| 522469376 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.37.norm.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 9216, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 522469376, | |
| 524828672 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.37.proj_mlp.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 524828672, | |
| 525615104 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.37.proj_mlp.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 12288, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 525615104, | |
| 528760832 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.37.proj_out.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 15360 | |
| ], | |
| "data_offsets": [ | |
| 528760832, | |
| 532692992 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.37.proj_out.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 532692992, | |
| 533479424 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.4.attn.to_k.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 533479424, | |
| 534265856 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.4.attn.to_k.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 534265856, | |
| 535052288 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.4.attn.to_q.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 535052288, | |
| 535838720 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.4.attn.to_q.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 535838720, | |
| 536625152 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.4.attn.to_v.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 536625152, | |
| 537411584 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.4.attn.to_v.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 537411584, | |
| 538198016 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.4.norm.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 538198016, | |
| 538984448 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.4.norm.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 9216, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 538984448, | |
| 541343744 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.4.proj_mlp.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 541343744, | |
| 542130176 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.4.proj_mlp.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 12288, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 542130176, | |
| 545275904 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.4.proj_out.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 15360 | |
| ], | |
| "data_offsets": [ | |
| 545275904, | |
| 549208064 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.4.proj_out.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 549208064, | |
| 549994496 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.5.attn.to_k.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 549994496, | |
| 550780928 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.5.attn.to_k.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 550780928, | |
| 551567360 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.5.attn.to_q.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 551567360, | |
| 552353792 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.5.attn.to_q.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 552353792, | |
| 553140224 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.5.attn.to_v.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 553140224, | |
| 553926656 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.5.attn.to_v.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 553926656, | |
| 554713088 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.5.norm.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 554713088, | |
| 555499520 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.5.norm.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 9216, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 555499520, | |
| 557858816 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.5.proj_mlp.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 557858816, | |
| 558645248 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.5.proj_mlp.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 12288, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 558645248, | |
| 561790976 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.5.proj_out.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 15360 | |
| ], | |
| "data_offsets": [ | |
| 561790976, | |
| 565723136 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.5.proj_out.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 565723136, | |
| 566509568 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.6.attn.to_k.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 566509568, | |
| 567296000 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.6.attn.to_k.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 567296000, | |
| 568082432 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.6.attn.to_q.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 568082432, | |
| 568868864 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.6.attn.to_q.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 568868864, | |
| 569655296 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.6.attn.to_v.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 569655296, | |
| 570441728 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.6.attn.to_v.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 570441728, | |
| 571228160 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.6.norm.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 571228160, | |
| 572014592 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.6.norm.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 9216, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 572014592, | |
| 574373888 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.6.proj_mlp.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 574373888, | |
| 575160320 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.6.proj_mlp.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 12288, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 575160320, | |
| 578306048 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.6.proj_out.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 15360 | |
| ], | |
| "data_offsets": [ | |
| 578306048, | |
| 582238208 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.6.proj_out.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 582238208, | |
| 583024640 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.7.attn.to_k.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 583024640, | |
| 583811072 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.7.attn.to_k.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 583811072, | |
| 584597504 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.7.attn.to_q.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 584597504, | |
| 585383936 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.7.attn.to_q.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 585383936, | |
| 586170368 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.7.attn.to_v.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 586170368, | |
| 586956800 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.7.attn.to_v.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 586956800, | |
| 587743232 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.7.norm.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 587743232, | |
| 588529664 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.7.norm.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 9216, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 588529664, | |
| 590888960 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.7.proj_mlp.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 590888960, | |
| 591675392 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.7.proj_mlp.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 12288, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 591675392, | |
| 594821120 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.7.proj_out.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 15360 | |
| ], | |
| "data_offsets": [ | |
| 594821120, | |
| 598753280 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.7.proj_out.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 598753280, | |
| 599539712 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.8.attn.to_k.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 599539712, | |
| 600326144 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.8.attn.to_k.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 600326144, | |
| 601112576 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.8.attn.to_q.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 601112576, | |
| 601899008 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.8.attn.to_q.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 601899008, | |
| 602685440 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.8.attn.to_v.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 602685440, | |
| 603471872 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.8.attn.to_v.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 603471872, | |
| 604258304 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.8.norm.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 604258304, | |
| 605044736 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.8.norm.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 9216, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 605044736, | |
| 607404032 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.8.proj_mlp.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 607404032, | |
| 608190464 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.8.proj_mlp.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 12288, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 608190464, | |
| 611336192 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.8.proj_out.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 15360 | |
| ], | |
| "data_offsets": [ | |
| 611336192, | |
| 615268352 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.8.proj_out.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 615268352, | |
| 616054784 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.9.attn.to_k.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 616054784, | |
| 616841216 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.9.attn.to_k.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 616841216, | |
| 617627648 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.9.attn.to_q.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 617627648, | |
| 618414080 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.9.attn.to_q.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 618414080, | |
| 619200512 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.9.attn.to_v.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 619200512, | |
| 619986944 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.9.attn.to_v.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 619986944, | |
| 620773376 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.9.norm.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 620773376, | |
| 621559808 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.9.norm.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 9216, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 621559808, | |
| 623919104 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.9.proj_mlp.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 623919104, | |
| 624705536 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.9.proj_mlp.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 12288, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 624705536, | |
| 627851264 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.9.proj_out.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 15360 | |
| ], | |
| "data_offsets": [ | |
| 627851264, | |
| 631783424 | |
| ] | |
| }, | |
| "transformer.single_transformer_blocks.9.proj_out.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 631783424, | |
| 632569856 | |
| ] | |
| }, | |
| "transformer.time_text_embed.guidance_embedder.linear_1.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 256 | |
| ], | |
| "data_offsets": [ | |
| 632569856, | |
| 632635392 | |
| ] | |
| }, | |
| "transformer.time_text_embed.guidance_embedder.linear_1.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 632635392, | |
| 633421824 | |
| ] | |
| }, | |
| "transformer.time_text_embed.guidance_embedder.linear_2.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 633421824, | |
| 634208256 | |
| ] | |
| }, | |
| "transformer.time_text_embed.guidance_embedder.linear_2.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 634208256, | |
| 634994688 | |
| ] | |
| }, | |
| "transformer.time_text_embed.text_embedder.linear_1.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 768 | |
| ], | |
| "data_offsets": [ | |
| 634994688, | |
| 635191296 | |
| ] | |
| }, | |
| "transformer.time_text_embed.text_embedder.linear_1.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 635191296, | |
| 635977728 | |
| ] | |
| }, | |
| "transformer.time_text_embed.text_embedder.linear_2.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 635977728, | |
| 636764160 | |
| ] | |
| }, | |
| "transformer.time_text_embed.text_embedder.linear_2.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 636764160, | |
| 637550592 | |
| ] | |
| }, | |
| "transformer.time_text_embed.timestep_embedder.linear_1.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 256 | |
| ], | |
| "data_offsets": [ | |
| 637550592, | |
| 637616128 | |
| ] | |
| }, | |
| "transformer.time_text_embed.timestep_embedder.linear_1.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 637616128, | |
| 638402560 | |
| ] | |
| }, | |
| "transformer.time_text_embed.timestep_embedder.linear_2.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 638402560, | |
| 639188992 | |
| ] | |
| }, | |
| "transformer.time_text_embed.timestep_embedder.linear_2.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 639188992, | |
| 639975424 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.0.attn.add_k_proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 639975424, | |
| 640761856 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.0.attn.add_k_proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 640761856, | |
| 641548288 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.0.attn.add_q_proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 641548288, | |
| 642334720 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.0.attn.add_q_proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 642334720, | |
| 643121152 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.0.attn.add_v_proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 643121152, | |
| 643907584 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.0.attn.add_v_proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 643907584, | |
| 644694016 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.0.attn.to_add_out.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 644694016, | |
| 645480448 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.0.attn.to_add_out.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 645480448, | |
| 646266880 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.0.attn.to_k.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 646266880, | |
| 647053312 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.0.attn.to_k.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 647053312, | |
| 647839744 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.0.attn.to_out.0.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 647839744, | |
| 648626176 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.0.attn.to_out.0.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 648626176, | |
| 649412608 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.0.attn.to_q.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 649412608, | |
| 650199040 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.0.attn.to_q.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 650199040, | |
| 650985472 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.0.attn.to_v.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 650985472, | |
| 651771904 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.0.attn.to_v.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 651771904, | |
| 652558336 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.0.ff.net.0.proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 652558336, | |
| 653344768 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.0.ff.net.0.proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 12288, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 653344768, | |
| 656490496 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.0.ff.net.2.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 12288 | |
| ], | |
| "data_offsets": [ | |
| 656490496, | |
| 659636224 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.0.ff.net.2.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 659636224, | |
| 660422656 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.0.ff_context.net.0.proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 660422656, | |
| 661209088 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.0.ff_context.net.0.proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 12288, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 661209088, | |
| 664354816 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.0.ff_context.net.2.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 12288 | |
| ], | |
| "data_offsets": [ | |
| 664354816, | |
| 667500544 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.0.ff_context.net.2.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 667500544, | |
| 668286976 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.0.norm1.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 668286976, | |
| 669073408 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.0.norm1.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 18432, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 669073408, | |
| 673792000 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.0.norm1_context.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 673792000, | |
| 674578432 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.0.norm1_context.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 18432, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 674578432, | |
| 679297024 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.1.attn.add_k_proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 679297024, | |
| 680083456 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.1.attn.add_k_proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 680083456, | |
| 680869888 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.1.attn.add_q_proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 680869888, | |
| 681656320 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.1.attn.add_q_proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 681656320, | |
| 682442752 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.1.attn.add_v_proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 682442752, | |
| 683229184 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.1.attn.add_v_proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 683229184, | |
| 684015616 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.1.attn.to_add_out.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 684015616, | |
| 684802048 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.1.attn.to_add_out.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 684802048, | |
| 685588480 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.1.attn.to_k.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 685588480, | |
| 686374912 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.1.attn.to_k.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 686374912, | |
| 687161344 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.1.attn.to_out.0.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 687161344, | |
| 687947776 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.1.attn.to_out.0.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 687947776, | |
| 688734208 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.1.attn.to_q.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 688734208, | |
| 689520640 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.1.attn.to_q.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 689520640, | |
| 690307072 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.1.attn.to_v.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 690307072, | |
| 691093504 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.1.attn.to_v.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 691093504, | |
| 691879936 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.1.ff.net.0.proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 691879936, | |
| 692666368 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.1.ff.net.0.proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 12288, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 692666368, | |
| 695812096 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.1.ff.net.2.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 12288 | |
| ], | |
| "data_offsets": [ | |
| 695812096, | |
| 698957824 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.1.ff.net.2.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 698957824, | |
| 699744256 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.1.ff_context.net.0.proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 699744256, | |
| 700530688 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.1.ff_context.net.0.proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 12288, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 700530688, | |
| 703676416 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.1.ff_context.net.2.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 12288 | |
| ], | |
| "data_offsets": [ | |
| 703676416, | |
| 706822144 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.1.ff_context.net.2.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 706822144, | |
| 707608576 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.1.norm1.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 707608576, | |
| 708395008 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.1.norm1.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 18432, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 708395008, | |
| 713113600 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.1.norm1_context.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 713113600, | |
| 713900032 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.1.norm1_context.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 18432, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 713900032, | |
| 718618624 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.10.attn.add_k_proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 718618624, | |
| 719405056 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.10.attn.add_k_proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 719405056, | |
| 720191488 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.10.attn.add_q_proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 720191488, | |
| 720977920 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.10.attn.add_q_proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 720977920, | |
| 721764352 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.10.attn.add_v_proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 721764352, | |
| 722550784 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.10.attn.add_v_proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 722550784, | |
| 723337216 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.10.attn.to_add_out.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 723337216, | |
| 724123648 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.10.attn.to_add_out.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 724123648, | |
| 724910080 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.10.attn.to_k.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 724910080, | |
| 725696512 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.10.attn.to_k.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 725696512, | |
| 726482944 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.10.attn.to_out.0.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 726482944, | |
| 727269376 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.10.attn.to_out.0.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 727269376, | |
| 728055808 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.10.attn.to_q.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 728055808, | |
| 728842240 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.10.attn.to_q.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 728842240, | |
| 729628672 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.10.attn.to_v.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 729628672, | |
| 730415104 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.10.attn.to_v.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 730415104, | |
| 731201536 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.10.ff.net.0.proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 731201536, | |
| 731987968 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.10.ff.net.0.proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 12288, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 731987968, | |
| 735133696 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.10.ff.net.2.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 12288 | |
| ], | |
| "data_offsets": [ | |
| 735133696, | |
| 738279424 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.10.ff.net.2.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 738279424, | |
| 739065856 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.10.ff_context.net.0.proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 739065856, | |
| 739852288 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.10.ff_context.net.0.proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 12288, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 739852288, | |
| 742998016 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.10.ff_context.net.2.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 12288 | |
| ], | |
| "data_offsets": [ | |
| 742998016, | |
| 746143744 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.10.ff_context.net.2.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 746143744, | |
| 746930176 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.10.norm1.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 746930176, | |
| 747716608 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.10.norm1.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 18432, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 747716608, | |
| 752435200 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.10.norm1_context.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 752435200, | |
| 753221632 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.10.norm1_context.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 18432, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 753221632, | |
| 757940224 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.11.attn.add_k_proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 757940224, | |
| 758726656 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.11.attn.add_k_proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 758726656, | |
| 759513088 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.11.attn.add_q_proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 759513088, | |
| 760299520 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.11.attn.add_q_proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 760299520, | |
| 761085952 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.11.attn.add_v_proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 761085952, | |
| 761872384 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.11.attn.add_v_proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 761872384, | |
| 762658816 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.11.attn.to_add_out.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 762658816, | |
| 763445248 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.11.attn.to_add_out.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 763445248, | |
| 764231680 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.11.attn.to_k.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 764231680, | |
| 765018112 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.11.attn.to_k.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 765018112, | |
| 765804544 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.11.attn.to_out.0.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 765804544, | |
| 766590976 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.11.attn.to_out.0.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 766590976, | |
| 767377408 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.11.attn.to_q.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 767377408, | |
| 768163840 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.11.attn.to_q.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 768163840, | |
| 768950272 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.11.attn.to_v.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 768950272, | |
| 769736704 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.11.attn.to_v.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 769736704, | |
| 770523136 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.11.ff.net.0.proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 770523136, | |
| 771309568 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.11.ff.net.0.proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 12288, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 771309568, | |
| 774455296 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.11.ff.net.2.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 12288 | |
| ], | |
| "data_offsets": [ | |
| 774455296, | |
| 777601024 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.11.ff.net.2.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 777601024, | |
| 778387456 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.11.ff_context.net.0.proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 778387456, | |
| 779173888 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.11.ff_context.net.0.proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 12288, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 779173888, | |
| 782319616 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.11.ff_context.net.2.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 12288 | |
| ], | |
| "data_offsets": [ | |
| 782319616, | |
| 785465344 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.11.ff_context.net.2.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 785465344, | |
| 786251776 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.11.norm1.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 786251776, | |
| 787038208 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.11.norm1.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 18432, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 787038208, | |
| 791756800 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.11.norm1_context.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 791756800, | |
| 792543232 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.11.norm1_context.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 18432, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 792543232, | |
| 797261824 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.12.attn.add_k_proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 797261824, | |
| 798048256 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.12.attn.add_k_proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 798048256, | |
| 798834688 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.12.attn.add_q_proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 798834688, | |
| 799621120 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.12.attn.add_q_proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 799621120, | |
| 800407552 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.12.attn.add_v_proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 800407552, | |
| 801193984 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.12.attn.add_v_proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 801193984, | |
| 801980416 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.12.attn.to_add_out.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 801980416, | |
| 802766848 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.12.attn.to_add_out.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 802766848, | |
| 803553280 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.12.attn.to_k.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 803553280, | |
| 804339712 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.12.attn.to_k.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 804339712, | |
| 805126144 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.12.attn.to_out.0.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 805126144, | |
| 805912576 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.12.attn.to_out.0.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 805912576, | |
| 806699008 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.12.attn.to_q.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 806699008, | |
| 807485440 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.12.attn.to_q.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 807485440, | |
| 808271872 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.12.attn.to_v.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 808271872, | |
| 809058304 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.12.attn.to_v.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 809058304, | |
| 809844736 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.12.ff.net.0.proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 809844736, | |
| 810631168 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.12.ff.net.0.proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 12288, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 810631168, | |
| 813776896 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.12.ff.net.2.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 12288 | |
| ], | |
| "data_offsets": [ | |
| 813776896, | |
| 816922624 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.12.ff.net.2.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 816922624, | |
| 817709056 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.12.ff_context.net.0.proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 817709056, | |
| 818495488 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.12.ff_context.net.0.proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 12288, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 818495488, | |
| 821641216 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.12.ff_context.net.2.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 12288 | |
| ], | |
| "data_offsets": [ | |
| 821641216, | |
| 824786944 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.12.ff_context.net.2.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 824786944, | |
| 825573376 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.12.norm1.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 825573376, | |
| 826359808 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.12.norm1.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 18432, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 826359808, | |
| 831078400 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.12.norm1_context.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 831078400, | |
| 831864832 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.12.norm1_context.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 18432, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 831864832, | |
| 836583424 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.13.attn.add_k_proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 836583424, | |
| 837369856 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.13.attn.add_k_proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 837369856, | |
| 838156288 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.13.attn.add_q_proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 838156288, | |
| 838942720 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.13.attn.add_q_proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 838942720, | |
| 839729152 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.13.attn.add_v_proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 839729152, | |
| 840515584 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.13.attn.add_v_proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 840515584, | |
| 841302016 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.13.attn.to_add_out.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 841302016, | |
| 842088448 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.13.attn.to_add_out.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 842088448, | |
| 842874880 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.13.attn.to_k.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 842874880, | |
| 843661312 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.13.attn.to_k.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 843661312, | |
| 844447744 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.13.attn.to_out.0.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 844447744, | |
| 845234176 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.13.attn.to_out.0.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 845234176, | |
| 846020608 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.13.attn.to_q.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 846020608, | |
| 846807040 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.13.attn.to_q.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 846807040, | |
| 847593472 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.13.attn.to_v.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 847593472, | |
| 848379904 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.13.attn.to_v.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 848379904, | |
| 849166336 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.13.ff.net.0.proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 849166336, | |
| 849952768 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.13.ff.net.0.proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 12288, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 849952768, | |
| 853098496 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.13.ff.net.2.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 12288 | |
| ], | |
| "data_offsets": [ | |
| 853098496, | |
| 856244224 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.13.ff.net.2.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 856244224, | |
| 857030656 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.13.ff_context.net.0.proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 857030656, | |
| 857817088 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.13.ff_context.net.0.proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 12288, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 857817088, | |
| 860962816 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.13.ff_context.net.2.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 12288 | |
| ], | |
| "data_offsets": [ | |
| 860962816, | |
| 864108544 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.13.ff_context.net.2.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 864108544, | |
| 864894976 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.13.norm1.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 864894976, | |
| 865681408 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.13.norm1.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 18432, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 865681408, | |
| 870400000 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.13.norm1_context.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 870400000, | |
| 871186432 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.13.norm1_context.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 18432, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 871186432, | |
| 875905024 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.14.attn.add_k_proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 875905024, | |
| 876691456 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.14.attn.add_k_proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 876691456, | |
| 877477888 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.14.attn.add_q_proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 877477888, | |
| 878264320 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.14.attn.add_q_proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 878264320, | |
| 879050752 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.14.attn.add_v_proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 879050752, | |
| 879837184 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.14.attn.add_v_proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 879837184, | |
| 880623616 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.14.attn.to_add_out.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 880623616, | |
| 881410048 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.14.attn.to_add_out.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 881410048, | |
| 882196480 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.14.attn.to_k.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 882196480, | |
| 882982912 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.14.attn.to_k.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 882982912, | |
| 883769344 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.14.attn.to_out.0.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 883769344, | |
| 884555776 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.14.attn.to_out.0.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 884555776, | |
| 885342208 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.14.attn.to_q.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 885342208, | |
| 886128640 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.14.attn.to_q.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 886128640, | |
| 886915072 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.14.attn.to_v.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 886915072, | |
| 887701504 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.14.attn.to_v.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 887701504, | |
| 888487936 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.14.ff.net.0.proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 888487936, | |
| 889274368 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.14.ff.net.0.proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 12288, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 889274368, | |
| 892420096 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.14.ff.net.2.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 12288 | |
| ], | |
| "data_offsets": [ | |
| 892420096, | |
| 895565824 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.14.ff.net.2.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 895565824, | |
| 896352256 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.14.ff_context.net.0.proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 896352256, | |
| 897138688 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.14.ff_context.net.0.proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 12288, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 897138688, | |
| 900284416 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.14.ff_context.net.2.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 12288 | |
| ], | |
| "data_offsets": [ | |
| 900284416, | |
| 903430144 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.14.ff_context.net.2.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 903430144, | |
| 904216576 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.14.norm1.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 904216576, | |
| 905003008 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.14.norm1.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 18432, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 905003008, | |
| 909721600 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.14.norm1_context.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 909721600, | |
| 910508032 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.14.norm1_context.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 18432, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 910508032, | |
| 915226624 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.15.attn.add_k_proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 915226624, | |
| 916013056 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.15.attn.add_k_proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 916013056, | |
| 916799488 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.15.attn.add_q_proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 916799488, | |
| 917585920 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.15.attn.add_q_proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 917585920, | |
| 918372352 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.15.attn.add_v_proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 918372352, | |
| 919158784 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.15.attn.add_v_proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 919158784, | |
| 919945216 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.15.attn.to_add_out.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 919945216, | |
| 920731648 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.15.attn.to_add_out.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 920731648, | |
| 921518080 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.15.attn.to_k.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 921518080, | |
| 922304512 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.15.attn.to_k.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 922304512, | |
| 923090944 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.15.attn.to_out.0.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 923090944, | |
| 923877376 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.15.attn.to_out.0.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 923877376, | |
| 924663808 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.15.attn.to_q.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 924663808, | |
| 925450240 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.15.attn.to_q.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 925450240, | |
| 926236672 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.15.attn.to_v.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 926236672, | |
| 927023104 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.15.attn.to_v.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 927023104, | |
| 927809536 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.15.ff.net.0.proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 927809536, | |
| 928595968 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.15.ff.net.0.proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 12288, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 928595968, | |
| 931741696 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.15.ff.net.2.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 12288 | |
| ], | |
| "data_offsets": [ | |
| 931741696, | |
| 934887424 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.15.ff.net.2.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 934887424, | |
| 935673856 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.15.ff_context.net.0.proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 935673856, | |
| 936460288 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.15.ff_context.net.0.proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 12288, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 936460288, | |
| 939606016 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.15.ff_context.net.2.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 12288 | |
| ], | |
| "data_offsets": [ | |
| 939606016, | |
| 942751744 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.15.ff_context.net.2.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 942751744, | |
| 943538176 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.15.norm1.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 943538176, | |
| 944324608 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.15.norm1.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 18432, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 944324608, | |
| 949043200 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.15.norm1_context.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 949043200, | |
| 949829632 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.15.norm1_context.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 18432, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 949829632, | |
| 954548224 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.16.attn.add_k_proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 954548224, | |
| 955334656 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.16.attn.add_k_proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 955334656, | |
| 956121088 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.16.attn.add_q_proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 956121088, | |
| 956907520 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.16.attn.add_q_proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 956907520, | |
| 957693952 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.16.attn.add_v_proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 957693952, | |
| 958480384 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.16.attn.add_v_proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 958480384, | |
| 959266816 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.16.attn.to_add_out.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 959266816, | |
| 960053248 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.16.attn.to_add_out.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 960053248, | |
| 960839680 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.16.attn.to_k.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 960839680, | |
| 961626112 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.16.attn.to_k.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 961626112, | |
| 962412544 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.16.attn.to_out.0.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 962412544, | |
| 963198976 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.16.attn.to_out.0.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 963198976, | |
| 963985408 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.16.attn.to_q.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 963985408, | |
| 964771840 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.16.attn.to_q.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 964771840, | |
| 965558272 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.16.attn.to_v.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 965558272, | |
| 966344704 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.16.attn.to_v.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 966344704, | |
| 967131136 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.16.ff.net.0.proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 967131136, | |
| 967917568 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.16.ff.net.0.proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 12288, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 967917568, | |
| 971063296 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.16.ff.net.2.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 12288 | |
| ], | |
| "data_offsets": [ | |
| 971063296, | |
| 974209024 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.16.ff.net.2.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 974209024, | |
| 974995456 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.16.ff_context.net.0.proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 974995456, | |
| 975781888 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.16.ff_context.net.0.proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 12288, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 975781888, | |
| 978927616 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.16.ff_context.net.2.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 12288 | |
| ], | |
| "data_offsets": [ | |
| 978927616, | |
| 982073344 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.16.ff_context.net.2.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 982073344, | |
| 982859776 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.16.norm1.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 982859776, | |
| 983646208 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.16.norm1.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 18432, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 983646208, | |
| 988364800 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.16.norm1_context.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 988364800, | |
| 989151232 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.16.norm1_context.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 18432, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 989151232, | |
| 993869824 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.17.attn.add_k_proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 993869824, | |
| 994656256 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.17.attn.add_k_proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 994656256, | |
| 995442688 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.17.attn.add_q_proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 995442688, | |
| 996229120 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.17.attn.add_q_proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 996229120, | |
| 997015552 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.17.attn.add_v_proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 997015552, | |
| 997801984 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.17.attn.add_v_proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 997801984, | |
| 998588416 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.17.attn.to_add_out.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 998588416, | |
| 999374848 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.17.attn.to_add_out.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 999374848, | |
| 1000161280 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.17.attn.to_k.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1000161280, | |
| 1000947712 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.17.attn.to_k.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1000947712, | |
| 1001734144 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.17.attn.to_out.0.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1001734144, | |
| 1002520576 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.17.attn.to_out.0.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1002520576, | |
| 1003307008 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.17.attn.to_q.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1003307008, | |
| 1004093440 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.17.attn.to_q.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1004093440, | |
| 1004879872 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.17.attn.to_v.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1004879872, | |
| 1005666304 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.17.attn.to_v.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1005666304, | |
| 1006452736 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.17.ff.net.0.proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1006452736, | |
| 1007239168 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.17.ff.net.0.proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 12288, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1007239168, | |
| 1010384896 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.17.ff.net.2.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 12288 | |
| ], | |
| "data_offsets": [ | |
| 1010384896, | |
| 1013530624 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.17.ff.net.2.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1013530624, | |
| 1014317056 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.17.ff_context.net.0.proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1014317056, | |
| 1015103488 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.17.ff_context.net.0.proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 12288, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1015103488, | |
| 1018249216 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.17.ff_context.net.2.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 12288 | |
| ], | |
| "data_offsets": [ | |
| 1018249216, | |
| 1021394944 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.17.ff_context.net.2.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1021394944, | |
| 1022181376 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.17.norm1.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1022181376, | |
| 1022967808 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.17.norm1.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 18432, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1022967808, | |
| 1027686400 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.17.norm1_context.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1027686400, | |
| 1028472832 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.17.norm1_context.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 18432, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1028472832, | |
| 1033191424 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.18.attn.add_k_proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1033191424, | |
| 1033977856 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.18.attn.add_k_proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1033977856, | |
| 1034764288 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.18.attn.add_q_proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1034764288, | |
| 1035550720 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.18.attn.add_q_proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1035550720, | |
| 1036337152 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.18.attn.add_v_proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1036337152, | |
| 1037123584 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.18.attn.add_v_proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1037123584, | |
| 1037910016 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.18.attn.to_add_out.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1037910016, | |
| 1038696448 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.18.attn.to_add_out.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1038696448, | |
| 1039482880 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.18.attn.to_k.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1039482880, | |
| 1040269312 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.18.attn.to_k.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1040269312, | |
| 1041055744 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.18.attn.to_out.0.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1041055744, | |
| 1041842176 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.18.attn.to_out.0.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1041842176, | |
| 1042628608 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.18.attn.to_q.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1042628608, | |
| 1043415040 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.18.attn.to_q.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1043415040, | |
| 1044201472 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.18.attn.to_v.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1044201472, | |
| 1044987904 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.18.attn.to_v.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1044987904, | |
| 1045774336 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.18.ff.net.0.proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1045774336, | |
| 1046560768 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.18.ff.net.0.proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 12288, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1046560768, | |
| 1049706496 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.18.ff.net.2.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 12288 | |
| ], | |
| "data_offsets": [ | |
| 1049706496, | |
| 1052852224 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.18.ff.net.2.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1052852224, | |
| 1053638656 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.18.ff_context.net.0.proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1053638656, | |
| 1054425088 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.18.ff_context.net.0.proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 12288, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1054425088, | |
| 1057570816 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.18.ff_context.net.2.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 12288 | |
| ], | |
| "data_offsets": [ | |
| 1057570816, | |
| 1060716544 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.18.ff_context.net.2.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1060716544, | |
| 1061502976 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.18.norm1.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1061502976, | |
| 1062289408 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.18.norm1.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 18432, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1062289408, | |
| 1067008000 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.18.norm1_context.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1067008000, | |
| 1067794432 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.18.norm1_context.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 18432, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1067794432, | |
| 1072513024 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.2.attn.add_k_proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1072513024, | |
| 1073299456 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.2.attn.add_k_proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1073299456, | |
| 1074085888 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.2.attn.add_q_proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1074085888, | |
| 1074872320 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.2.attn.add_q_proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1074872320, | |
| 1075658752 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.2.attn.add_v_proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1075658752, | |
| 1076445184 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.2.attn.add_v_proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1076445184, | |
| 1077231616 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.2.attn.to_add_out.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1077231616, | |
| 1078018048 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.2.attn.to_add_out.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1078018048, | |
| 1078804480 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.2.attn.to_k.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1078804480, | |
| 1079590912 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.2.attn.to_k.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1079590912, | |
| 1080377344 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.2.attn.to_out.0.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1080377344, | |
| 1081163776 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.2.attn.to_out.0.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1081163776, | |
| 1081950208 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.2.attn.to_q.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1081950208, | |
| 1082736640 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.2.attn.to_q.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1082736640, | |
| 1083523072 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.2.attn.to_v.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1083523072, | |
| 1084309504 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.2.attn.to_v.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1084309504, | |
| 1085095936 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.2.ff.net.0.proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1085095936, | |
| 1085882368 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.2.ff.net.0.proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 12288, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1085882368, | |
| 1089028096 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.2.ff.net.2.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 12288 | |
| ], | |
| "data_offsets": [ | |
| 1089028096, | |
| 1092173824 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.2.ff.net.2.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1092173824, | |
| 1092960256 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.2.ff_context.net.0.proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1092960256, | |
| 1093746688 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.2.ff_context.net.0.proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 12288, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1093746688, | |
| 1096892416 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.2.ff_context.net.2.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 12288 | |
| ], | |
| "data_offsets": [ | |
| 1096892416, | |
| 1100038144 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.2.ff_context.net.2.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1100038144, | |
| 1100824576 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.2.norm1.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1100824576, | |
| 1101611008 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.2.norm1.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 18432, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1101611008, | |
| 1106329600 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.2.norm1_context.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1106329600, | |
| 1107116032 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.2.norm1_context.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 18432, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1107116032, | |
| 1111834624 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.3.attn.add_k_proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1111834624, | |
| 1112621056 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.3.attn.add_k_proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1112621056, | |
| 1113407488 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.3.attn.add_q_proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1113407488, | |
| 1114193920 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.3.attn.add_q_proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1114193920, | |
| 1114980352 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.3.attn.add_v_proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1114980352, | |
| 1115766784 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.3.attn.add_v_proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1115766784, | |
| 1116553216 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.3.attn.to_add_out.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1116553216, | |
| 1117339648 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.3.attn.to_add_out.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1117339648, | |
| 1118126080 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.3.attn.to_k.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1118126080, | |
| 1118912512 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.3.attn.to_k.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1118912512, | |
| 1119698944 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.3.attn.to_out.0.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1119698944, | |
| 1120485376 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.3.attn.to_out.0.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1120485376, | |
| 1121271808 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.3.attn.to_q.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1121271808, | |
| 1122058240 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.3.attn.to_q.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1122058240, | |
| 1122844672 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.3.attn.to_v.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1122844672, | |
| 1123631104 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.3.attn.to_v.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1123631104, | |
| 1124417536 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.3.ff.net.0.proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1124417536, | |
| 1125203968 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.3.ff.net.0.proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 12288, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1125203968, | |
| 1128349696 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.3.ff.net.2.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 12288 | |
| ], | |
| "data_offsets": [ | |
| 1128349696, | |
| 1131495424 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.3.ff.net.2.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1131495424, | |
| 1132281856 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.3.ff_context.net.0.proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1132281856, | |
| 1133068288 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.3.ff_context.net.0.proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 12288, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1133068288, | |
| 1136214016 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.3.ff_context.net.2.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 12288 | |
| ], | |
| "data_offsets": [ | |
| 1136214016, | |
| 1139359744 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.3.ff_context.net.2.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1139359744, | |
| 1140146176 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.3.norm1.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1140146176, | |
| 1140932608 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.3.norm1.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 18432, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1140932608, | |
| 1145651200 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.3.norm1_context.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1145651200, | |
| 1146437632 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.3.norm1_context.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 18432, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1146437632, | |
| 1151156224 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.4.attn.add_k_proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1151156224, | |
| 1151942656 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.4.attn.add_k_proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1151942656, | |
| 1152729088 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.4.attn.add_q_proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1152729088, | |
| 1153515520 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.4.attn.add_q_proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1153515520, | |
| 1154301952 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.4.attn.add_v_proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1154301952, | |
| 1155088384 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.4.attn.add_v_proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1155088384, | |
| 1155874816 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.4.attn.to_add_out.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1155874816, | |
| 1156661248 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.4.attn.to_add_out.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1156661248, | |
| 1157447680 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.4.attn.to_k.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1157447680, | |
| 1158234112 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.4.attn.to_k.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1158234112, | |
| 1159020544 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.4.attn.to_out.0.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1159020544, | |
| 1159806976 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.4.attn.to_out.0.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1159806976, | |
| 1160593408 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.4.attn.to_q.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1160593408, | |
| 1161379840 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.4.attn.to_q.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1161379840, | |
| 1162166272 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.4.attn.to_v.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1162166272, | |
| 1162952704 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.4.attn.to_v.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1162952704, | |
| 1163739136 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.4.ff.net.0.proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1163739136, | |
| 1164525568 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.4.ff.net.0.proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 12288, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1164525568, | |
| 1167671296 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.4.ff.net.2.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 12288 | |
| ], | |
| "data_offsets": [ | |
| 1167671296, | |
| 1170817024 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.4.ff.net.2.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1170817024, | |
| 1171603456 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.4.ff_context.net.0.proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1171603456, | |
| 1172389888 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.4.ff_context.net.0.proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 12288, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1172389888, | |
| 1175535616 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.4.ff_context.net.2.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 12288 | |
| ], | |
| "data_offsets": [ | |
| 1175535616, | |
| 1178681344 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.4.ff_context.net.2.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1178681344, | |
| 1179467776 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.4.norm1.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1179467776, | |
| 1180254208 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.4.norm1.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 18432, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1180254208, | |
| 1184972800 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.4.norm1_context.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1184972800, | |
| 1185759232 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.4.norm1_context.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 18432, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1185759232, | |
| 1190477824 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.5.attn.add_k_proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1190477824, | |
| 1191264256 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.5.attn.add_k_proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1191264256, | |
| 1192050688 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.5.attn.add_q_proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1192050688, | |
| 1192837120 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.5.attn.add_q_proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1192837120, | |
| 1193623552 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.5.attn.add_v_proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1193623552, | |
| 1194409984 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.5.attn.add_v_proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1194409984, | |
| 1195196416 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.5.attn.to_add_out.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1195196416, | |
| 1195982848 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.5.attn.to_add_out.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1195982848, | |
| 1196769280 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.5.attn.to_k.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1196769280, | |
| 1197555712 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.5.attn.to_k.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1197555712, | |
| 1198342144 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.5.attn.to_out.0.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1198342144, | |
| 1199128576 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.5.attn.to_out.0.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1199128576, | |
| 1199915008 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.5.attn.to_q.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1199915008, | |
| 1200701440 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.5.attn.to_q.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1200701440, | |
| 1201487872 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.5.attn.to_v.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1201487872, | |
| 1202274304 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.5.attn.to_v.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1202274304, | |
| 1203060736 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.5.ff.net.0.proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1203060736, | |
| 1203847168 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.5.ff.net.0.proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 12288, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1203847168, | |
| 1206992896 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.5.ff.net.2.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 12288 | |
| ], | |
| "data_offsets": [ | |
| 1206992896, | |
| 1210138624 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.5.ff.net.2.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1210138624, | |
| 1210925056 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.5.ff_context.net.0.proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1210925056, | |
| 1211711488 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.5.ff_context.net.0.proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 12288, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1211711488, | |
| 1214857216 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.5.ff_context.net.2.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 12288 | |
| ], | |
| "data_offsets": [ | |
| 1214857216, | |
| 1218002944 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.5.ff_context.net.2.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1218002944, | |
| 1218789376 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.5.norm1.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1218789376, | |
| 1219575808 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.5.norm1.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 18432, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1219575808, | |
| 1224294400 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.5.norm1_context.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1224294400, | |
| 1225080832 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.5.norm1_context.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 18432, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1225080832, | |
| 1229799424 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.6.attn.add_k_proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1229799424, | |
| 1230585856 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.6.attn.add_k_proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1230585856, | |
| 1231372288 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.6.attn.add_q_proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1231372288, | |
| 1232158720 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.6.attn.add_q_proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1232158720, | |
| 1232945152 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.6.attn.add_v_proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1232945152, | |
| 1233731584 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.6.attn.add_v_proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1233731584, | |
| 1234518016 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.6.attn.to_add_out.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1234518016, | |
| 1235304448 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.6.attn.to_add_out.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1235304448, | |
| 1236090880 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.6.attn.to_k.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1236090880, | |
| 1236877312 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.6.attn.to_k.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1236877312, | |
| 1237663744 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.6.attn.to_out.0.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1237663744, | |
| 1238450176 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.6.attn.to_out.0.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1238450176, | |
| 1239236608 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.6.attn.to_q.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1239236608, | |
| 1240023040 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.6.attn.to_q.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1240023040, | |
| 1240809472 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.6.attn.to_v.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1240809472, | |
| 1241595904 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.6.attn.to_v.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1241595904, | |
| 1242382336 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.6.ff.net.0.proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1242382336, | |
| 1243168768 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.6.ff.net.0.proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 12288, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1243168768, | |
| 1246314496 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.6.ff.net.2.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 12288 | |
| ], | |
| "data_offsets": [ | |
| 1246314496, | |
| 1249460224 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.6.ff.net.2.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1249460224, | |
| 1250246656 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.6.ff_context.net.0.proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1250246656, | |
| 1251033088 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.6.ff_context.net.0.proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 12288, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1251033088, | |
| 1254178816 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.6.ff_context.net.2.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 12288 | |
| ], | |
| "data_offsets": [ | |
| 1254178816, | |
| 1257324544 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.6.ff_context.net.2.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1257324544, | |
| 1258110976 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.6.norm1.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1258110976, | |
| 1258897408 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.6.norm1.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 18432, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1258897408, | |
| 1263616000 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.6.norm1_context.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1263616000, | |
| 1264402432 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.6.norm1_context.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 18432, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1264402432, | |
| 1269121024 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.7.attn.add_k_proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1269121024, | |
| 1269907456 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.7.attn.add_k_proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1269907456, | |
| 1270693888 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.7.attn.add_q_proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1270693888, | |
| 1271480320 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.7.attn.add_q_proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1271480320, | |
| 1272266752 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.7.attn.add_v_proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1272266752, | |
| 1273053184 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.7.attn.add_v_proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1273053184, | |
| 1273839616 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.7.attn.to_add_out.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1273839616, | |
| 1274626048 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.7.attn.to_add_out.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1274626048, | |
| 1275412480 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.7.attn.to_k.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1275412480, | |
| 1276198912 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.7.attn.to_k.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1276198912, | |
| 1276985344 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.7.attn.to_out.0.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1276985344, | |
| 1277771776 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.7.attn.to_out.0.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1277771776, | |
| 1278558208 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.7.attn.to_q.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1278558208, | |
| 1279344640 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.7.attn.to_q.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1279344640, | |
| 1280131072 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.7.attn.to_v.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1280131072, | |
| 1280917504 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.7.attn.to_v.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1280917504, | |
| 1281703936 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.7.ff.net.0.proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1281703936, | |
| 1282490368 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.7.ff.net.0.proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 12288, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1282490368, | |
| 1285636096 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.7.ff.net.2.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 12288 | |
| ], | |
| "data_offsets": [ | |
| 1285636096, | |
| 1288781824 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.7.ff.net.2.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1288781824, | |
| 1289568256 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.7.ff_context.net.0.proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1289568256, | |
| 1290354688 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.7.ff_context.net.0.proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 12288, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1290354688, | |
| 1293500416 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.7.ff_context.net.2.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 12288 | |
| ], | |
| "data_offsets": [ | |
| 1293500416, | |
| 1296646144 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.7.ff_context.net.2.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1296646144, | |
| 1297432576 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.7.norm1.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1297432576, | |
| 1298219008 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.7.norm1.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 18432, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1298219008, | |
| 1302937600 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.7.norm1_context.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1302937600, | |
| 1303724032 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.7.norm1_context.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 18432, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1303724032, | |
| 1308442624 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.8.attn.add_k_proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1308442624, | |
| 1309229056 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.8.attn.add_k_proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1309229056, | |
| 1310015488 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.8.attn.add_q_proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1310015488, | |
| 1310801920 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.8.attn.add_q_proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1310801920, | |
| 1311588352 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.8.attn.add_v_proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1311588352, | |
| 1312374784 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.8.attn.add_v_proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1312374784, | |
| 1313161216 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.8.attn.to_add_out.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1313161216, | |
| 1313947648 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.8.attn.to_add_out.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1313947648, | |
| 1314734080 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.8.attn.to_k.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1314734080, | |
| 1315520512 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.8.attn.to_k.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1315520512, | |
| 1316306944 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.8.attn.to_out.0.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1316306944, | |
| 1317093376 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.8.attn.to_out.0.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1317093376, | |
| 1317879808 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.8.attn.to_q.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1317879808, | |
| 1318666240 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.8.attn.to_q.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1318666240, | |
| 1319452672 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.8.attn.to_v.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1319452672, | |
| 1320239104 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.8.attn.to_v.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1320239104, | |
| 1321025536 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.8.ff.net.0.proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1321025536, | |
| 1321811968 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.8.ff.net.0.proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 12288, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1321811968, | |
| 1324957696 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.8.ff.net.2.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 12288 | |
| ], | |
| "data_offsets": [ | |
| 1324957696, | |
| 1328103424 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.8.ff.net.2.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1328103424, | |
| 1328889856 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.8.ff_context.net.0.proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1328889856, | |
| 1329676288 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.8.ff_context.net.0.proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 12288, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1329676288, | |
| 1332822016 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.8.ff_context.net.2.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 12288 | |
| ], | |
| "data_offsets": [ | |
| 1332822016, | |
| 1335967744 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.8.ff_context.net.2.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1335967744, | |
| 1336754176 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.8.norm1.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1336754176, | |
| 1337540608 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.8.norm1.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 18432, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1337540608, | |
| 1342259200 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.8.norm1_context.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1342259200, | |
| 1343045632 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.8.norm1_context.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 18432, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1343045632, | |
| 1347764224 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.9.attn.add_k_proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1347764224, | |
| 1348550656 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.9.attn.add_k_proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1348550656, | |
| 1349337088 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.9.attn.add_q_proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1349337088, | |
| 1350123520 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.9.attn.add_q_proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1350123520, | |
| 1350909952 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.9.attn.add_v_proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1350909952, | |
| 1351696384 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.9.attn.add_v_proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1351696384, | |
| 1352482816 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.9.attn.to_add_out.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1352482816, | |
| 1353269248 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.9.attn.to_add_out.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1353269248, | |
| 1354055680 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.9.attn.to_k.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1354055680, | |
| 1354842112 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.9.attn.to_k.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1354842112, | |
| 1355628544 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.9.attn.to_out.0.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1355628544, | |
| 1356414976 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.9.attn.to_out.0.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1356414976, | |
| 1357201408 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.9.attn.to_q.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1357201408, | |
| 1357987840 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.9.attn.to_q.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1357987840, | |
| 1358774272 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.9.attn.to_v.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1358774272, | |
| 1359560704 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.9.attn.to_v.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1359560704, | |
| 1360347136 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.9.ff.net.0.proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1360347136, | |
| 1361133568 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.9.ff.net.0.proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 12288, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1361133568, | |
| 1364279296 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.9.ff.net.2.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 12288 | |
| ], | |
| "data_offsets": [ | |
| 1364279296, | |
| 1367425024 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.9.ff.net.2.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1367425024, | |
| 1368211456 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.9.ff_context.net.0.proj.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1368211456, | |
| 1368997888 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.9.ff_context.net.0.proj.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 12288, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1368997888, | |
| 1372143616 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.9.ff_context.net.2.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 12288 | |
| ], | |
| "data_offsets": [ | |
| 1372143616, | |
| 1375289344 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.9.ff_context.net.2.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1375289344, | |
| 1376075776 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.9.norm1.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1376075776, | |
| 1376862208 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.9.norm1.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 18432, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1376862208, | |
| 1381580800 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.9.norm1_context.linear.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 3072 | |
| ], | |
| "data_offsets": [ | |
| 1381580800, | |
| 1382367232 | |
| ] | |
| }, | |
| "transformer.transformer_blocks.9.norm1_context.linear.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 18432, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1382367232, | |
| 1387085824 | |
| ] | |
| }, | |
| "transformer.x_embedder.lora_A.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 64, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1387085824, | |
| 1387102208 | |
| ] | |
| }, | |
| "transformer.x_embedder.lora_B.weight": { | |
| "dtype": "F32", | |
| "shape": [ | |
| 3072, | |
| 64 | |
| ], | |
| "data_offsets": [ | |
| 1387102208, | |
| 1387888640 | |
| ] | |
| } | |
| } |