MIR_ / layer_data /Hyper-FLUX.1-dev-8steps-lora.safetensors.json
exdysa's picture
Upload 423 files
726308e verified
{
"transformer.context_embedder.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
4096
],
"data_offsets": [
0,
1048576
]
},
"transformer.context_embedder.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1048576,
1835008
]
},
"transformer.norm_out.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1835008,
2621440
]
},
"transformer.norm_out.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
6144,
64
],
"data_offsets": [
2621440,
4194304
]
},
"transformer.proj_out.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
4194304,
4980736
]
},
"transformer.proj_out.lora_B.weight": {
"dtype": "F32",
"shape": [
64,
64
],
"data_offsets": [
4980736,
4997120
]
},
"transformer.single_transformer_blocks.0.attn.to_k.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
4997120,
5783552
]
},
"transformer.single_transformer_blocks.0.attn.to_k.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
5783552,
6569984
]
},
"transformer.single_transformer_blocks.0.attn.to_q.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
6569984,
7356416
]
},
"transformer.single_transformer_blocks.0.attn.to_q.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
7356416,
8142848
]
},
"transformer.single_transformer_blocks.0.attn.to_v.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
8142848,
8929280
]
},
"transformer.single_transformer_blocks.0.attn.to_v.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
8929280,
9715712
]
},
"transformer.single_transformer_blocks.0.norm.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
9715712,
10502144
]
},
"transformer.single_transformer_blocks.0.norm.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
9216,
64
],
"data_offsets": [
10502144,
12861440
]
},
"transformer.single_transformer_blocks.0.proj_mlp.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
12861440,
13647872
]
},
"transformer.single_transformer_blocks.0.proj_mlp.lora_B.weight": {
"dtype": "F32",
"shape": [
12288,
64
],
"data_offsets": [
13647872,
16793600
]
},
"transformer.single_transformer_blocks.0.proj_out.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
15360
],
"data_offsets": [
16793600,
20725760
]
},
"transformer.single_transformer_blocks.0.proj_out.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
20725760,
21512192
]
},
"transformer.single_transformer_blocks.1.attn.to_k.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
21512192,
22298624
]
},
"transformer.single_transformer_blocks.1.attn.to_k.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
22298624,
23085056
]
},
"transformer.single_transformer_blocks.1.attn.to_q.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
23085056,
23871488
]
},
"transformer.single_transformer_blocks.1.attn.to_q.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
23871488,
24657920
]
},
"transformer.single_transformer_blocks.1.attn.to_v.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
24657920,
25444352
]
},
"transformer.single_transformer_blocks.1.attn.to_v.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
25444352,
26230784
]
},
"transformer.single_transformer_blocks.1.norm.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
26230784,
27017216
]
},
"transformer.single_transformer_blocks.1.norm.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
9216,
64
],
"data_offsets": [
27017216,
29376512
]
},
"transformer.single_transformer_blocks.1.proj_mlp.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
29376512,
30162944
]
},
"transformer.single_transformer_blocks.1.proj_mlp.lora_B.weight": {
"dtype": "F32",
"shape": [
12288,
64
],
"data_offsets": [
30162944,
33308672
]
},
"transformer.single_transformer_blocks.1.proj_out.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
15360
],
"data_offsets": [
33308672,
37240832
]
},
"transformer.single_transformer_blocks.1.proj_out.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
37240832,
38027264
]
},
"transformer.single_transformer_blocks.10.attn.to_k.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
38027264,
38813696
]
},
"transformer.single_transformer_blocks.10.attn.to_k.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
38813696,
39600128
]
},
"transformer.single_transformer_blocks.10.attn.to_q.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
39600128,
40386560
]
},
"transformer.single_transformer_blocks.10.attn.to_q.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
40386560,
41172992
]
},
"transformer.single_transformer_blocks.10.attn.to_v.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
41172992,
41959424
]
},
"transformer.single_transformer_blocks.10.attn.to_v.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
41959424,
42745856
]
},
"transformer.single_transformer_blocks.10.norm.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
42745856,
43532288
]
},
"transformer.single_transformer_blocks.10.norm.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
9216,
64
],
"data_offsets": [
43532288,
45891584
]
},
"transformer.single_transformer_blocks.10.proj_mlp.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
45891584,
46678016
]
},
"transformer.single_transformer_blocks.10.proj_mlp.lora_B.weight": {
"dtype": "F32",
"shape": [
12288,
64
],
"data_offsets": [
46678016,
49823744
]
},
"transformer.single_transformer_blocks.10.proj_out.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
15360
],
"data_offsets": [
49823744,
53755904
]
},
"transformer.single_transformer_blocks.10.proj_out.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
53755904,
54542336
]
},
"transformer.single_transformer_blocks.11.attn.to_k.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
54542336,
55328768
]
},
"transformer.single_transformer_blocks.11.attn.to_k.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
55328768,
56115200
]
},
"transformer.single_transformer_blocks.11.attn.to_q.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
56115200,
56901632
]
},
"transformer.single_transformer_blocks.11.attn.to_q.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
56901632,
57688064
]
},
"transformer.single_transformer_blocks.11.attn.to_v.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
57688064,
58474496
]
},
"transformer.single_transformer_blocks.11.attn.to_v.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
58474496,
59260928
]
},
"transformer.single_transformer_blocks.11.norm.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
59260928,
60047360
]
},
"transformer.single_transformer_blocks.11.norm.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
9216,
64
],
"data_offsets": [
60047360,
62406656
]
},
"transformer.single_transformer_blocks.11.proj_mlp.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
62406656,
63193088
]
},
"transformer.single_transformer_blocks.11.proj_mlp.lora_B.weight": {
"dtype": "F32",
"shape": [
12288,
64
],
"data_offsets": [
63193088,
66338816
]
},
"transformer.single_transformer_blocks.11.proj_out.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
15360
],
"data_offsets": [
66338816,
70270976
]
},
"transformer.single_transformer_blocks.11.proj_out.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
70270976,
71057408
]
},
"transformer.single_transformer_blocks.12.attn.to_k.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
71057408,
71843840
]
},
"transformer.single_transformer_blocks.12.attn.to_k.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
71843840,
72630272
]
},
"transformer.single_transformer_blocks.12.attn.to_q.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
72630272,
73416704
]
},
"transformer.single_transformer_blocks.12.attn.to_q.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
73416704,
74203136
]
},
"transformer.single_transformer_blocks.12.attn.to_v.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
74203136,
74989568
]
},
"transformer.single_transformer_blocks.12.attn.to_v.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
74989568,
75776000
]
},
"transformer.single_transformer_blocks.12.norm.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
75776000,
76562432
]
},
"transformer.single_transformer_blocks.12.norm.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
9216,
64
],
"data_offsets": [
76562432,
78921728
]
},
"transformer.single_transformer_blocks.12.proj_mlp.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
78921728,
79708160
]
},
"transformer.single_transformer_blocks.12.proj_mlp.lora_B.weight": {
"dtype": "F32",
"shape": [
12288,
64
],
"data_offsets": [
79708160,
82853888
]
},
"transformer.single_transformer_blocks.12.proj_out.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
15360
],
"data_offsets": [
82853888,
86786048
]
},
"transformer.single_transformer_blocks.12.proj_out.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
86786048,
87572480
]
},
"transformer.single_transformer_blocks.13.attn.to_k.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
87572480,
88358912
]
},
"transformer.single_transformer_blocks.13.attn.to_k.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
88358912,
89145344
]
},
"transformer.single_transformer_blocks.13.attn.to_q.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
89145344,
89931776
]
},
"transformer.single_transformer_blocks.13.attn.to_q.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
89931776,
90718208
]
},
"transformer.single_transformer_blocks.13.attn.to_v.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
90718208,
91504640
]
},
"transformer.single_transformer_blocks.13.attn.to_v.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
91504640,
92291072
]
},
"transformer.single_transformer_blocks.13.norm.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
92291072,
93077504
]
},
"transformer.single_transformer_blocks.13.norm.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
9216,
64
],
"data_offsets": [
93077504,
95436800
]
},
"transformer.single_transformer_blocks.13.proj_mlp.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
95436800,
96223232
]
},
"transformer.single_transformer_blocks.13.proj_mlp.lora_B.weight": {
"dtype": "F32",
"shape": [
12288,
64
],
"data_offsets": [
96223232,
99368960
]
},
"transformer.single_transformer_blocks.13.proj_out.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
15360
],
"data_offsets": [
99368960,
103301120
]
},
"transformer.single_transformer_blocks.13.proj_out.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
103301120,
104087552
]
},
"transformer.single_transformer_blocks.14.attn.to_k.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
104087552,
104873984
]
},
"transformer.single_transformer_blocks.14.attn.to_k.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
104873984,
105660416
]
},
"transformer.single_transformer_blocks.14.attn.to_q.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
105660416,
106446848
]
},
"transformer.single_transformer_blocks.14.attn.to_q.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
106446848,
107233280
]
},
"transformer.single_transformer_blocks.14.attn.to_v.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
107233280,
108019712
]
},
"transformer.single_transformer_blocks.14.attn.to_v.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
108019712,
108806144
]
},
"transformer.single_transformer_blocks.14.norm.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
108806144,
109592576
]
},
"transformer.single_transformer_blocks.14.norm.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
9216,
64
],
"data_offsets": [
109592576,
111951872
]
},
"transformer.single_transformer_blocks.14.proj_mlp.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
111951872,
112738304
]
},
"transformer.single_transformer_blocks.14.proj_mlp.lora_B.weight": {
"dtype": "F32",
"shape": [
12288,
64
],
"data_offsets": [
112738304,
115884032
]
},
"transformer.single_transformer_blocks.14.proj_out.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
15360
],
"data_offsets": [
115884032,
119816192
]
},
"transformer.single_transformer_blocks.14.proj_out.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
119816192,
120602624
]
},
"transformer.single_transformer_blocks.15.attn.to_k.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
120602624,
121389056
]
},
"transformer.single_transformer_blocks.15.attn.to_k.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
121389056,
122175488
]
},
"transformer.single_transformer_blocks.15.attn.to_q.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
122175488,
122961920
]
},
"transformer.single_transformer_blocks.15.attn.to_q.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
122961920,
123748352
]
},
"transformer.single_transformer_blocks.15.attn.to_v.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
123748352,
124534784
]
},
"transformer.single_transformer_blocks.15.attn.to_v.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
124534784,
125321216
]
},
"transformer.single_transformer_blocks.15.norm.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
125321216,
126107648
]
},
"transformer.single_transformer_blocks.15.norm.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
9216,
64
],
"data_offsets": [
126107648,
128466944
]
},
"transformer.single_transformer_blocks.15.proj_mlp.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
128466944,
129253376
]
},
"transformer.single_transformer_blocks.15.proj_mlp.lora_B.weight": {
"dtype": "F32",
"shape": [
12288,
64
],
"data_offsets": [
129253376,
132399104
]
},
"transformer.single_transformer_blocks.15.proj_out.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
15360
],
"data_offsets": [
132399104,
136331264
]
},
"transformer.single_transformer_blocks.15.proj_out.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
136331264,
137117696
]
},
"transformer.single_transformer_blocks.16.attn.to_k.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
137117696,
137904128
]
},
"transformer.single_transformer_blocks.16.attn.to_k.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
137904128,
138690560
]
},
"transformer.single_transformer_blocks.16.attn.to_q.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
138690560,
139476992
]
},
"transformer.single_transformer_blocks.16.attn.to_q.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
139476992,
140263424
]
},
"transformer.single_transformer_blocks.16.attn.to_v.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
140263424,
141049856
]
},
"transformer.single_transformer_blocks.16.attn.to_v.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
141049856,
141836288
]
},
"transformer.single_transformer_blocks.16.norm.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
141836288,
142622720
]
},
"transformer.single_transformer_blocks.16.norm.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
9216,
64
],
"data_offsets": [
142622720,
144982016
]
},
"transformer.single_transformer_blocks.16.proj_mlp.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
144982016,
145768448
]
},
"transformer.single_transformer_blocks.16.proj_mlp.lora_B.weight": {
"dtype": "F32",
"shape": [
12288,
64
],
"data_offsets": [
145768448,
148914176
]
},
"transformer.single_transformer_blocks.16.proj_out.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
15360
],
"data_offsets": [
148914176,
152846336
]
},
"transformer.single_transformer_blocks.16.proj_out.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
152846336,
153632768
]
},
"transformer.single_transformer_blocks.17.attn.to_k.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
153632768,
154419200
]
},
"transformer.single_transformer_blocks.17.attn.to_k.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
154419200,
155205632
]
},
"transformer.single_transformer_blocks.17.attn.to_q.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
155205632,
155992064
]
},
"transformer.single_transformer_blocks.17.attn.to_q.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
155992064,
156778496
]
},
"transformer.single_transformer_blocks.17.attn.to_v.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
156778496,
157564928
]
},
"transformer.single_transformer_blocks.17.attn.to_v.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
157564928,
158351360
]
},
"transformer.single_transformer_blocks.17.norm.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
158351360,
159137792
]
},
"transformer.single_transformer_blocks.17.norm.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
9216,
64
],
"data_offsets": [
159137792,
161497088
]
},
"transformer.single_transformer_blocks.17.proj_mlp.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
161497088,
162283520
]
},
"transformer.single_transformer_blocks.17.proj_mlp.lora_B.weight": {
"dtype": "F32",
"shape": [
12288,
64
],
"data_offsets": [
162283520,
165429248
]
},
"transformer.single_transformer_blocks.17.proj_out.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
15360
],
"data_offsets": [
165429248,
169361408
]
},
"transformer.single_transformer_blocks.17.proj_out.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
169361408,
170147840
]
},
"transformer.single_transformer_blocks.18.attn.to_k.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
170147840,
170934272
]
},
"transformer.single_transformer_blocks.18.attn.to_k.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
170934272,
171720704
]
},
"transformer.single_transformer_blocks.18.attn.to_q.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
171720704,
172507136
]
},
"transformer.single_transformer_blocks.18.attn.to_q.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
172507136,
173293568
]
},
"transformer.single_transformer_blocks.18.attn.to_v.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
173293568,
174080000
]
},
"transformer.single_transformer_blocks.18.attn.to_v.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
174080000,
174866432
]
},
"transformer.single_transformer_blocks.18.norm.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
174866432,
175652864
]
},
"transformer.single_transformer_blocks.18.norm.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
9216,
64
],
"data_offsets": [
175652864,
178012160
]
},
"transformer.single_transformer_blocks.18.proj_mlp.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
178012160,
178798592
]
},
"transformer.single_transformer_blocks.18.proj_mlp.lora_B.weight": {
"dtype": "F32",
"shape": [
12288,
64
],
"data_offsets": [
178798592,
181944320
]
},
"transformer.single_transformer_blocks.18.proj_out.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
15360
],
"data_offsets": [
181944320,
185876480
]
},
"transformer.single_transformer_blocks.18.proj_out.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
185876480,
186662912
]
},
"transformer.single_transformer_blocks.19.attn.to_k.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
186662912,
187449344
]
},
"transformer.single_transformer_blocks.19.attn.to_k.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
187449344,
188235776
]
},
"transformer.single_transformer_blocks.19.attn.to_q.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
188235776,
189022208
]
},
"transformer.single_transformer_blocks.19.attn.to_q.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
189022208,
189808640
]
},
"transformer.single_transformer_blocks.19.attn.to_v.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
189808640,
190595072
]
},
"transformer.single_transformer_blocks.19.attn.to_v.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
190595072,
191381504
]
},
"transformer.single_transformer_blocks.19.norm.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
191381504,
192167936
]
},
"transformer.single_transformer_blocks.19.norm.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
9216,
64
],
"data_offsets": [
192167936,
194527232
]
},
"transformer.single_transformer_blocks.19.proj_mlp.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
194527232,
195313664
]
},
"transformer.single_transformer_blocks.19.proj_mlp.lora_B.weight": {
"dtype": "F32",
"shape": [
12288,
64
],
"data_offsets": [
195313664,
198459392
]
},
"transformer.single_transformer_blocks.19.proj_out.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
15360
],
"data_offsets": [
198459392,
202391552
]
},
"transformer.single_transformer_blocks.19.proj_out.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
202391552,
203177984
]
},
"transformer.single_transformer_blocks.2.attn.to_k.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
203177984,
203964416
]
},
"transformer.single_transformer_blocks.2.attn.to_k.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
203964416,
204750848
]
},
"transformer.single_transformer_blocks.2.attn.to_q.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
204750848,
205537280
]
},
"transformer.single_transformer_blocks.2.attn.to_q.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
205537280,
206323712
]
},
"transformer.single_transformer_blocks.2.attn.to_v.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
206323712,
207110144
]
},
"transformer.single_transformer_blocks.2.attn.to_v.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
207110144,
207896576
]
},
"transformer.single_transformer_blocks.2.norm.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
207896576,
208683008
]
},
"transformer.single_transformer_blocks.2.norm.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
9216,
64
],
"data_offsets": [
208683008,
211042304
]
},
"transformer.single_transformer_blocks.2.proj_mlp.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
211042304,
211828736
]
},
"transformer.single_transformer_blocks.2.proj_mlp.lora_B.weight": {
"dtype": "F32",
"shape": [
12288,
64
],
"data_offsets": [
211828736,
214974464
]
},
"transformer.single_transformer_blocks.2.proj_out.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
15360
],
"data_offsets": [
214974464,
218906624
]
},
"transformer.single_transformer_blocks.2.proj_out.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
218906624,
219693056
]
},
"transformer.single_transformer_blocks.20.attn.to_k.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
219693056,
220479488
]
},
"transformer.single_transformer_blocks.20.attn.to_k.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
220479488,
221265920
]
},
"transformer.single_transformer_blocks.20.attn.to_q.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
221265920,
222052352
]
},
"transformer.single_transformer_blocks.20.attn.to_q.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
222052352,
222838784
]
},
"transformer.single_transformer_blocks.20.attn.to_v.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
222838784,
223625216
]
},
"transformer.single_transformer_blocks.20.attn.to_v.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
223625216,
224411648
]
},
"transformer.single_transformer_blocks.20.norm.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
224411648,
225198080
]
},
"transformer.single_transformer_blocks.20.norm.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
9216,
64
],
"data_offsets": [
225198080,
227557376
]
},
"transformer.single_transformer_blocks.20.proj_mlp.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
227557376,
228343808
]
},
"transformer.single_transformer_blocks.20.proj_mlp.lora_B.weight": {
"dtype": "F32",
"shape": [
12288,
64
],
"data_offsets": [
228343808,
231489536
]
},
"transformer.single_transformer_blocks.20.proj_out.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
15360
],
"data_offsets": [
231489536,
235421696
]
},
"transformer.single_transformer_blocks.20.proj_out.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
235421696,
236208128
]
},
"transformer.single_transformer_blocks.21.attn.to_k.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
236208128,
236994560
]
},
"transformer.single_transformer_blocks.21.attn.to_k.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
236994560,
237780992
]
},
"transformer.single_transformer_blocks.21.attn.to_q.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
237780992,
238567424
]
},
"transformer.single_transformer_blocks.21.attn.to_q.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
238567424,
239353856
]
},
"transformer.single_transformer_blocks.21.attn.to_v.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
239353856,
240140288
]
},
"transformer.single_transformer_blocks.21.attn.to_v.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
240140288,
240926720
]
},
"transformer.single_transformer_blocks.21.norm.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
240926720,
241713152
]
},
"transformer.single_transformer_blocks.21.norm.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
9216,
64
],
"data_offsets": [
241713152,
244072448
]
},
"transformer.single_transformer_blocks.21.proj_mlp.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
244072448,
244858880
]
},
"transformer.single_transformer_blocks.21.proj_mlp.lora_B.weight": {
"dtype": "F32",
"shape": [
12288,
64
],
"data_offsets": [
244858880,
248004608
]
},
"transformer.single_transformer_blocks.21.proj_out.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
15360
],
"data_offsets": [
248004608,
251936768
]
},
"transformer.single_transformer_blocks.21.proj_out.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
251936768,
252723200
]
},
"transformer.single_transformer_blocks.22.attn.to_k.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
252723200,
253509632
]
},
"transformer.single_transformer_blocks.22.attn.to_k.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
253509632,
254296064
]
},
"transformer.single_transformer_blocks.22.attn.to_q.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
254296064,
255082496
]
},
"transformer.single_transformer_blocks.22.attn.to_q.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
255082496,
255868928
]
},
"transformer.single_transformer_blocks.22.attn.to_v.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
255868928,
256655360
]
},
"transformer.single_transformer_blocks.22.attn.to_v.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
256655360,
257441792
]
},
"transformer.single_transformer_blocks.22.norm.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
257441792,
258228224
]
},
"transformer.single_transformer_blocks.22.norm.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
9216,
64
],
"data_offsets": [
258228224,
260587520
]
},
"transformer.single_transformer_blocks.22.proj_mlp.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
260587520,
261373952
]
},
"transformer.single_transformer_blocks.22.proj_mlp.lora_B.weight": {
"dtype": "F32",
"shape": [
12288,
64
],
"data_offsets": [
261373952,
264519680
]
},
"transformer.single_transformer_blocks.22.proj_out.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
15360
],
"data_offsets": [
264519680,
268451840
]
},
"transformer.single_transformer_blocks.22.proj_out.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
268451840,
269238272
]
},
"transformer.single_transformer_blocks.23.attn.to_k.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
269238272,
270024704
]
},
"transformer.single_transformer_blocks.23.attn.to_k.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
270024704,
270811136
]
},
"transformer.single_transformer_blocks.23.attn.to_q.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
270811136,
271597568
]
},
"transformer.single_transformer_blocks.23.attn.to_q.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
271597568,
272384000
]
},
"transformer.single_transformer_blocks.23.attn.to_v.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
272384000,
273170432
]
},
"transformer.single_transformer_blocks.23.attn.to_v.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
273170432,
273956864
]
},
"transformer.single_transformer_blocks.23.norm.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
273956864,
274743296
]
},
"transformer.single_transformer_blocks.23.norm.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
9216,
64
],
"data_offsets": [
274743296,
277102592
]
},
"transformer.single_transformer_blocks.23.proj_mlp.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
277102592,
277889024
]
},
"transformer.single_transformer_blocks.23.proj_mlp.lora_B.weight": {
"dtype": "F32",
"shape": [
12288,
64
],
"data_offsets": [
277889024,
281034752
]
},
"transformer.single_transformer_blocks.23.proj_out.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
15360
],
"data_offsets": [
281034752,
284966912
]
},
"transformer.single_transformer_blocks.23.proj_out.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
284966912,
285753344
]
},
"transformer.single_transformer_blocks.24.attn.to_k.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
285753344,
286539776
]
},
"transformer.single_transformer_blocks.24.attn.to_k.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
286539776,
287326208
]
},
"transformer.single_transformer_blocks.24.attn.to_q.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
287326208,
288112640
]
},
"transformer.single_transformer_blocks.24.attn.to_q.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
288112640,
288899072
]
},
"transformer.single_transformer_blocks.24.attn.to_v.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
288899072,
289685504
]
},
"transformer.single_transformer_blocks.24.attn.to_v.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
289685504,
290471936
]
},
"transformer.single_transformer_blocks.24.norm.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
290471936,
291258368
]
},
"transformer.single_transformer_blocks.24.norm.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
9216,
64
],
"data_offsets": [
291258368,
293617664
]
},
"transformer.single_transformer_blocks.24.proj_mlp.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
293617664,
294404096
]
},
"transformer.single_transformer_blocks.24.proj_mlp.lora_B.weight": {
"dtype": "F32",
"shape": [
12288,
64
],
"data_offsets": [
294404096,
297549824
]
},
"transformer.single_transformer_blocks.24.proj_out.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
15360
],
"data_offsets": [
297549824,
301481984
]
},
"transformer.single_transformer_blocks.24.proj_out.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
301481984,
302268416
]
},
"transformer.single_transformer_blocks.25.attn.to_k.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
302268416,
303054848
]
},
"transformer.single_transformer_blocks.25.attn.to_k.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
303054848,
303841280
]
},
"transformer.single_transformer_blocks.25.attn.to_q.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
303841280,
304627712
]
},
"transformer.single_transformer_blocks.25.attn.to_q.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
304627712,
305414144
]
},
"transformer.single_transformer_blocks.25.attn.to_v.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
305414144,
306200576
]
},
"transformer.single_transformer_blocks.25.attn.to_v.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
306200576,
306987008
]
},
"transformer.single_transformer_blocks.25.norm.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
306987008,
307773440
]
},
"transformer.single_transformer_blocks.25.norm.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
9216,
64
],
"data_offsets": [
307773440,
310132736
]
},
"transformer.single_transformer_blocks.25.proj_mlp.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
310132736,
310919168
]
},
"transformer.single_transformer_blocks.25.proj_mlp.lora_B.weight": {
"dtype": "F32",
"shape": [
12288,
64
],
"data_offsets": [
310919168,
314064896
]
},
"transformer.single_transformer_blocks.25.proj_out.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
15360
],
"data_offsets": [
314064896,
317997056
]
},
"transformer.single_transformer_blocks.25.proj_out.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
317997056,
318783488
]
},
"transformer.single_transformer_blocks.26.attn.to_k.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
318783488,
319569920
]
},
"transformer.single_transformer_blocks.26.attn.to_k.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
319569920,
320356352
]
},
"transformer.single_transformer_blocks.26.attn.to_q.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
320356352,
321142784
]
},
"transformer.single_transformer_blocks.26.attn.to_q.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
321142784,
321929216
]
},
"transformer.single_transformer_blocks.26.attn.to_v.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
321929216,
322715648
]
},
"transformer.single_transformer_blocks.26.attn.to_v.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
322715648,
323502080
]
},
"transformer.single_transformer_blocks.26.norm.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
323502080,
324288512
]
},
"transformer.single_transformer_blocks.26.norm.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
9216,
64
],
"data_offsets": [
324288512,
326647808
]
},
"transformer.single_transformer_blocks.26.proj_mlp.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
326647808,
327434240
]
},
"transformer.single_transformer_blocks.26.proj_mlp.lora_B.weight": {
"dtype": "F32",
"shape": [
12288,
64
],
"data_offsets": [
327434240,
330579968
]
},
"transformer.single_transformer_blocks.26.proj_out.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
15360
],
"data_offsets": [
330579968,
334512128
]
},
"transformer.single_transformer_blocks.26.proj_out.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
334512128,
335298560
]
},
"transformer.single_transformer_blocks.27.attn.to_k.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
335298560,
336084992
]
},
"transformer.single_transformer_blocks.27.attn.to_k.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
336084992,
336871424
]
},
"transformer.single_transformer_blocks.27.attn.to_q.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
336871424,
337657856
]
},
"transformer.single_transformer_blocks.27.attn.to_q.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
337657856,
338444288
]
},
"transformer.single_transformer_blocks.27.attn.to_v.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
338444288,
339230720
]
},
"transformer.single_transformer_blocks.27.attn.to_v.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
339230720,
340017152
]
},
"transformer.single_transformer_blocks.27.norm.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
340017152,
340803584
]
},
"transformer.single_transformer_blocks.27.norm.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
9216,
64
],
"data_offsets": [
340803584,
343162880
]
},
"transformer.single_transformer_blocks.27.proj_mlp.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
343162880,
343949312
]
},
"transformer.single_transformer_blocks.27.proj_mlp.lora_B.weight": {
"dtype": "F32",
"shape": [
12288,
64
],
"data_offsets": [
343949312,
347095040
]
},
"transformer.single_transformer_blocks.27.proj_out.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
15360
],
"data_offsets": [
347095040,
351027200
]
},
"transformer.single_transformer_blocks.27.proj_out.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
351027200,
351813632
]
},
"transformer.single_transformer_blocks.28.attn.to_k.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
351813632,
352600064
]
},
"transformer.single_transformer_blocks.28.attn.to_k.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
352600064,
353386496
]
},
"transformer.single_transformer_blocks.28.attn.to_q.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
353386496,
354172928
]
},
"transformer.single_transformer_blocks.28.attn.to_q.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
354172928,
354959360
]
},
"transformer.single_transformer_blocks.28.attn.to_v.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
354959360,
355745792
]
},
"transformer.single_transformer_blocks.28.attn.to_v.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
355745792,
356532224
]
},
"transformer.single_transformer_blocks.28.norm.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
356532224,
357318656
]
},
"transformer.single_transformer_blocks.28.norm.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
9216,
64
],
"data_offsets": [
357318656,
359677952
]
},
"transformer.single_transformer_blocks.28.proj_mlp.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
359677952,
360464384
]
},
"transformer.single_transformer_blocks.28.proj_mlp.lora_B.weight": {
"dtype": "F32",
"shape": [
12288,
64
],
"data_offsets": [
360464384,
363610112
]
},
"transformer.single_transformer_blocks.28.proj_out.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
15360
],
"data_offsets": [
363610112,
367542272
]
},
"transformer.single_transformer_blocks.28.proj_out.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
367542272,
368328704
]
},
"transformer.single_transformer_blocks.29.attn.to_k.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
368328704,
369115136
]
},
"transformer.single_transformer_blocks.29.attn.to_k.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
369115136,
369901568
]
},
"transformer.single_transformer_blocks.29.attn.to_q.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
369901568,
370688000
]
},
"transformer.single_transformer_blocks.29.attn.to_q.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
370688000,
371474432
]
},
"transformer.single_transformer_blocks.29.attn.to_v.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
371474432,
372260864
]
},
"transformer.single_transformer_blocks.29.attn.to_v.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
372260864,
373047296
]
},
"transformer.single_transformer_blocks.29.norm.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
373047296,
373833728
]
},
"transformer.single_transformer_blocks.29.norm.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
9216,
64
],
"data_offsets": [
373833728,
376193024
]
},
"transformer.single_transformer_blocks.29.proj_mlp.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
376193024,
376979456
]
},
"transformer.single_transformer_blocks.29.proj_mlp.lora_B.weight": {
"dtype": "F32",
"shape": [
12288,
64
],
"data_offsets": [
376979456,
380125184
]
},
"transformer.single_transformer_blocks.29.proj_out.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
15360
],
"data_offsets": [
380125184,
384057344
]
},
"transformer.single_transformer_blocks.29.proj_out.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
384057344,
384843776
]
},
"transformer.single_transformer_blocks.3.attn.to_k.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
384843776,
385630208
]
},
"transformer.single_transformer_blocks.3.attn.to_k.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
385630208,
386416640
]
},
"transformer.single_transformer_blocks.3.attn.to_q.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
386416640,
387203072
]
},
"transformer.single_transformer_blocks.3.attn.to_q.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
387203072,
387989504
]
},
"transformer.single_transformer_blocks.3.attn.to_v.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
387989504,
388775936
]
},
"transformer.single_transformer_blocks.3.attn.to_v.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
388775936,
389562368
]
},
"transformer.single_transformer_blocks.3.norm.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
389562368,
390348800
]
},
"transformer.single_transformer_blocks.3.norm.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
9216,
64
],
"data_offsets": [
390348800,
392708096
]
},
"transformer.single_transformer_blocks.3.proj_mlp.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
392708096,
393494528
]
},
"transformer.single_transformer_blocks.3.proj_mlp.lora_B.weight": {
"dtype": "F32",
"shape": [
12288,
64
],
"data_offsets": [
393494528,
396640256
]
},
"transformer.single_transformer_blocks.3.proj_out.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
15360
],
"data_offsets": [
396640256,
400572416
]
},
"transformer.single_transformer_blocks.3.proj_out.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
400572416,
401358848
]
},
"transformer.single_transformer_blocks.30.attn.to_k.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
401358848,
402145280
]
},
"transformer.single_transformer_blocks.30.attn.to_k.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
402145280,
402931712
]
},
"transformer.single_transformer_blocks.30.attn.to_q.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
402931712,
403718144
]
},
"transformer.single_transformer_blocks.30.attn.to_q.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
403718144,
404504576
]
},
"transformer.single_transformer_blocks.30.attn.to_v.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
404504576,
405291008
]
},
"transformer.single_transformer_blocks.30.attn.to_v.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
405291008,
406077440
]
},
"transformer.single_transformer_blocks.30.norm.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
406077440,
406863872
]
},
"transformer.single_transformer_blocks.30.norm.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
9216,
64
],
"data_offsets": [
406863872,
409223168
]
},
"transformer.single_transformer_blocks.30.proj_mlp.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
409223168,
410009600
]
},
"transformer.single_transformer_blocks.30.proj_mlp.lora_B.weight": {
"dtype": "F32",
"shape": [
12288,
64
],
"data_offsets": [
410009600,
413155328
]
},
"transformer.single_transformer_blocks.30.proj_out.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
15360
],
"data_offsets": [
413155328,
417087488
]
},
"transformer.single_transformer_blocks.30.proj_out.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
417087488,
417873920
]
},
"transformer.single_transformer_blocks.31.attn.to_k.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
417873920,
418660352
]
},
"transformer.single_transformer_blocks.31.attn.to_k.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
418660352,
419446784
]
},
"transformer.single_transformer_blocks.31.attn.to_q.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
419446784,
420233216
]
},
"transformer.single_transformer_blocks.31.attn.to_q.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
420233216,
421019648
]
},
"transformer.single_transformer_blocks.31.attn.to_v.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
421019648,
421806080
]
},
"transformer.single_transformer_blocks.31.attn.to_v.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
421806080,
422592512
]
},
"transformer.single_transformer_blocks.31.norm.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
422592512,
423378944
]
},
"transformer.single_transformer_blocks.31.norm.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
9216,
64
],
"data_offsets": [
423378944,
425738240
]
},
"transformer.single_transformer_blocks.31.proj_mlp.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
425738240,
426524672
]
},
"transformer.single_transformer_blocks.31.proj_mlp.lora_B.weight": {
"dtype": "F32",
"shape": [
12288,
64
],
"data_offsets": [
426524672,
429670400
]
},
"transformer.single_transformer_blocks.31.proj_out.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
15360
],
"data_offsets": [
429670400,
433602560
]
},
"transformer.single_transformer_blocks.31.proj_out.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
433602560,
434388992
]
},
"transformer.single_transformer_blocks.32.attn.to_k.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
434388992,
435175424
]
},
"transformer.single_transformer_blocks.32.attn.to_k.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
435175424,
435961856
]
},
"transformer.single_transformer_blocks.32.attn.to_q.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
435961856,
436748288
]
},
"transformer.single_transformer_blocks.32.attn.to_q.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
436748288,
437534720
]
},
"transformer.single_transformer_blocks.32.attn.to_v.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
437534720,
438321152
]
},
"transformer.single_transformer_blocks.32.attn.to_v.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
438321152,
439107584
]
},
"transformer.single_transformer_blocks.32.norm.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
439107584,
439894016
]
},
"transformer.single_transformer_blocks.32.norm.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
9216,
64
],
"data_offsets": [
439894016,
442253312
]
},
"transformer.single_transformer_blocks.32.proj_mlp.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
442253312,
443039744
]
},
"transformer.single_transformer_blocks.32.proj_mlp.lora_B.weight": {
"dtype": "F32",
"shape": [
12288,
64
],
"data_offsets": [
443039744,
446185472
]
},
"transformer.single_transformer_blocks.32.proj_out.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
15360
],
"data_offsets": [
446185472,
450117632
]
},
"transformer.single_transformer_blocks.32.proj_out.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
450117632,
450904064
]
},
"transformer.single_transformer_blocks.33.attn.to_k.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
450904064,
451690496
]
},
"transformer.single_transformer_blocks.33.attn.to_k.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
451690496,
452476928
]
},
"transformer.single_transformer_blocks.33.attn.to_q.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
452476928,
453263360
]
},
"transformer.single_transformer_blocks.33.attn.to_q.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
453263360,
454049792
]
},
"transformer.single_transformer_blocks.33.attn.to_v.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
454049792,
454836224
]
},
"transformer.single_transformer_blocks.33.attn.to_v.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
454836224,
455622656
]
},
"transformer.single_transformer_blocks.33.norm.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
455622656,
456409088
]
},
"transformer.single_transformer_blocks.33.norm.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
9216,
64
],
"data_offsets": [
456409088,
458768384
]
},
"transformer.single_transformer_blocks.33.proj_mlp.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
458768384,
459554816
]
},
"transformer.single_transformer_blocks.33.proj_mlp.lora_B.weight": {
"dtype": "F32",
"shape": [
12288,
64
],
"data_offsets": [
459554816,
462700544
]
},
"transformer.single_transformer_blocks.33.proj_out.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
15360
],
"data_offsets": [
462700544,
466632704
]
},
"transformer.single_transformer_blocks.33.proj_out.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
466632704,
467419136
]
},
"transformer.single_transformer_blocks.34.attn.to_k.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
467419136,
468205568
]
},
"transformer.single_transformer_blocks.34.attn.to_k.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
468205568,
468992000
]
},
"transformer.single_transformer_blocks.34.attn.to_q.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
468992000,
469778432
]
},
"transformer.single_transformer_blocks.34.attn.to_q.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
469778432,
470564864
]
},
"transformer.single_transformer_blocks.34.attn.to_v.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
470564864,
471351296
]
},
"transformer.single_transformer_blocks.34.attn.to_v.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
471351296,
472137728
]
},
"transformer.single_transformer_blocks.34.norm.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
472137728,
472924160
]
},
"transformer.single_transformer_blocks.34.norm.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
9216,
64
],
"data_offsets": [
472924160,
475283456
]
},
"transformer.single_transformer_blocks.34.proj_mlp.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
475283456,
476069888
]
},
"transformer.single_transformer_blocks.34.proj_mlp.lora_B.weight": {
"dtype": "F32",
"shape": [
12288,
64
],
"data_offsets": [
476069888,
479215616
]
},
"transformer.single_transformer_blocks.34.proj_out.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
15360
],
"data_offsets": [
479215616,
483147776
]
},
"transformer.single_transformer_blocks.34.proj_out.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
483147776,
483934208
]
},
"transformer.single_transformer_blocks.35.attn.to_k.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
483934208,
484720640
]
},
"transformer.single_transformer_blocks.35.attn.to_k.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
484720640,
485507072
]
},
"transformer.single_transformer_blocks.35.attn.to_q.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
485507072,
486293504
]
},
"transformer.single_transformer_blocks.35.attn.to_q.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
486293504,
487079936
]
},
"transformer.single_transformer_blocks.35.attn.to_v.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
487079936,
487866368
]
},
"transformer.single_transformer_blocks.35.attn.to_v.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
487866368,
488652800
]
},
"transformer.single_transformer_blocks.35.norm.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
488652800,
489439232
]
},
"transformer.single_transformer_blocks.35.norm.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
9216,
64
],
"data_offsets": [
489439232,
491798528
]
},
"transformer.single_transformer_blocks.35.proj_mlp.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
491798528,
492584960
]
},
"transformer.single_transformer_blocks.35.proj_mlp.lora_B.weight": {
"dtype": "F32",
"shape": [
12288,
64
],
"data_offsets": [
492584960,
495730688
]
},
"transformer.single_transformer_blocks.35.proj_out.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
15360
],
"data_offsets": [
495730688,
499662848
]
},
"transformer.single_transformer_blocks.35.proj_out.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
499662848,
500449280
]
},
"transformer.single_transformer_blocks.36.attn.to_k.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
500449280,
501235712
]
},
"transformer.single_transformer_blocks.36.attn.to_k.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
501235712,
502022144
]
},
"transformer.single_transformer_blocks.36.attn.to_q.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
502022144,
502808576
]
},
"transformer.single_transformer_blocks.36.attn.to_q.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
502808576,
503595008
]
},
"transformer.single_transformer_blocks.36.attn.to_v.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
503595008,
504381440
]
},
"transformer.single_transformer_blocks.36.attn.to_v.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
504381440,
505167872
]
},
"transformer.single_transformer_blocks.36.norm.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
505167872,
505954304
]
},
"transformer.single_transformer_blocks.36.norm.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
9216,
64
],
"data_offsets": [
505954304,
508313600
]
},
"transformer.single_transformer_blocks.36.proj_mlp.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
508313600,
509100032
]
},
"transformer.single_transformer_blocks.36.proj_mlp.lora_B.weight": {
"dtype": "F32",
"shape": [
12288,
64
],
"data_offsets": [
509100032,
512245760
]
},
"transformer.single_transformer_blocks.36.proj_out.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
15360
],
"data_offsets": [
512245760,
516177920
]
},
"transformer.single_transformer_blocks.36.proj_out.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
516177920,
516964352
]
},
"transformer.single_transformer_blocks.37.attn.to_k.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
516964352,
517750784
]
},
"transformer.single_transformer_blocks.37.attn.to_k.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
517750784,
518537216
]
},
"transformer.single_transformer_blocks.37.attn.to_q.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
518537216,
519323648
]
},
"transformer.single_transformer_blocks.37.attn.to_q.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
519323648,
520110080
]
},
"transformer.single_transformer_blocks.37.attn.to_v.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
520110080,
520896512
]
},
"transformer.single_transformer_blocks.37.attn.to_v.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
520896512,
521682944
]
},
"transformer.single_transformer_blocks.37.norm.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
521682944,
522469376
]
},
"transformer.single_transformer_blocks.37.norm.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
9216,
64
],
"data_offsets": [
522469376,
524828672
]
},
"transformer.single_transformer_blocks.37.proj_mlp.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
524828672,
525615104
]
},
"transformer.single_transformer_blocks.37.proj_mlp.lora_B.weight": {
"dtype": "F32",
"shape": [
12288,
64
],
"data_offsets": [
525615104,
528760832
]
},
"transformer.single_transformer_blocks.37.proj_out.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
15360
],
"data_offsets": [
528760832,
532692992
]
},
"transformer.single_transformer_blocks.37.proj_out.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
532692992,
533479424
]
},
"transformer.single_transformer_blocks.4.attn.to_k.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
533479424,
534265856
]
},
"transformer.single_transformer_blocks.4.attn.to_k.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
534265856,
535052288
]
},
"transformer.single_transformer_blocks.4.attn.to_q.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
535052288,
535838720
]
},
"transformer.single_transformer_blocks.4.attn.to_q.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
535838720,
536625152
]
},
"transformer.single_transformer_blocks.4.attn.to_v.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
536625152,
537411584
]
},
"transformer.single_transformer_blocks.4.attn.to_v.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
537411584,
538198016
]
},
"transformer.single_transformer_blocks.4.norm.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
538198016,
538984448
]
},
"transformer.single_transformer_blocks.4.norm.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
9216,
64
],
"data_offsets": [
538984448,
541343744
]
},
"transformer.single_transformer_blocks.4.proj_mlp.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
541343744,
542130176
]
},
"transformer.single_transformer_blocks.4.proj_mlp.lora_B.weight": {
"dtype": "F32",
"shape": [
12288,
64
],
"data_offsets": [
542130176,
545275904
]
},
"transformer.single_transformer_blocks.4.proj_out.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
15360
],
"data_offsets": [
545275904,
549208064
]
},
"transformer.single_transformer_blocks.4.proj_out.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
549208064,
549994496
]
},
"transformer.single_transformer_blocks.5.attn.to_k.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
549994496,
550780928
]
},
"transformer.single_transformer_blocks.5.attn.to_k.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
550780928,
551567360
]
},
"transformer.single_transformer_blocks.5.attn.to_q.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
551567360,
552353792
]
},
"transformer.single_transformer_blocks.5.attn.to_q.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
552353792,
553140224
]
},
"transformer.single_transformer_blocks.5.attn.to_v.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
553140224,
553926656
]
},
"transformer.single_transformer_blocks.5.attn.to_v.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
553926656,
554713088
]
},
"transformer.single_transformer_blocks.5.norm.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
554713088,
555499520
]
},
"transformer.single_transformer_blocks.5.norm.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
9216,
64
],
"data_offsets": [
555499520,
557858816
]
},
"transformer.single_transformer_blocks.5.proj_mlp.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
557858816,
558645248
]
},
"transformer.single_transformer_blocks.5.proj_mlp.lora_B.weight": {
"dtype": "F32",
"shape": [
12288,
64
],
"data_offsets": [
558645248,
561790976
]
},
"transformer.single_transformer_blocks.5.proj_out.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
15360
],
"data_offsets": [
561790976,
565723136
]
},
"transformer.single_transformer_blocks.5.proj_out.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
565723136,
566509568
]
},
"transformer.single_transformer_blocks.6.attn.to_k.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
566509568,
567296000
]
},
"transformer.single_transformer_blocks.6.attn.to_k.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
567296000,
568082432
]
},
"transformer.single_transformer_blocks.6.attn.to_q.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
568082432,
568868864
]
},
"transformer.single_transformer_blocks.6.attn.to_q.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
568868864,
569655296
]
},
"transformer.single_transformer_blocks.6.attn.to_v.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
569655296,
570441728
]
},
"transformer.single_transformer_blocks.6.attn.to_v.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
570441728,
571228160
]
},
"transformer.single_transformer_blocks.6.norm.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
571228160,
572014592
]
},
"transformer.single_transformer_blocks.6.norm.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
9216,
64
],
"data_offsets": [
572014592,
574373888
]
},
"transformer.single_transformer_blocks.6.proj_mlp.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
574373888,
575160320
]
},
"transformer.single_transformer_blocks.6.proj_mlp.lora_B.weight": {
"dtype": "F32",
"shape": [
12288,
64
],
"data_offsets": [
575160320,
578306048
]
},
"transformer.single_transformer_blocks.6.proj_out.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
15360
],
"data_offsets": [
578306048,
582238208
]
},
"transformer.single_transformer_blocks.6.proj_out.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
582238208,
583024640
]
},
"transformer.single_transformer_blocks.7.attn.to_k.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
583024640,
583811072
]
},
"transformer.single_transformer_blocks.7.attn.to_k.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
583811072,
584597504
]
},
"transformer.single_transformer_blocks.7.attn.to_q.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
584597504,
585383936
]
},
"transformer.single_transformer_blocks.7.attn.to_q.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
585383936,
586170368
]
},
"transformer.single_transformer_blocks.7.attn.to_v.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
586170368,
586956800
]
},
"transformer.single_transformer_blocks.7.attn.to_v.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
586956800,
587743232
]
},
"transformer.single_transformer_blocks.7.norm.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
587743232,
588529664
]
},
"transformer.single_transformer_blocks.7.norm.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
9216,
64
],
"data_offsets": [
588529664,
590888960
]
},
"transformer.single_transformer_blocks.7.proj_mlp.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
590888960,
591675392
]
},
"transformer.single_transformer_blocks.7.proj_mlp.lora_B.weight": {
"dtype": "F32",
"shape": [
12288,
64
],
"data_offsets": [
591675392,
594821120
]
},
"transformer.single_transformer_blocks.7.proj_out.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
15360
],
"data_offsets": [
594821120,
598753280
]
},
"transformer.single_transformer_blocks.7.proj_out.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
598753280,
599539712
]
},
"transformer.single_transformer_blocks.8.attn.to_k.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
599539712,
600326144
]
},
"transformer.single_transformer_blocks.8.attn.to_k.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
600326144,
601112576
]
},
"transformer.single_transformer_blocks.8.attn.to_q.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
601112576,
601899008
]
},
"transformer.single_transformer_blocks.8.attn.to_q.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
601899008,
602685440
]
},
"transformer.single_transformer_blocks.8.attn.to_v.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
602685440,
603471872
]
},
"transformer.single_transformer_blocks.8.attn.to_v.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
603471872,
604258304
]
},
"transformer.single_transformer_blocks.8.norm.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
604258304,
605044736
]
},
"transformer.single_transformer_blocks.8.norm.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
9216,
64
],
"data_offsets": [
605044736,
607404032
]
},
"transformer.single_transformer_blocks.8.proj_mlp.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
607404032,
608190464
]
},
"transformer.single_transformer_blocks.8.proj_mlp.lora_B.weight": {
"dtype": "F32",
"shape": [
12288,
64
],
"data_offsets": [
608190464,
611336192
]
},
"transformer.single_transformer_blocks.8.proj_out.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
15360
],
"data_offsets": [
611336192,
615268352
]
},
"transformer.single_transformer_blocks.8.proj_out.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
615268352,
616054784
]
},
"transformer.single_transformer_blocks.9.attn.to_k.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
616054784,
616841216
]
},
"transformer.single_transformer_blocks.9.attn.to_k.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
616841216,
617627648
]
},
"transformer.single_transformer_blocks.9.attn.to_q.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
617627648,
618414080
]
},
"transformer.single_transformer_blocks.9.attn.to_q.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
618414080,
619200512
]
},
"transformer.single_transformer_blocks.9.attn.to_v.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
619200512,
619986944
]
},
"transformer.single_transformer_blocks.9.attn.to_v.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
619986944,
620773376
]
},
"transformer.single_transformer_blocks.9.norm.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
620773376,
621559808
]
},
"transformer.single_transformer_blocks.9.norm.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
9216,
64
],
"data_offsets": [
621559808,
623919104
]
},
"transformer.single_transformer_blocks.9.proj_mlp.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
623919104,
624705536
]
},
"transformer.single_transformer_blocks.9.proj_mlp.lora_B.weight": {
"dtype": "F32",
"shape": [
12288,
64
],
"data_offsets": [
624705536,
627851264
]
},
"transformer.single_transformer_blocks.9.proj_out.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
15360
],
"data_offsets": [
627851264,
631783424
]
},
"transformer.single_transformer_blocks.9.proj_out.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
631783424,
632569856
]
},
"transformer.time_text_embed.guidance_embedder.linear_1.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
256
],
"data_offsets": [
632569856,
632635392
]
},
"transformer.time_text_embed.guidance_embedder.linear_1.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
632635392,
633421824
]
},
"transformer.time_text_embed.guidance_embedder.linear_2.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
633421824,
634208256
]
},
"transformer.time_text_embed.guidance_embedder.linear_2.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
634208256,
634994688
]
},
"transformer.time_text_embed.text_embedder.linear_1.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
768
],
"data_offsets": [
634994688,
635191296
]
},
"transformer.time_text_embed.text_embedder.linear_1.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
635191296,
635977728
]
},
"transformer.time_text_embed.text_embedder.linear_2.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
635977728,
636764160
]
},
"transformer.time_text_embed.text_embedder.linear_2.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
636764160,
637550592
]
},
"transformer.time_text_embed.timestep_embedder.linear_1.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
256
],
"data_offsets": [
637550592,
637616128
]
},
"transformer.time_text_embed.timestep_embedder.linear_1.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
637616128,
638402560
]
},
"transformer.time_text_embed.timestep_embedder.linear_2.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
638402560,
639188992
]
},
"transformer.time_text_embed.timestep_embedder.linear_2.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
639188992,
639975424
]
},
"transformer.transformer_blocks.0.attn.add_k_proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
639975424,
640761856
]
},
"transformer.transformer_blocks.0.attn.add_k_proj.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
640761856,
641548288
]
},
"transformer.transformer_blocks.0.attn.add_q_proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
641548288,
642334720
]
},
"transformer.transformer_blocks.0.attn.add_q_proj.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
642334720,
643121152
]
},
"transformer.transformer_blocks.0.attn.add_v_proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
643121152,
643907584
]
},
"transformer.transformer_blocks.0.attn.add_v_proj.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
643907584,
644694016
]
},
"transformer.transformer_blocks.0.attn.to_add_out.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
644694016,
645480448
]
},
"transformer.transformer_blocks.0.attn.to_add_out.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
645480448,
646266880
]
},
"transformer.transformer_blocks.0.attn.to_k.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
646266880,
647053312
]
},
"transformer.transformer_blocks.0.attn.to_k.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
647053312,
647839744
]
},
"transformer.transformer_blocks.0.attn.to_out.0.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
647839744,
648626176
]
},
"transformer.transformer_blocks.0.attn.to_out.0.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
648626176,
649412608
]
},
"transformer.transformer_blocks.0.attn.to_q.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
649412608,
650199040
]
},
"transformer.transformer_blocks.0.attn.to_q.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
650199040,
650985472
]
},
"transformer.transformer_blocks.0.attn.to_v.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
650985472,
651771904
]
},
"transformer.transformer_blocks.0.attn.to_v.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
651771904,
652558336
]
},
"transformer.transformer_blocks.0.ff.net.0.proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
652558336,
653344768
]
},
"transformer.transformer_blocks.0.ff.net.0.proj.lora_B.weight": {
"dtype": "F32",
"shape": [
12288,
64
],
"data_offsets": [
653344768,
656490496
]
},
"transformer.transformer_blocks.0.ff.net.2.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
12288
],
"data_offsets": [
656490496,
659636224
]
},
"transformer.transformer_blocks.0.ff.net.2.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
659636224,
660422656
]
},
"transformer.transformer_blocks.0.ff_context.net.0.proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
660422656,
661209088
]
},
"transformer.transformer_blocks.0.ff_context.net.0.proj.lora_B.weight": {
"dtype": "F32",
"shape": [
12288,
64
],
"data_offsets": [
661209088,
664354816
]
},
"transformer.transformer_blocks.0.ff_context.net.2.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
12288
],
"data_offsets": [
664354816,
667500544
]
},
"transformer.transformer_blocks.0.ff_context.net.2.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
667500544,
668286976
]
},
"transformer.transformer_blocks.0.norm1.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
668286976,
669073408
]
},
"transformer.transformer_blocks.0.norm1.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
18432,
64
],
"data_offsets": [
669073408,
673792000
]
},
"transformer.transformer_blocks.0.norm1_context.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
673792000,
674578432
]
},
"transformer.transformer_blocks.0.norm1_context.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
18432,
64
],
"data_offsets": [
674578432,
679297024
]
},
"transformer.transformer_blocks.1.attn.add_k_proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
679297024,
680083456
]
},
"transformer.transformer_blocks.1.attn.add_k_proj.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
680083456,
680869888
]
},
"transformer.transformer_blocks.1.attn.add_q_proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
680869888,
681656320
]
},
"transformer.transformer_blocks.1.attn.add_q_proj.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
681656320,
682442752
]
},
"transformer.transformer_blocks.1.attn.add_v_proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
682442752,
683229184
]
},
"transformer.transformer_blocks.1.attn.add_v_proj.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
683229184,
684015616
]
},
"transformer.transformer_blocks.1.attn.to_add_out.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
684015616,
684802048
]
},
"transformer.transformer_blocks.1.attn.to_add_out.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
684802048,
685588480
]
},
"transformer.transformer_blocks.1.attn.to_k.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
685588480,
686374912
]
},
"transformer.transformer_blocks.1.attn.to_k.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
686374912,
687161344
]
},
"transformer.transformer_blocks.1.attn.to_out.0.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
687161344,
687947776
]
},
"transformer.transformer_blocks.1.attn.to_out.0.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
687947776,
688734208
]
},
"transformer.transformer_blocks.1.attn.to_q.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
688734208,
689520640
]
},
"transformer.transformer_blocks.1.attn.to_q.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
689520640,
690307072
]
},
"transformer.transformer_blocks.1.attn.to_v.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
690307072,
691093504
]
},
"transformer.transformer_blocks.1.attn.to_v.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
691093504,
691879936
]
},
"transformer.transformer_blocks.1.ff.net.0.proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
691879936,
692666368
]
},
"transformer.transformer_blocks.1.ff.net.0.proj.lora_B.weight": {
"dtype": "F32",
"shape": [
12288,
64
],
"data_offsets": [
692666368,
695812096
]
},
"transformer.transformer_blocks.1.ff.net.2.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
12288
],
"data_offsets": [
695812096,
698957824
]
},
"transformer.transformer_blocks.1.ff.net.2.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
698957824,
699744256
]
},
"transformer.transformer_blocks.1.ff_context.net.0.proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
699744256,
700530688
]
},
"transformer.transformer_blocks.1.ff_context.net.0.proj.lora_B.weight": {
"dtype": "F32",
"shape": [
12288,
64
],
"data_offsets": [
700530688,
703676416
]
},
"transformer.transformer_blocks.1.ff_context.net.2.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
12288
],
"data_offsets": [
703676416,
706822144
]
},
"transformer.transformer_blocks.1.ff_context.net.2.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
706822144,
707608576
]
},
"transformer.transformer_blocks.1.norm1.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
707608576,
708395008
]
},
"transformer.transformer_blocks.1.norm1.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
18432,
64
],
"data_offsets": [
708395008,
713113600
]
},
"transformer.transformer_blocks.1.norm1_context.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
713113600,
713900032
]
},
"transformer.transformer_blocks.1.norm1_context.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
18432,
64
],
"data_offsets": [
713900032,
718618624
]
},
"transformer.transformer_blocks.10.attn.add_k_proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
718618624,
719405056
]
},
"transformer.transformer_blocks.10.attn.add_k_proj.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
719405056,
720191488
]
},
"transformer.transformer_blocks.10.attn.add_q_proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
720191488,
720977920
]
},
"transformer.transformer_blocks.10.attn.add_q_proj.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
720977920,
721764352
]
},
"transformer.transformer_blocks.10.attn.add_v_proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
721764352,
722550784
]
},
"transformer.transformer_blocks.10.attn.add_v_proj.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
722550784,
723337216
]
},
"transformer.transformer_blocks.10.attn.to_add_out.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
723337216,
724123648
]
},
"transformer.transformer_blocks.10.attn.to_add_out.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
724123648,
724910080
]
},
"transformer.transformer_blocks.10.attn.to_k.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
724910080,
725696512
]
},
"transformer.transformer_blocks.10.attn.to_k.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
725696512,
726482944
]
},
"transformer.transformer_blocks.10.attn.to_out.0.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
726482944,
727269376
]
},
"transformer.transformer_blocks.10.attn.to_out.0.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
727269376,
728055808
]
},
"transformer.transformer_blocks.10.attn.to_q.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
728055808,
728842240
]
},
"transformer.transformer_blocks.10.attn.to_q.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
728842240,
729628672
]
},
"transformer.transformer_blocks.10.attn.to_v.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
729628672,
730415104
]
},
"transformer.transformer_blocks.10.attn.to_v.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
730415104,
731201536
]
},
"transformer.transformer_blocks.10.ff.net.0.proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
731201536,
731987968
]
},
"transformer.transformer_blocks.10.ff.net.0.proj.lora_B.weight": {
"dtype": "F32",
"shape": [
12288,
64
],
"data_offsets": [
731987968,
735133696
]
},
"transformer.transformer_blocks.10.ff.net.2.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
12288
],
"data_offsets": [
735133696,
738279424
]
},
"transformer.transformer_blocks.10.ff.net.2.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
738279424,
739065856
]
},
"transformer.transformer_blocks.10.ff_context.net.0.proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
739065856,
739852288
]
},
"transformer.transformer_blocks.10.ff_context.net.0.proj.lora_B.weight": {
"dtype": "F32",
"shape": [
12288,
64
],
"data_offsets": [
739852288,
742998016
]
},
"transformer.transformer_blocks.10.ff_context.net.2.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
12288
],
"data_offsets": [
742998016,
746143744
]
},
"transformer.transformer_blocks.10.ff_context.net.2.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
746143744,
746930176
]
},
"transformer.transformer_blocks.10.norm1.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
746930176,
747716608
]
},
"transformer.transformer_blocks.10.norm1.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
18432,
64
],
"data_offsets": [
747716608,
752435200
]
},
"transformer.transformer_blocks.10.norm1_context.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
752435200,
753221632
]
},
"transformer.transformer_blocks.10.norm1_context.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
18432,
64
],
"data_offsets": [
753221632,
757940224
]
},
"transformer.transformer_blocks.11.attn.add_k_proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
757940224,
758726656
]
},
"transformer.transformer_blocks.11.attn.add_k_proj.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
758726656,
759513088
]
},
"transformer.transformer_blocks.11.attn.add_q_proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
759513088,
760299520
]
},
"transformer.transformer_blocks.11.attn.add_q_proj.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
760299520,
761085952
]
},
"transformer.transformer_blocks.11.attn.add_v_proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
761085952,
761872384
]
},
"transformer.transformer_blocks.11.attn.add_v_proj.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
761872384,
762658816
]
},
"transformer.transformer_blocks.11.attn.to_add_out.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
762658816,
763445248
]
},
"transformer.transformer_blocks.11.attn.to_add_out.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
763445248,
764231680
]
},
"transformer.transformer_blocks.11.attn.to_k.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
764231680,
765018112
]
},
"transformer.transformer_blocks.11.attn.to_k.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
765018112,
765804544
]
},
"transformer.transformer_blocks.11.attn.to_out.0.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
765804544,
766590976
]
},
"transformer.transformer_blocks.11.attn.to_out.0.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
766590976,
767377408
]
},
"transformer.transformer_blocks.11.attn.to_q.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
767377408,
768163840
]
},
"transformer.transformer_blocks.11.attn.to_q.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
768163840,
768950272
]
},
"transformer.transformer_blocks.11.attn.to_v.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
768950272,
769736704
]
},
"transformer.transformer_blocks.11.attn.to_v.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
769736704,
770523136
]
},
"transformer.transformer_blocks.11.ff.net.0.proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
770523136,
771309568
]
},
"transformer.transformer_blocks.11.ff.net.0.proj.lora_B.weight": {
"dtype": "F32",
"shape": [
12288,
64
],
"data_offsets": [
771309568,
774455296
]
},
"transformer.transformer_blocks.11.ff.net.2.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
12288
],
"data_offsets": [
774455296,
777601024
]
},
"transformer.transformer_blocks.11.ff.net.2.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
777601024,
778387456
]
},
"transformer.transformer_blocks.11.ff_context.net.0.proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
778387456,
779173888
]
},
"transformer.transformer_blocks.11.ff_context.net.0.proj.lora_B.weight": {
"dtype": "F32",
"shape": [
12288,
64
],
"data_offsets": [
779173888,
782319616
]
},
"transformer.transformer_blocks.11.ff_context.net.2.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
12288
],
"data_offsets": [
782319616,
785465344
]
},
"transformer.transformer_blocks.11.ff_context.net.2.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
785465344,
786251776
]
},
"transformer.transformer_blocks.11.norm1.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
786251776,
787038208
]
},
"transformer.transformer_blocks.11.norm1.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
18432,
64
],
"data_offsets": [
787038208,
791756800
]
},
"transformer.transformer_blocks.11.norm1_context.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
791756800,
792543232
]
},
"transformer.transformer_blocks.11.norm1_context.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
18432,
64
],
"data_offsets": [
792543232,
797261824
]
},
"transformer.transformer_blocks.12.attn.add_k_proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
797261824,
798048256
]
},
"transformer.transformer_blocks.12.attn.add_k_proj.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
798048256,
798834688
]
},
"transformer.transformer_blocks.12.attn.add_q_proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
798834688,
799621120
]
},
"transformer.transformer_blocks.12.attn.add_q_proj.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
799621120,
800407552
]
},
"transformer.transformer_blocks.12.attn.add_v_proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
800407552,
801193984
]
},
"transformer.transformer_blocks.12.attn.add_v_proj.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
801193984,
801980416
]
},
"transformer.transformer_blocks.12.attn.to_add_out.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
801980416,
802766848
]
},
"transformer.transformer_blocks.12.attn.to_add_out.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
802766848,
803553280
]
},
"transformer.transformer_blocks.12.attn.to_k.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
803553280,
804339712
]
},
"transformer.transformer_blocks.12.attn.to_k.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
804339712,
805126144
]
},
"transformer.transformer_blocks.12.attn.to_out.0.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
805126144,
805912576
]
},
"transformer.transformer_blocks.12.attn.to_out.0.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
805912576,
806699008
]
},
"transformer.transformer_blocks.12.attn.to_q.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
806699008,
807485440
]
},
"transformer.transformer_blocks.12.attn.to_q.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
807485440,
808271872
]
},
"transformer.transformer_blocks.12.attn.to_v.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
808271872,
809058304
]
},
"transformer.transformer_blocks.12.attn.to_v.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
809058304,
809844736
]
},
"transformer.transformer_blocks.12.ff.net.0.proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
809844736,
810631168
]
},
"transformer.transformer_blocks.12.ff.net.0.proj.lora_B.weight": {
"dtype": "F32",
"shape": [
12288,
64
],
"data_offsets": [
810631168,
813776896
]
},
"transformer.transformer_blocks.12.ff.net.2.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
12288
],
"data_offsets": [
813776896,
816922624
]
},
"transformer.transformer_blocks.12.ff.net.2.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
816922624,
817709056
]
},
"transformer.transformer_blocks.12.ff_context.net.0.proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
817709056,
818495488
]
},
"transformer.transformer_blocks.12.ff_context.net.0.proj.lora_B.weight": {
"dtype": "F32",
"shape": [
12288,
64
],
"data_offsets": [
818495488,
821641216
]
},
"transformer.transformer_blocks.12.ff_context.net.2.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
12288
],
"data_offsets": [
821641216,
824786944
]
},
"transformer.transformer_blocks.12.ff_context.net.2.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
824786944,
825573376
]
},
"transformer.transformer_blocks.12.norm1.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
825573376,
826359808
]
},
"transformer.transformer_blocks.12.norm1.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
18432,
64
],
"data_offsets": [
826359808,
831078400
]
},
"transformer.transformer_blocks.12.norm1_context.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
831078400,
831864832
]
},
"transformer.transformer_blocks.12.norm1_context.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
18432,
64
],
"data_offsets": [
831864832,
836583424
]
},
"transformer.transformer_blocks.13.attn.add_k_proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
836583424,
837369856
]
},
"transformer.transformer_blocks.13.attn.add_k_proj.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
837369856,
838156288
]
},
"transformer.transformer_blocks.13.attn.add_q_proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
838156288,
838942720
]
},
"transformer.transformer_blocks.13.attn.add_q_proj.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
838942720,
839729152
]
},
"transformer.transformer_blocks.13.attn.add_v_proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
839729152,
840515584
]
},
"transformer.transformer_blocks.13.attn.add_v_proj.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
840515584,
841302016
]
},
"transformer.transformer_blocks.13.attn.to_add_out.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
841302016,
842088448
]
},
"transformer.transformer_blocks.13.attn.to_add_out.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
842088448,
842874880
]
},
"transformer.transformer_blocks.13.attn.to_k.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
842874880,
843661312
]
},
"transformer.transformer_blocks.13.attn.to_k.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
843661312,
844447744
]
},
"transformer.transformer_blocks.13.attn.to_out.0.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
844447744,
845234176
]
},
"transformer.transformer_blocks.13.attn.to_out.0.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
845234176,
846020608
]
},
"transformer.transformer_blocks.13.attn.to_q.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
846020608,
846807040
]
},
"transformer.transformer_blocks.13.attn.to_q.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
846807040,
847593472
]
},
"transformer.transformer_blocks.13.attn.to_v.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
847593472,
848379904
]
},
"transformer.transformer_blocks.13.attn.to_v.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
848379904,
849166336
]
},
"transformer.transformer_blocks.13.ff.net.0.proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
849166336,
849952768
]
},
"transformer.transformer_blocks.13.ff.net.0.proj.lora_B.weight": {
"dtype": "F32",
"shape": [
12288,
64
],
"data_offsets": [
849952768,
853098496
]
},
"transformer.transformer_blocks.13.ff.net.2.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
12288
],
"data_offsets": [
853098496,
856244224
]
},
"transformer.transformer_blocks.13.ff.net.2.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
856244224,
857030656
]
},
"transformer.transformer_blocks.13.ff_context.net.0.proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
857030656,
857817088
]
},
"transformer.transformer_blocks.13.ff_context.net.0.proj.lora_B.weight": {
"dtype": "F32",
"shape": [
12288,
64
],
"data_offsets": [
857817088,
860962816
]
},
"transformer.transformer_blocks.13.ff_context.net.2.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
12288
],
"data_offsets": [
860962816,
864108544
]
},
"transformer.transformer_blocks.13.ff_context.net.2.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
864108544,
864894976
]
},
"transformer.transformer_blocks.13.norm1.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
864894976,
865681408
]
},
"transformer.transformer_blocks.13.norm1.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
18432,
64
],
"data_offsets": [
865681408,
870400000
]
},
"transformer.transformer_blocks.13.norm1_context.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
870400000,
871186432
]
},
"transformer.transformer_blocks.13.norm1_context.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
18432,
64
],
"data_offsets": [
871186432,
875905024
]
},
"transformer.transformer_blocks.14.attn.add_k_proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
875905024,
876691456
]
},
"transformer.transformer_blocks.14.attn.add_k_proj.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
876691456,
877477888
]
},
"transformer.transformer_blocks.14.attn.add_q_proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
877477888,
878264320
]
},
"transformer.transformer_blocks.14.attn.add_q_proj.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
878264320,
879050752
]
},
"transformer.transformer_blocks.14.attn.add_v_proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
879050752,
879837184
]
},
"transformer.transformer_blocks.14.attn.add_v_proj.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
879837184,
880623616
]
},
"transformer.transformer_blocks.14.attn.to_add_out.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
880623616,
881410048
]
},
"transformer.transformer_blocks.14.attn.to_add_out.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
881410048,
882196480
]
},
"transformer.transformer_blocks.14.attn.to_k.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
882196480,
882982912
]
},
"transformer.transformer_blocks.14.attn.to_k.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
882982912,
883769344
]
},
"transformer.transformer_blocks.14.attn.to_out.0.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
883769344,
884555776
]
},
"transformer.transformer_blocks.14.attn.to_out.0.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
884555776,
885342208
]
},
"transformer.transformer_blocks.14.attn.to_q.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
885342208,
886128640
]
},
"transformer.transformer_blocks.14.attn.to_q.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
886128640,
886915072
]
},
"transformer.transformer_blocks.14.attn.to_v.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
886915072,
887701504
]
},
"transformer.transformer_blocks.14.attn.to_v.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
887701504,
888487936
]
},
"transformer.transformer_blocks.14.ff.net.0.proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
888487936,
889274368
]
},
"transformer.transformer_blocks.14.ff.net.0.proj.lora_B.weight": {
"dtype": "F32",
"shape": [
12288,
64
],
"data_offsets": [
889274368,
892420096
]
},
"transformer.transformer_blocks.14.ff.net.2.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
12288
],
"data_offsets": [
892420096,
895565824
]
},
"transformer.transformer_blocks.14.ff.net.2.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
895565824,
896352256
]
},
"transformer.transformer_blocks.14.ff_context.net.0.proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
896352256,
897138688
]
},
"transformer.transformer_blocks.14.ff_context.net.0.proj.lora_B.weight": {
"dtype": "F32",
"shape": [
12288,
64
],
"data_offsets": [
897138688,
900284416
]
},
"transformer.transformer_blocks.14.ff_context.net.2.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
12288
],
"data_offsets": [
900284416,
903430144
]
},
"transformer.transformer_blocks.14.ff_context.net.2.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
903430144,
904216576
]
},
"transformer.transformer_blocks.14.norm1.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
904216576,
905003008
]
},
"transformer.transformer_blocks.14.norm1.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
18432,
64
],
"data_offsets": [
905003008,
909721600
]
},
"transformer.transformer_blocks.14.norm1_context.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
909721600,
910508032
]
},
"transformer.transformer_blocks.14.norm1_context.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
18432,
64
],
"data_offsets": [
910508032,
915226624
]
},
"transformer.transformer_blocks.15.attn.add_k_proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
915226624,
916013056
]
},
"transformer.transformer_blocks.15.attn.add_k_proj.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
916013056,
916799488
]
},
"transformer.transformer_blocks.15.attn.add_q_proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
916799488,
917585920
]
},
"transformer.transformer_blocks.15.attn.add_q_proj.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
917585920,
918372352
]
},
"transformer.transformer_blocks.15.attn.add_v_proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
918372352,
919158784
]
},
"transformer.transformer_blocks.15.attn.add_v_proj.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
919158784,
919945216
]
},
"transformer.transformer_blocks.15.attn.to_add_out.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
919945216,
920731648
]
},
"transformer.transformer_blocks.15.attn.to_add_out.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
920731648,
921518080
]
},
"transformer.transformer_blocks.15.attn.to_k.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
921518080,
922304512
]
},
"transformer.transformer_blocks.15.attn.to_k.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
922304512,
923090944
]
},
"transformer.transformer_blocks.15.attn.to_out.0.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
923090944,
923877376
]
},
"transformer.transformer_blocks.15.attn.to_out.0.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
923877376,
924663808
]
},
"transformer.transformer_blocks.15.attn.to_q.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
924663808,
925450240
]
},
"transformer.transformer_blocks.15.attn.to_q.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
925450240,
926236672
]
},
"transformer.transformer_blocks.15.attn.to_v.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
926236672,
927023104
]
},
"transformer.transformer_blocks.15.attn.to_v.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
927023104,
927809536
]
},
"transformer.transformer_blocks.15.ff.net.0.proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
927809536,
928595968
]
},
"transformer.transformer_blocks.15.ff.net.0.proj.lora_B.weight": {
"dtype": "F32",
"shape": [
12288,
64
],
"data_offsets": [
928595968,
931741696
]
},
"transformer.transformer_blocks.15.ff.net.2.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
12288
],
"data_offsets": [
931741696,
934887424
]
},
"transformer.transformer_blocks.15.ff.net.2.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
934887424,
935673856
]
},
"transformer.transformer_blocks.15.ff_context.net.0.proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
935673856,
936460288
]
},
"transformer.transformer_blocks.15.ff_context.net.0.proj.lora_B.weight": {
"dtype": "F32",
"shape": [
12288,
64
],
"data_offsets": [
936460288,
939606016
]
},
"transformer.transformer_blocks.15.ff_context.net.2.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
12288
],
"data_offsets": [
939606016,
942751744
]
},
"transformer.transformer_blocks.15.ff_context.net.2.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
942751744,
943538176
]
},
"transformer.transformer_blocks.15.norm1.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
943538176,
944324608
]
},
"transformer.transformer_blocks.15.norm1.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
18432,
64
],
"data_offsets": [
944324608,
949043200
]
},
"transformer.transformer_blocks.15.norm1_context.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
949043200,
949829632
]
},
"transformer.transformer_blocks.15.norm1_context.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
18432,
64
],
"data_offsets": [
949829632,
954548224
]
},
"transformer.transformer_blocks.16.attn.add_k_proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
954548224,
955334656
]
},
"transformer.transformer_blocks.16.attn.add_k_proj.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
955334656,
956121088
]
},
"transformer.transformer_blocks.16.attn.add_q_proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
956121088,
956907520
]
},
"transformer.transformer_blocks.16.attn.add_q_proj.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
956907520,
957693952
]
},
"transformer.transformer_blocks.16.attn.add_v_proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
957693952,
958480384
]
},
"transformer.transformer_blocks.16.attn.add_v_proj.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
958480384,
959266816
]
},
"transformer.transformer_blocks.16.attn.to_add_out.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
959266816,
960053248
]
},
"transformer.transformer_blocks.16.attn.to_add_out.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
960053248,
960839680
]
},
"transformer.transformer_blocks.16.attn.to_k.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
960839680,
961626112
]
},
"transformer.transformer_blocks.16.attn.to_k.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
961626112,
962412544
]
},
"transformer.transformer_blocks.16.attn.to_out.0.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
962412544,
963198976
]
},
"transformer.transformer_blocks.16.attn.to_out.0.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
963198976,
963985408
]
},
"transformer.transformer_blocks.16.attn.to_q.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
963985408,
964771840
]
},
"transformer.transformer_blocks.16.attn.to_q.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
964771840,
965558272
]
},
"transformer.transformer_blocks.16.attn.to_v.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
965558272,
966344704
]
},
"transformer.transformer_blocks.16.attn.to_v.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
966344704,
967131136
]
},
"transformer.transformer_blocks.16.ff.net.0.proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
967131136,
967917568
]
},
"transformer.transformer_blocks.16.ff.net.0.proj.lora_B.weight": {
"dtype": "F32",
"shape": [
12288,
64
],
"data_offsets": [
967917568,
971063296
]
},
"transformer.transformer_blocks.16.ff.net.2.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
12288
],
"data_offsets": [
971063296,
974209024
]
},
"transformer.transformer_blocks.16.ff.net.2.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
974209024,
974995456
]
},
"transformer.transformer_blocks.16.ff_context.net.0.proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
974995456,
975781888
]
},
"transformer.transformer_blocks.16.ff_context.net.0.proj.lora_B.weight": {
"dtype": "F32",
"shape": [
12288,
64
],
"data_offsets": [
975781888,
978927616
]
},
"transformer.transformer_blocks.16.ff_context.net.2.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
12288
],
"data_offsets": [
978927616,
982073344
]
},
"transformer.transformer_blocks.16.ff_context.net.2.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
982073344,
982859776
]
},
"transformer.transformer_blocks.16.norm1.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
982859776,
983646208
]
},
"transformer.transformer_blocks.16.norm1.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
18432,
64
],
"data_offsets": [
983646208,
988364800
]
},
"transformer.transformer_blocks.16.norm1_context.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
988364800,
989151232
]
},
"transformer.transformer_blocks.16.norm1_context.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
18432,
64
],
"data_offsets": [
989151232,
993869824
]
},
"transformer.transformer_blocks.17.attn.add_k_proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
993869824,
994656256
]
},
"transformer.transformer_blocks.17.attn.add_k_proj.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
994656256,
995442688
]
},
"transformer.transformer_blocks.17.attn.add_q_proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
995442688,
996229120
]
},
"transformer.transformer_blocks.17.attn.add_q_proj.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
996229120,
997015552
]
},
"transformer.transformer_blocks.17.attn.add_v_proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
997015552,
997801984
]
},
"transformer.transformer_blocks.17.attn.add_v_proj.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
997801984,
998588416
]
},
"transformer.transformer_blocks.17.attn.to_add_out.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
998588416,
999374848
]
},
"transformer.transformer_blocks.17.attn.to_add_out.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
999374848,
1000161280
]
},
"transformer.transformer_blocks.17.attn.to_k.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1000161280,
1000947712
]
},
"transformer.transformer_blocks.17.attn.to_k.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1000947712,
1001734144
]
},
"transformer.transformer_blocks.17.attn.to_out.0.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1001734144,
1002520576
]
},
"transformer.transformer_blocks.17.attn.to_out.0.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1002520576,
1003307008
]
},
"transformer.transformer_blocks.17.attn.to_q.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1003307008,
1004093440
]
},
"transformer.transformer_blocks.17.attn.to_q.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1004093440,
1004879872
]
},
"transformer.transformer_blocks.17.attn.to_v.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1004879872,
1005666304
]
},
"transformer.transformer_blocks.17.attn.to_v.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1005666304,
1006452736
]
},
"transformer.transformer_blocks.17.ff.net.0.proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1006452736,
1007239168
]
},
"transformer.transformer_blocks.17.ff.net.0.proj.lora_B.weight": {
"dtype": "F32",
"shape": [
12288,
64
],
"data_offsets": [
1007239168,
1010384896
]
},
"transformer.transformer_blocks.17.ff.net.2.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
12288
],
"data_offsets": [
1010384896,
1013530624
]
},
"transformer.transformer_blocks.17.ff.net.2.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1013530624,
1014317056
]
},
"transformer.transformer_blocks.17.ff_context.net.0.proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1014317056,
1015103488
]
},
"transformer.transformer_blocks.17.ff_context.net.0.proj.lora_B.weight": {
"dtype": "F32",
"shape": [
12288,
64
],
"data_offsets": [
1015103488,
1018249216
]
},
"transformer.transformer_blocks.17.ff_context.net.2.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
12288
],
"data_offsets": [
1018249216,
1021394944
]
},
"transformer.transformer_blocks.17.ff_context.net.2.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1021394944,
1022181376
]
},
"transformer.transformer_blocks.17.norm1.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1022181376,
1022967808
]
},
"transformer.transformer_blocks.17.norm1.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
18432,
64
],
"data_offsets": [
1022967808,
1027686400
]
},
"transformer.transformer_blocks.17.norm1_context.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1027686400,
1028472832
]
},
"transformer.transformer_blocks.17.norm1_context.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
18432,
64
],
"data_offsets": [
1028472832,
1033191424
]
},
"transformer.transformer_blocks.18.attn.add_k_proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1033191424,
1033977856
]
},
"transformer.transformer_blocks.18.attn.add_k_proj.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1033977856,
1034764288
]
},
"transformer.transformer_blocks.18.attn.add_q_proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1034764288,
1035550720
]
},
"transformer.transformer_blocks.18.attn.add_q_proj.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1035550720,
1036337152
]
},
"transformer.transformer_blocks.18.attn.add_v_proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1036337152,
1037123584
]
},
"transformer.transformer_blocks.18.attn.add_v_proj.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1037123584,
1037910016
]
},
"transformer.transformer_blocks.18.attn.to_add_out.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1037910016,
1038696448
]
},
"transformer.transformer_blocks.18.attn.to_add_out.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1038696448,
1039482880
]
},
"transformer.transformer_blocks.18.attn.to_k.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1039482880,
1040269312
]
},
"transformer.transformer_blocks.18.attn.to_k.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1040269312,
1041055744
]
},
"transformer.transformer_blocks.18.attn.to_out.0.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1041055744,
1041842176
]
},
"transformer.transformer_blocks.18.attn.to_out.0.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1041842176,
1042628608
]
},
"transformer.transformer_blocks.18.attn.to_q.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1042628608,
1043415040
]
},
"transformer.transformer_blocks.18.attn.to_q.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1043415040,
1044201472
]
},
"transformer.transformer_blocks.18.attn.to_v.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1044201472,
1044987904
]
},
"transformer.transformer_blocks.18.attn.to_v.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1044987904,
1045774336
]
},
"transformer.transformer_blocks.18.ff.net.0.proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1045774336,
1046560768
]
},
"transformer.transformer_blocks.18.ff.net.0.proj.lora_B.weight": {
"dtype": "F32",
"shape": [
12288,
64
],
"data_offsets": [
1046560768,
1049706496
]
},
"transformer.transformer_blocks.18.ff.net.2.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
12288
],
"data_offsets": [
1049706496,
1052852224
]
},
"transformer.transformer_blocks.18.ff.net.2.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1052852224,
1053638656
]
},
"transformer.transformer_blocks.18.ff_context.net.0.proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1053638656,
1054425088
]
},
"transformer.transformer_blocks.18.ff_context.net.0.proj.lora_B.weight": {
"dtype": "F32",
"shape": [
12288,
64
],
"data_offsets": [
1054425088,
1057570816
]
},
"transformer.transformer_blocks.18.ff_context.net.2.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
12288
],
"data_offsets": [
1057570816,
1060716544
]
},
"transformer.transformer_blocks.18.ff_context.net.2.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1060716544,
1061502976
]
},
"transformer.transformer_blocks.18.norm1.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1061502976,
1062289408
]
},
"transformer.transformer_blocks.18.norm1.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
18432,
64
],
"data_offsets": [
1062289408,
1067008000
]
},
"transformer.transformer_blocks.18.norm1_context.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1067008000,
1067794432
]
},
"transformer.transformer_blocks.18.norm1_context.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
18432,
64
],
"data_offsets": [
1067794432,
1072513024
]
},
"transformer.transformer_blocks.2.attn.add_k_proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1072513024,
1073299456
]
},
"transformer.transformer_blocks.2.attn.add_k_proj.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1073299456,
1074085888
]
},
"transformer.transformer_blocks.2.attn.add_q_proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1074085888,
1074872320
]
},
"transformer.transformer_blocks.2.attn.add_q_proj.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1074872320,
1075658752
]
},
"transformer.transformer_blocks.2.attn.add_v_proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1075658752,
1076445184
]
},
"transformer.transformer_blocks.2.attn.add_v_proj.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1076445184,
1077231616
]
},
"transformer.transformer_blocks.2.attn.to_add_out.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1077231616,
1078018048
]
},
"transformer.transformer_blocks.2.attn.to_add_out.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1078018048,
1078804480
]
},
"transformer.transformer_blocks.2.attn.to_k.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1078804480,
1079590912
]
},
"transformer.transformer_blocks.2.attn.to_k.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1079590912,
1080377344
]
},
"transformer.transformer_blocks.2.attn.to_out.0.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1080377344,
1081163776
]
},
"transformer.transformer_blocks.2.attn.to_out.0.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1081163776,
1081950208
]
},
"transformer.transformer_blocks.2.attn.to_q.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1081950208,
1082736640
]
},
"transformer.transformer_blocks.2.attn.to_q.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1082736640,
1083523072
]
},
"transformer.transformer_blocks.2.attn.to_v.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1083523072,
1084309504
]
},
"transformer.transformer_blocks.2.attn.to_v.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1084309504,
1085095936
]
},
"transformer.transformer_blocks.2.ff.net.0.proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1085095936,
1085882368
]
},
"transformer.transformer_blocks.2.ff.net.0.proj.lora_B.weight": {
"dtype": "F32",
"shape": [
12288,
64
],
"data_offsets": [
1085882368,
1089028096
]
},
"transformer.transformer_blocks.2.ff.net.2.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
12288
],
"data_offsets": [
1089028096,
1092173824
]
},
"transformer.transformer_blocks.2.ff.net.2.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1092173824,
1092960256
]
},
"transformer.transformer_blocks.2.ff_context.net.0.proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1092960256,
1093746688
]
},
"transformer.transformer_blocks.2.ff_context.net.0.proj.lora_B.weight": {
"dtype": "F32",
"shape": [
12288,
64
],
"data_offsets": [
1093746688,
1096892416
]
},
"transformer.transformer_blocks.2.ff_context.net.2.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
12288
],
"data_offsets": [
1096892416,
1100038144
]
},
"transformer.transformer_blocks.2.ff_context.net.2.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1100038144,
1100824576
]
},
"transformer.transformer_blocks.2.norm1.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1100824576,
1101611008
]
},
"transformer.transformer_blocks.2.norm1.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
18432,
64
],
"data_offsets": [
1101611008,
1106329600
]
},
"transformer.transformer_blocks.2.norm1_context.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1106329600,
1107116032
]
},
"transformer.transformer_blocks.2.norm1_context.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
18432,
64
],
"data_offsets": [
1107116032,
1111834624
]
},
"transformer.transformer_blocks.3.attn.add_k_proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1111834624,
1112621056
]
},
"transformer.transformer_blocks.3.attn.add_k_proj.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1112621056,
1113407488
]
},
"transformer.transformer_blocks.3.attn.add_q_proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1113407488,
1114193920
]
},
"transformer.transformer_blocks.3.attn.add_q_proj.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1114193920,
1114980352
]
},
"transformer.transformer_blocks.3.attn.add_v_proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1114980352,
1115766784
]
},
"transformer.transformer_blocks.3.attn.add_v_proj.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1115766784,
1116553216
]
},
"transformer.transformer_blocks.3.attn.to_add_out.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1116553216,
1117339648
]
},
"transformer.transformer_blocks.3.attn.to_add_out.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1117339648,
1118126080
]
},
"transformer.transformer_blocks.3.attn.to_k.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1118126080,
1118912512
]
},
"transformer.transformer_blocks.3.attn.to_k.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1118912512,
1119698944
]
},
"transformer.transformer_blocks.3.attn.to_out.0.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1119698944,
1120485376
]
},
"transformer.transformer_blocks.3.attn.to_out.0.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1120485376,
1121271808
]
},
"transformer.transformer_blocks.3.attn.to_q.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1121271808,
1122058240
]
},
"transformer.transformer_blocks.3.attn.to_q.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1122058240,
1122844672
]
},
"transformer.transformer_blocks.3.attn.to_v.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1122844672,
1123631104
]
},
"transformer.transformer_blocks.3.attn.to_v.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1123631104,
1124417536
]
},
"transformer.transformer_blocks.3.ff.net.0.proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1124417536,
1125203968
]
},
"transformer.transformer_blocks.3.ff.net.0.proj.lora_B.weight": {
"dtype": "F32",
"shape": [
12288,
64
],
"data_offsets": [
1125203968,
1128349696
]
},
"transformer.transformer_blocks.3.ff.net.2.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
12288
],
"data_offsets": [
1128349696,
1131495424
]
},
"transformer.transformer_blocks.3.ff.net.2.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1131495424,
1132281856
]
},
"transformer.transformer_blocks.3.ff_context.net.0.proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1132281856,
1133068288
]
},
"transformer.transformer_blocks.3.ff_context.net.0.proj.lora_B.weight": {
"dtype": "F32",
"shape": [
12288,
64
],
"data_offsets": [
1133068288,
1136214016
]
},
"transformer.transformer_blocks.3.ff_context.net.2.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
12288
],
"data_offsets": [
1136214016,
1139359744
]
},
"transformer.transformer_blocks.3.ff_context.net.2.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1139359744,
1140146176
]
},
"transformer.transformer_blocks.3.norm1.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1140146176,
1140932608
]
},
"transformer.transformer_blocks.3.norm1.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
18432,
64
],
"data_offsets": [
1140932608,
1145651200
]
},
"transformer.transformer_blocks.3.norm1_context.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1145651200,
1146437632
]
},
"transformer.transformer_blocks.3.norm1_context.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
18432,
64
],
"data_offsets": [
1146437632,
1151156224
]
},
"transformer.transformer_blocks.4.attn.add_k_proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1151156224,
1151942656
]
},
"transformer.transformer_blocks.4.attn.add_k_proj.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1151942656,
1152729088
]
},
"transformer.transformer_blocks.4.attn.add_q_proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1152729088,
1153515520
]
},
"transformer.transformer_blocks.4.attn.add_q_proj.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1153515520,
1154301952
]
},
"transformer.transformer_blocks.4.attn.add_v_proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1154301952,
1155088384
]
},
"transformer.transformer_blocks.4.attn.add_v_proj.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1155088384,
1155874816
]
},
"transformer.transformer_blocks.4.attn.to_add_out.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1155874816,
1156661248
]
},
"transformer.transformer_blocks.4.attn.to_add_out.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1156661248,
1157447680
]
},
"transformer.transformer_blocks.4.attn.to_k.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1157447680,
1158234112
]
},
"transformer.transformer_blocks.4.attn.to_k.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1158234112,
1159020544
]
},
"transformer.transformer_blocks.4.attn.to_out.0.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1159020544,
1159806976
]
},
"transformer.transformer_blocks.4.attn.to_out.0.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1159806976,
1160593408
]
},
"transformer.transformer_blocks.4.attn.to_q.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1160593408,
1161379840
]
},
"transformer.transformer_blocks.4.attn.to_q.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1161379840,
1162166272
]
},
"transformer.transformer_blocks.4.attn.to_v.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1162166272,
1162952704
]
},
"transformer.transformer_blocks.4.attn.to_v.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1162952704,
1163739136
]
},
"transformer.transformer_blocks.4.ff.net.0.proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1163739136,
1164525568
]
},
"transformer.transformer_blocks.4.ff.net.0.proj.lora_B.weight": {
"dtype": "F32",
"shape": [
12288,
64
],
"data_offsets": [
1164525568,
1167671296
]
},
"transformer.transformer_blocks.4.ff.net.2.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
12288
],
"data_offsets": [
1167671296,
1170817024
]
},
"transformer.transformer_blocks.4.ff.net.2.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1170817024,
1171603456
]
},
"transformer.transformer_blocks.4.ff_context.net.0.proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1171603456,
1172389888
]
},
"transformer.transformer_blocks.4.ff_context.net.0.proj.lora_B.weight": {
"dtype": "F32",
"shape": [
12288,
64
],
"data_offsets": [
1172389888,
1175535616
]
},
"transformer.transformer_blocks.4.ff_context.net.2.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
12288
],
"data_offsets": [
1175535616,
1178681344
]
},
"transformer.transformer_blocks.4.ff_context.net.2.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1178681344,
1179467776
]
},
"transformer.transformer_blocks.4.norm1.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1179467776,
1180254208
]
},
"transformer.transformer_blocks.4.norm1.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
18432,
64
],
"data_offsets": [
1180254208,
1184972800
]
},
"transformer.transformer_blocks.4.norm1_context.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1184972800,
1185759232
]
},
"transformer.transformer_blocks.4.norm1_context.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
18432,
64
],
"data_offsets": [
1185759232,
1190477824
]
},
"transformer.transformer_blocks.5.attn.add_k_proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1190477824,
1191264256
]
},
"transformer.transformer_blocks.5.attn.add_k_proj.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1191264256,
1192050688
]
},
"transformer.transformer_blocks.5.attn.add_q_proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1192050688,
1192837120
]
},
"transformer.transformer_blocks.5.attn.add_q_proj.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1192837120,
1193623552
]
},
"transformer.transformer_blocks.5.attn.add_v_proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1193623552,
1194409984
]
},
"transformer.transformer_blocks.5.attn.add_v_proj.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1194409984,
1195196416
]
},
"transformer.transformer_blocks.5.attn.to_add_out.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1195196416,
1195982848
]
},
"transformer.transformer_blocks.5.attn.to_add_out.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1195982848,
1196769280
]
},
"transformer.transformer_blocks.5.attn.to_k.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1196769280,
1197555712
]
},
"transformer.transformer_blocks.5.attn.to_k.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1197555712,
1198342144
]
},
"transformer.transformer_blocks.5.attn.to_out.0.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1198342144,
1199128576
]
},
"transformer.transformer_blocks.5.attn.to_out.0.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1199128576,
1199915008
]
},
"transformer.transformer_blocks.5.attn.to_q.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1199915008,
1200701440
]
},
"transformer.transformer_blocks.5.attn.to_q.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1200701440,
1201487872
]
},
"transformer.transformer_blocks.5.attn.to_v.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1201487872,
1202274304
]
},
"transformer.transformer_blocks.5.attn.to_v.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1202274304,
1203060736
]
},
"transformer.transformer_blocks.5.ff.net.0.proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1203060736,
1203847168
]
},
"transformer.transformer_blocks.5.ff.net.0.proj.lora_B.weight": {
"dtype": "F32",
"shape": [
12288,
64
],
"data_offsets": [
1203847168,
1206992896
]
},
"transformer.transformer_blocks.5.ff.net.2.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
12288
],
"data_offsets": [
1206992896,
1210138624
]
},
"transformer.transformer_blocks.5.ff.net.2.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1210138624,
1210925056
]
},
"transformer.transformer_blocks.5.ff_context.net.0.proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1210925056,
1211711488
]
},
"transformer.transformer_blocks.5.ff_context.net.0.proj.lora_B.weight": {
"dtype": "F32",
"shape": [
12288,
64
],
"data_offsets": [
1211711488,
1214857216
]
},
"transformer.transformer_blocks.5.ff_context.net.2.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
12288
],
"data_offsets": [
1214857216,
1218002944
]
},
"transformer.transformer_blocks.5.ff_context.net.2.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1218002944,
1218789376
]
},
"transformer.transformer_blocks.5.norm1.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1218789376,
1219575808
]
},
"transformer.transformer_blocks.5.norm1.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
18432,
64
],
"data_offsets": [
1219575808,
1224294400
]
},
"transformer.transformer_blocks.5.norm1_context.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1224294400,
1225080832
]
},
"transformer.transformer_blocks.5.norm1_context.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
18432,
64
],
"data_offsets": [
1225080832,
1229799424
]
},
"transformer.transformer_blocks.6.attn.add_k_proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1229799424,
1230585856
]
},
"transformer.transformer_blocks.6.attn.add_k_proj.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1230585856,
1231372288
]
},
"transformer.transformer_blocks.6.attn.add_q_proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1231372288,
1232158720
]
},
"transformer.transformer_blocks.6.attn.add_q_proj.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1232158720,
1232945152
]
},
"transformer.transformer_blocks.6.attn.add_v_proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1232945152,
1233731584
]
},
"transformer.transformer_blocks.6.attn.add_v_proj.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1233731584,
1234518016
]
},
"transformer.transformer_blocks.6.attn.to_add_out.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1234518016,
1235304448
]
},
"transformer.transformer_blocks.6.attn.to_add_out.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1235304448,
1236090880
]
},
"transformer.transformer_blocks.6.attn.to_k.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1236090880,
1236877312
]
},
"transformer.transformer_blocks.6.attn.to_k.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1236877312,
1237663744
]
},
"transformer.transformer_blocks.6.attn.to_out.0.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1237663744,
1238450176
]
},
"transformer.transformer_blocks.6.attn.to_out.0.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1238450176,
1239236608
]
},
"transformer.transformer_blocks.6.attn.to_q.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1239236608,
1240023040
]
},
"transformer.transformer_blocks.6.attn.to_q.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1240023040,
1240809472
]
},
"transformer.transformer_blocks.6.attn.to_v.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1240809472,
1241595904
]
},
"transformer.transformer_blocks.6.attn.to_v.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1241595904,
1242382336
]
},
"transformer.transformer_blocks.6.ff.net.0.proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1242382336,
1243168768
]
},
"transformer.transformer_blocks.6.ff.net.0.proj.lora_B.weight": {
"dtype": "F32",
"shape": [
12288,
64
],
"data_offsets": [
1243168768,
1246314496
]
},
"transformer.transformer_blocks.6.ff.net.2.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
12288
],
"data_offsets": [
1246314496,
1249460224
]
},
"transformer.transformer_blocks.6.ff.net.2.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1249460224,
1250246656
]
},
"transformer.transformer_blocks.6.ff_context.net.0.proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1250246656,
1251033088
]
},
"transformer.transformer_blocks.6.ff_context.net.0.proj.lora_B.weight": {
"dtype": "F32",
"shape": [
12288,
64
],
"data_offsets": [
1251033088,
1254178816
]
},
"transformer.transformer_blocks.6.ff_context.net.2.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
12288
],
"data_offsets": [
1254178816,
1257324544
]
},
"transformer.transformer_blocks.6.ff_context.net.2.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1257324544,
1258110976
]
},
"transformer.transformer_blocks.6.norm1.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1258110976,
1258897408
]
},
"transformer.transformer_blocks.6.norm1.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
18432,
64
],
"data_offsets": [
1258897408,
1263616000
]
},
"transformer.transformer_blocks.6.norm1_context.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1263616000,
1264402432
]
},
"transformer.transformer_blocks.6.norm1_context.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
18432,
64
],
"data_offsets": [
1264402432,
1269121024
]
},
"transformer.transformer_blocks.7.attn.add_k_proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1269121024,
1269907456
]
},
"transformer.transformer_blocks.7.attn.add_k_proj.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1269907456,
1270693888
]
},
"transformer.transformer_blocks.7.attn.add_q_proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1270693888,
1271480320
]
},
"transformer.transformer_blocks.7.attn.add_q_proj.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1271480320,
1272266752
]
},
"transformer.transformer_blocks.7.attn.add_v_proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1272266752,
1273053184
]
},
"transformer.transformer_blocks.7.attn.add_v_proj.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1273053184,
1273839616
]
},
"transformer.transformer_blocks.7.attn.to_add_out.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1273839616,
1274626048
]
},
"transformer.transformer_blocks.7.attn.to_add_out.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1274626048,
1275412480
]
},
"transformer.transformer_blocks.7.attn.to_k.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1275412480,
1276198912
]
},
"transformer.transformer_blocks.7.attn.to_k.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1276198912,
1276985344
]
},
"transformer.transformer_blocks.7.attn.to_out.0.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1276985344,
1277771776
]
},
"transformer.transformer_blocks.7.attn.to_out.0.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1277771776,
1278558208
]
},
"transformer.transformer_blocks.7.attn.to_q.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1278558208,
1279344640
]
},
"transformer.transformer_blocks.7.attn.to_q.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1279344640,
1280131072
]
},
"transformer.transformer_blocks.7.attn.to_v.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1280131072,
1280917504
]
},
"transformer.transformer_blocks.7.attn.to_v.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1280917504,
1281703936
]
},
"transformer.transformer_blocks.7.ff.net.0.proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1281703936,
1282490368
]
},
"transformer.transformer_blocks.7.ff.net.0.proj.lora_B.weight": {
"dtype": "F32",
"shape": [
12288,
64
],
"data_offsets": [
1282490368,
1285636096
]
},
"transformer.transformer_blocks.7.ff.net.2.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
12288
],
"data_offsets": [
1285636096,
1288781824
]
},
"transformer.transformer_blocks.7.ff.net.2.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1288781824,
1289568256
]
},
"transformer.transformer_blocks.7.ff_context.net.0.proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1289568256,
1290354688
]
},
"transformer.transformer_blocks.7.ff_context.net.0.proj.lora_B.weight": {
"dtype": "F32",
"shape": [
12288,
64
],
"data_offsets": [
1290354688,
1293500416
]
},
"transformer.transformer_blocks.7.ff_context.net.2.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
12288
],
"data_offsets": [
1293500416,
1296646144
]
},
"transformer.transformer_blocks.7.ff_context.net.2.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1296646144,
1297432576
]
},
"transformer.transformer_blocks.7.norm1.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1297432576,
1298219008
]
},
"transformer.transformer_blocks.7.norm1.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
18432,
64
],
"data_offsets": [
1298219008,
1302937600
]
},
"transformer.transformer_blocks.7.norm1_context.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1302937600,
1303724032
]
},
"transformer.transformer_blocks.7.norm1_context.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
18432,
64
],
"data_offsets": [
1303724032,
1308442624
]
},
"transformer.transformer_blocks.8.attn.add_k_proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1308442624,
1309229056
]
},
"transformer.transformer_blocks.8.attn.add_k_proj.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1309229056,
1310015488
]
},
"transformer.transformer_blocks.8.attn.add_q_proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1310015488,
1310801920
]
},
"transformer.transformer_blocks.8.attn.add_q_proj.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1310801920,
1311588352
]
},
"transformer.transformer_blocks.8.attn.add_v_proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1311588352,
1312374784
]
},
"transformer.transformer_blocks.8.attn.add_v_proj.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1312374784,
1313161216
]
},
"transformer.transformer_blocks.8.attn.to_add_out.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1313161216,
1313947648
]
},
"transformer.transformer_blocks.8.attn.to_add_out.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1313947648,
1314734080
]
},
"transformer.transformer_blocks.8.attn.to_k.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1314734080,
1315520512
]
},
"transformer.transformer_blocks.8.attn.to_k.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1315520512,
1316306944
]
},
"transformer.transformer_blocks.8.attn.to_out.0.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1316306944,
1317093376
]
},
"transformer.transformer_blocks.8.attn.to_out.0.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1317093376,
1317879808
]
},
"transformer.transformer_blocks.8.attn.to_q.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1317879808,
1318666240
]
},
"transformer.transformer_blocks.8.attn.to_q.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1318666240,
1319452672
]
},
"transformer.transformer_blocks.8.attn.to_v.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1319452672,
1320239104
]
},
"transformer.transformer_blocks.8.attn.to_v.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1320239104,
1321025536
]
},
"transformer.transformer_blocks.8.ff.net.0.proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1321025536,
1321811968
]
},
"transformer.transformer_blocks.8.ff.net.0.proj.lora_B.weight": {
"dtype": "F32",
"shape": [
12288,
64
],
"data_offsets": [
1321811968,
1324957696
]
},
"transformer.transformer_blocks.8.ff.net.2.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
12288
],
"data_offsets": [
1324957696,
1328103424
]
},
"transformer.transformer_blocks.8.ff.net.2.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1328103424,
1328889856
]
},
"transformer.transformer_blocks.8.ff_context.net.0.proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1328889856,
1329676288
]
},
"transformer.transformer_blocks.8.ff_context.net.0.proj.lora_B.weight": {
"dtype": "F32",
"shape": [
12288,
64
],
"data_offsets": [
1329676288,
1332822016
]
},
"transformer.transformer_blocks.8.ff_context.net.2.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
12288
],
"data_offsets": [
1332822016,
1335967744
]
},
"transformer.transformer_blocks.8.ff_context.net.2.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1335967744,
1336754176
]
},
"transformer.transformer_blocks.8.norm1.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1336754176,
1337540608
]
},
"transformer.transformer_blocks.8.norm1.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
18432,
64
],
"data_offsets": [
1337540608,
1342259200
]
},
"transformer.transformer_blocks.8.norm1_context.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1342259200,
1343045632
]
},
"transformer.transformer_blocks.8.norm1_context.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
18432,
64
],
"data_offsets": [
1343045632,
1347764224
]
},
"transformer.transformer_blocks.9.attn.add_k_proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1347764224,
1348550656
]
},
"transformer.transformer_blocks.9.attn.add_k_proj.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1348550656,
1349337088
]
},
"transformer.transformer_blocks.9.attn.add_q_proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1349337088,
1350123520
]
},
"transformer.transformer_blocks.9.attn.add_q_proj.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1350123520,
1350909952
]
},
"transformer.transformer_blocks.9.attn.add_v_proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1350909952,
1351696384
]
},
"transformer.transformer_blocks.9.attn.add_v_proj.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1351696384,
1352482816
]
},
"transformer.transformer_blocks.9.attn.to_add_out.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1352482816,
1353269248
]
},
"transformer.transformer_blocks.9.attn.to_add_out.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1353269248,
1354055680
]
},
"transformer.transformer_blocks.9.attn.to_k.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1354055680,
1354842112
]
},
"transformer.transformer_blocks.9.attn.to_k.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1354842112,
1355628544
]
},
"transformer.transformer_blocks.9.attn.to_out.0.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1355628544,
1356414976
]
},
"transformer.transformer_blocks.9.attn.to_out.0.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1356414976,
1357201408
]
},
"transformer.transformer_blocks.9.attn.to_q.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1357201408,
1357987840
]
},
"transformer.transformer_blocks.9.attn.to_q.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1357987840,
1358774272
]
},
"transformer.transformer_blocks.9.attn.to_v.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1358774272,
1359560704
]
},
"transformer.transformer_blocks.9.attn.to_v.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1359560704,
1360347136
]
},
"transformer.transformer_blocks.9.ff.net.0.proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1360347136,
1361133568
]
},
"transformer.transformer_blocks.9.ff.net.0.proj.lora_B.weight": {
"dtype": "F32",
"shape": [
12288,
64
],
"data_offsets": [
1361133568,
1364279296
]
},
"transformer.transformer_blocks.9.ff.net.2.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
12288
],
"data_offsets": [
1364279296,
1367425024
]
},
"transformer.transformer_blocks.9.ff.net.2.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1367425024,
1368211456
]
},
"transformer.transformer_blocks.9.ff_context.net.0.proj.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1368211456,
1368997888
]
},
"transformer.transformer_blocks.9.ff_context.net.0.proj.lora_B.weight": {
"dtype": "F32",
"shape": [
12288,
64
],
"data_offsets": [
1368997888,
1372143616
]
},
"transformer.transformer_blocks.9.ff_context.net.2.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
12288
],
"data_offsets": [
1372143616,
1375289344
]
},
"transformer.transformer_blocks.9.ff_context.net.2.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1375289344,
1376075776
]
},
"transformer.transformer_blocks.9.norm1.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1376075776,
1376862208
]
},
"transformer.transformer_blocks.9.norm1.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
18432,
64
],
"data_offsets": [
1376862208,
1381580800
]
},
"transformer.transformer_blocks.9.norm1_context.linear.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
3072
],
"data_offsets": [
1381580800,
1382367232
]
},
"transformer.transformer_blocks.9.norm1_context.linear.lora_B.weight": {
"dtype": "F32",
"shape": [
18432,
64
],
"data_offsets": [
1382367232,
1387085824
]
},
"transformer.x_embedder.lora_A.weight": {
"dtype": "F32",
"shape": [
64,
64
],
"data_offsets": [
1387085824,
1387102208
]
},
"transformer.x_embedder.lora_B.weight": {
"dtype": "F32",
"shape": [
3072,
64
],
"data_offsets": [
1387102208,
1387888640
]
}
}