Commit ·
20179e4
1
Parent(s): b0438b3
Upload part 70
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +48 -0
- checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.query.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.query.kernel/.zarray.__tmp10631717546615226683.~1663960300549813~ +1 -0
- checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.query.kernel/.zarray.__tmp12515279127317660978.~1663960300601621~ +1 -0
- checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.query.kernel/.zarray.__tmp16850672775502047585.~1663960300684004~ +1 -0
- checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.query.kernel/.zarray.__tmp17014265567154969946.~1663960300384122~ +1 -0
- checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.query.kernel/.zarray.__tmp2502557247265826093.~1663960300495103~ +1 -0
- checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.query.kernel/.zarray.__tmp6246011022581936266.~1663960300632092~ +1 -0
- checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.query.kernel/.zarray.__tmp6442646648044591608.~1663960300885545~ +1 -0
- checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.query.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.query.kernel/0.1 +3 -0
- checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.query.kernel/0.2 +3 -0
- checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.query.kernel/0.3 +3 -0
- checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.query.kernel/0.4 +3 -0
- checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.query.kernel/0.5 +3 -0
- checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.query.kernel/0.6 +3 -0
- checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.query.kernel/0.7 +3 -0
- checkpoint_1007000/target.decoder.layers_2.pre_mlp_layer_norm.scale/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_2.pre_mlp_layer_norm.scale/0 +0 -0
- checkpoint_1007000/target.decoder.layers_3.mlp.wo.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_3.mlp.wo.kernel/.zarray.__tmp12164144768396930405.~1663960300347572~ +1 -0
- checkpoint_1007000/target.decoder.layers_3.mlp.wo.kernel/.zarray.__tmp13176161344907895275.~1663960300422591~ +1 -0
- checkpoint_1007000/target.decoder.layers_3.mlp.wo.kernel/.zarray.__tmp15877630234575677669.~1663960300730426~ +1 -0
- checkpoint_1007000/target.decoder.layers_3.mlp.wo.kernel/.zarray.__tmp4667462083429703658.~1663960300602045~ +1 -0
- checkpoint_1007000/target.decoder.layers_3.mlp.wo.kernel/.zarray.__tmp6686909515785747199.~1663960300384135~ +1 -0
- checkpoint_1007000/target.decoder.layers_3.mlp.wo.kernel/.zarray.__tmp7799999499370154336.~1663960300466651~ +1 -0
- checkpoint_1007000/target.decoder.layers_3.mlp.wo.kernel/.zarray.__tmp8199791667970183948.~1663960300272546~ +1 -0
- checkpoint_1007000/target.decoder.layers_3.mlp.wo.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_3.mlp.wo.kernel/1.0 +3 -0
- checkpoint_1007000/target.decoder.layers_3.mlp.wo.kernel/2.0 +3 -0
- checkpoint_1007000/target.decoder.layers_3.mlp.wo.kernel/3.0 +3 -0
- checkpoint_1007000/target.decoder.layers_3.mlp.wo.kernel/4.0 +3 -0
- checkpoint_1007000/target.decoder.layers_3.mlp.wo.kernel/5.0 +3 -0
- checkpoint_1007000/target.decoder.layers_3.mlp.wo.kernel/6.0 +3 -0
- checkpoint_1007000/target.decoder.layers_3.mlp.wo.kernel/7.0 +3 -0
- checkpoint_1007000/target.encoder.layers_1.mlp.wi_1.kernel/.zarray +1 -0
- checkpoint_1007000/target.encoder.layers_1.mlp.wi_1.kernel/.zarray.__tmp10192900048669059227.~1663960300780722~ +1 -0
- checkpoint_1007000/target.encoder.layers_1.mlp.wi_1.kernel/.zarray.__tmp11689713418066339141.~1663960300778641~ +1 -0
- checkpoint_1007000/target.encoder.layers_1.mlp.wi_1.kernel/.zarray.__tmp11794325550773358884.~1663960300550985~ +1 -0
- checkpoint_1007000/target.encoder.layers_1.mlp.wi_1.kernel/.zarray.__tmp15682293152539461437.~1663960300731443~ +1 -0
- checkpoint_1007000/target.encoder.layers_1.mlp.wi_1.kernel/.zarray.__tmp3355123498195616867.~1663960300889044~ +1 -0
- checkpoint_1007000/target.encoder.layers_1.mlp.wi_1.kernel/.zarray.__tmp3779781660571819135.~1663960300686436~ +1 -0
- checkpoint_1007000/target.encoder.layers_1.mlp.wi_1.kernel/.zarray.__tmp9561935997004653383.~1663960300937419~ +1 -0
- checkpoint_1007000/target.encoder.layers_1.mlp.wi_1.kernel/0.0 +3 -0
- checkpoint_1007000/target.encoder.layers_1.mlp.wi_1.kernel/0.1 +3 -0
- checkpoint_1007000/target.encoder.layers_1.mlp.wi_1.kernel/0.2 +3 -0
- checkpoint_1007000/target.encoder.layers_1.mlp.wi_1.kernel/0.3 +3 -0
- checkpoint_1007000/target.encoder.layers_1.mlp.wi_1.kernel/0.4 +3 -0
- checkpoint_1007000/target.encoder.layers_1.mlp.wi_1.kernel/0.5 +3 -0
- checkpoint_1007000/target.encoder.layers_1.mlp.wi_1.kernel/0.6 +3 -0
.gitattributes
CHANGED
|
@@ -3459,3 +3459,51 @@ checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/7.0 filter=lfs diff=lfs
|
|
| 3459 |
checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
|
| 3460 |
checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 3461 |
checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 3459 |
checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
|
| 3460 |
checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 3461 |
checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
|
| 3462 |
+
checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 3463 |
+
checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.query.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 3464 |
+
checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 3465 |
+
checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.query.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 3466 |
+
checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.query.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 3467 |
+
checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.query.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 3468 |
+
checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.query.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 3469 |
+
checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.query.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 3470 |
+
checkpoint_1007000/target.encoder.layers_19.mlp.wi_0.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 3471 |
+
checkpoint_1007000/target.encoder.layers_19.mlp.wi_0.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 3472 |
+
checkpoint_1007000/target.encoder.layers_19.mlp.wi_0.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 3473 |
+
checkpoint_1007000/target.encoder.layers_19.mlp.wi_0.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 3474 |
+
checkpoint_1007000/target.encoder.layers_19.mlp.wi_0.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 3475 |
+
checkpoint_1007000/target.encoder.layers_19.mlp.wi_0.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 3476 |
+
checkpoint_1007000/target.encoder.layers_19.mlp.wi_0.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 3477 |
+
checkpoint_1007000/target.encoder.layers_19.mlp.wi_0.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 3478 |
+
checkpoint_1007000/target.decoder.layers_3.mlp.wo.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
|
| 3479 |
+
checkpoint_1007000/target.decoder.layers_3.mlp.wo.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 3480 |
+
checkpoint_1007000/target.decoder.layers_3.mlp.wo.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 3481 |
+
checkpoint_1007000/target.decoder.layers_3.mlp.wo.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 3482 |
+
checkpoint_1007000/target.decoder.layers_3.mlp.wo.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
|
| 3483 |
+
checkpoint_1007000/target.decoder.layers_3.mlp.wo.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
|
| 3484 |
+
checkpoint_1007000/target.decoder.layers_3.mlp.wo.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 3485 |
+
checkpoint_1007000/target.decoder.layers_3.mlp.wo.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
|
| 3486 |
+
checkpoint_1007000/target.encoder.layers_16.attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 3487 |
+
checkpoint_1007000/target.encoder.layers_16.attention.query.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 3488 |
+
checkpoint_1007000/target.encoder.layers_16.attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 3489 |
+
checkpoint_1007000/target.encoder.layers_16.attention.query.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 3490 |
+
checkpoint_1007000/target.encoder.layers_16.attention.query.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 3491 |
+
checkpoint_1007000/target.encoder.layers_16.attention.query.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 3492 |
+
checkpoint_1007000/target.encoder.layers_16.attention.query.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 3493 |
+
checkpoint_1007000/target.encoder.layers_16.attention.query.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 3494 |
+
checkpoint_1007000/target.encoder.layers_1.mlp.wi_1.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 3495 |
+
checkpoint_1007000/target.encoder.layers_1.mlp.wi_1.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 3496 |
+
checkpoint_1007000/target.encoder.layers_1.mlp.wi_1.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 3497 |
+
checkpoint_1007000/target.encoder.layers_1.mlp.wi_1.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 3498 |
+
checkpoint_1007000/target.encoder.layers_1.mlp.wi_1.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 3499 |
+
checkpoint_1007000/target.encoder.layers_1.mlp.wi_1.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 3500 |
+
checkpoint_1007000/target.encoder.layers_1.mlp.wi_1.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 3501 |
+
checkpoint_1007000/target.encoder.layers_1.mlp.wi_1.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 3502 |
+
checkpoint_1007000/target.encoder.layers_13.attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 3503 |
+
checkpoint_1007000/target.encoder.layers_13.attention.key.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 3504 |
+
checkpoint_1007000/target.encoder.layers_13.attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 3505 |
+
checkpoint_1007000/target.encoder.layers_13.attention.key.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 3506 |
+
checkpoint_1007000/target.encoder.layers_13.attention.key.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 3507 |
+
checkpoint_1007000/target.encoder.layers_13.attention.key.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 3508 |
+
checkpoint_1007000/target.encoder.layers_13.attention.key.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 3509 |
+
checkpoint_1007000/target.encoder.layers_13.attention.key.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.query.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.query.kernel/.zarray.__tmp10631717546615226683.~1663960300549813~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.query.kernel/.zarray.__tmp12515279127317660978.~1663960300601621~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.query.kernel/.zarray.__tmp16850672775502047585.~1663960300684004~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.query.kernel/.zarray.__tmp17014265567154969946.~1663960300384122~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.query.kernel/.zarray.__tmp2502557247265826093.~1663960300495103~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.query.kernel/.zarray.__tmp6246011022581936266.~1663960300632092~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.query.kernel/.zarray.__tmp6442646648044591608.~1663960300885545~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.query.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:02eac88fd41f715f75cc7f5bf8cf7fa91122c92e6ca64bb90e9284d20f4dc20c
|
| 3 |
+
size 7825778
|
checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.query.kernel/0.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1ba155defbfe639d50b38219fc0fb5c47df0c31e8d68f81b202c1f32e5c4302d
|
| 3 |
+
size 7824442
|
checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.query.kernel/0.2
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:505330f5958d2beea2f6927146c34c4aaefc64244ccc3e83c15c343385741764
|
| 3 |
+
size 7828670
|
checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.query.kernel/0.3
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:575aeed64eeea95cc15c9d274892ec5aa78419c01ca7048ea16d9c357a019b80
|
| 3 |
+
size 7825827
|
checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.query.kernel/0.4
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4195dc997ceaac22f42963ad30ac87ecfe8be32339f9924dc65c68fcf2ecf635
|
| 3 |
+
size 7827870
|
checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.query.kernel/0.5
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:31ddcc8c3a8318a4369d223e42f14ec0a88138f983bf9c1669dc959a7493fef9
|
| 3 |
+
size 7825706
|
checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.query.kernel/0.6
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:475cd415ec5529b711f53edfb1cb53373d66627f0ab09927d2ad4818406b06d8
|
| 3 |
+
size 7827425
|
checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.query.kernel/0.7
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:338268f9d68993fb1f8d8e41afa02e2d8b1bd1847e496c873c0843601fdfdb24
|
| 3 |
+
size 7830057
|
checkpoint_1007000/target.decoder.layers_2.pre_mlp_layer_norm.scale/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_2.pre_mlp_layer_norm.scale/0
ADDED
|
Binary file (14.9 kB). View file
|
|
|
checkpoint_1007000/target.decoder.layers_3.mlp.wo.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_3.mlp.wo.kernel/.zarray.__tmp12164144768396930405.~1663960300347572~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_3.mlp.wo.kernel/.zarray.__tmp13176161344907895275.~1663960300422591~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_3.mlp.wo.kernel/.zarray.__tmp15877630234575677669.~1663960300730426~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_3.mlp.wo.kernel/.zarray.__tmp4667462083429703658.~1663960300602045~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_3.mlp.wo.kernel/.zarray.__tmp6686909515785747199.~1663960300384135~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_3.mlp.wo.kernel/.zarray.__tmp7799999499370154336.~1663960300466651~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_3.mlp.wo.kernel/.zarray.__tmp8199791667970183948.~1663960300272546~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_3.mlp.wo.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9a029ecbbf2e5b089a10730885dc740ad8e25fbef36383af163b0b06803a4918
|
| 3 |
+
size 19540386
|
checkpoint_1007000/target.decoder.layers_3.mlp.wo.kernel/1.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cb059d9b50ffd1d34a91bd07d4dcc08d349e3cd73270e1fa6f7d1b05da9ef332
|
| 3 |
+
size 19539978
|
checkpoint_1007000/target.decoder.layers_3.mlp.wo.kernel/2.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:36cc3fd62d98d44f96d6b22c60a0585849f3155a7278dadf2f95eaadbf217462
|
| 3 |
+
size 19538103
|
checkpoint_1007000/target.decoder.layers_3.mlp.wo.kernel/3.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7e396d81139336196e7d6722b2a559b2cf8e4960cfa9b674e7301e90d4546d43
|
| 3 |
+
size 19540244
|
checkpoint_1007000/target.decoder.layers_3.mlp.wo.kernel/4.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:716a7ff3879f45fa31f05f0b273ab967a4cc868b2fcf228ec2861efa398931b7
|
| 3 |
+
size 19538784
|
checkpoint_1007000/target.decoder.layers_3.mlp.wo.kernel/5.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:633887566ccebba7fafb99c10e14409b4933d9a4535c638692b801cf2460d09b
|
| 3 |
+
size 19539441
|
checkpoint_1007000/target.decoder.layers_3.mlp.wo.kernel/6.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:af89ddf7e62bfb2fd8e74f54ff0643c4e7f9bd60d3518820033e23deb13b5984
|
| 3 |
+
size 19539596
|
checkpoint_1007000/target.decoder.layers_3.mlp.wo.kernel/7.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:520879e9640730f54fabb09bcaaa7b8f1030475b36773d887040f353e9950d9c
|
| 3 |
+
size 19539308
|
checkpoint_1007000/target.encoder.layers_1.mlp.wi_1.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.encoder.layers_1.mlp.wi_1.kernel/.zarray.__tmp10192900048669059227.~1663960300780722~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.encoder.layers_1.mlp.wi_1.kernel/.zarray.__tmp11689713418066339141.~1663960300778641~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.encoder.layers_1.mlp.wi_1.kernel/.zarray.__tmp11794325550773358884.~1663960300550985~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.encoder.layers_1.mlp.wi_1.kernel/.zarray.__tmp15682293152539461437.~1663960300731443~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.encoder.layers_1.mlp.wi_1.kernel/.zarray.__tmp3355123498195616867.~1663960300889044~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.encoder.layers_1.mlp.wi_1.kernel/.zarray.__tmp3779781660571819135.~1663960300686436~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.encoder.layers_1.mlp.wi_1.kernel/.zarray.__tmp9561935997004653383.~1663960300937419~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.encoder.layers_1.mlp.wi_1.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b6b85203f676198069bb4cfaf2dbcfd0e776a99f5cd701d97671449b63e93622
|
| 3 |
+
size 19524454
|
checkpoint_1007000/target.encoder.layers_1.mlp.wi_1.kernel/0.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fa1925035983435920356d39f679685490ced3f7534fb9af380f7a07afe01a38
|
| 3 |
+
size 19524476
|
checkpoint_1007000/target.encoder.layers_1.mlp.wi_1.kernel/0.2
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a4f5f870f4a8fb52b7a1da875c8e9687dd89f71a59efd6f1d1e413add6075ff6
|
| 3 |
+
size 19523926
|
checkpoint_1007000/target.encoder.layers_1.mlp.wi_1.kernel/0.3
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9d6f7494a5f93420a0f66eaacd00f1ab2d500f2c2148b8cb2720a75622e9afc3
|
| 3 |
+
size 19523546
|
checkpoint_1007000/target.encoder.layers_1.mlp.wi_1.kernel/0.4
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:622bb1360222facd68da867b70c11eca0a834facab7bbb7e22bfa2916e7fa30f
|
| 3 |
+
size 19523442
|
checkpoint_1007000/target.encoder.layers_1.mlp.wi_1.kernel/0.5
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9da1b91f9cbf045074eeac703f236dee10f3b65d4a602d88f63e130e8d5f5212
|
| 3 |
+
size 19524288
|
checkpoint_1007000/target.encoder.layers_1.mlp.wi_1.kernel/0.6
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bbcf46a349199570b71f8c6bd1b6f691789bae4e2a33a323a5456241a9df848f
|
| 3 |
+
size 19523618
|