Commit
·
fd95ea8
1
Parent(s):
563417d
Upload part 10
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +48 -0
- checkpoint_1007000/state.param_states.decoder.layers_17.pre_self_attention_layer_norm.scale.v/.zarray +1 -0
- checkpoint_1007000/state.param_states.decoder.layers_17.pre_self_attention_layer_norm.scale.v/0 +0 -0
- checkpoint_1007000/state.param_states.decoder.layers_22.pre_cross_attention_layer_norm.scale.v/.zarray +1 -0
- checkpoint_1007000/state.param_states.decoder.layers_22.pre_cross_attention_layer_norm.scale.v/0 +0 -0
- checkpoint_1007000/target.decoder.layers_16.mlp.wi_0.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_16.mlp.wi_0.kernel/.zarray.__tmp11061882100262455779.~1663960300468303~ +1 -0
- checkpoint_1007000/target.decoder.layers_16.mlp.wi_0.kernel/.zarray.__tmp12404652297103653635.~1663960300421972~ +1 -0
- checkpoint_1007000/target.decoder.layers_16.mlp.wi_0.kernel/.zarray.__tmp15957828040304424061.~1663960300549667~ +1 -0
- checkpoint_1007000/target.decoder.layers_16.mlp.wi_0.kernel/.zarray.__tmp16708457794751892080.~1663960300823355~ +1 -0
- checkpoint_1007000/target.decoder.layers_16.mlp.wi_0.kernel/.zarray.__tmp17484084605368576430.~1663960300466014~ +1 -0
- checkpoint_1007000/target.decoder.layers_16.mlp.wi_0.kernel/.zarray.__tmp4338021769387984029.~1663960300779434~ +1 -0
- checkpoint_1007000/target.decoder.layers_16.mlp.wi_0.kernel/.zarray.__tmp9230001793889186174.~1663960300466137~ +1 -0
- checkpoint_1007000/target.decoder.layers_16.mlp.wi_0.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_16.mlp.wi_0.kernel/0.1 +3 -0
- checkpoint_1007000/target.decoder.layers_16.mlp.wi_0.kernel/0.2 +3 -0
- checkpoint_1007000/target.decoder.layers_16.mlp.wi_0.kernel/0.3 +3 -0
- checkpoint_1007000/target.decoder.layers_16.mlp.wi_0.kernel/0.4 +3 -0
- checkpoint_1007000/target.decoder.layers_16.mlp.wi_0.kernel/0.5 +3 -0
- checkpoint_1007000/target.decoder.layers_16.mlp.wi_0.kernel/0.6 +3 -0
- checkpoint_1007000/target.decoder.layers_16.mlp.wi_0.kernel/0.7 +3 -0
- checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.query.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.query.kernel/.zarray.__tmp15573674163105097682.~1663960300422343~ +1 -0
- checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.query.kernel/.zarray.__tmp6071354722398589434.~1663960300551684~ +1 -0
- checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.query.kernel/.zarray.__tmp613296392217406530.~1663960300348204~ +1 -0
- checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.query.kernel/.zarray.__tmp6341381603883440718.~1663960300607703~ +1 -0
- checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.query.kernel/.zarray.__tmp6759559597614935639.~1663960300777500~ +1 -0
- checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.query.kernel/.zarray.__tmp8699293708755251527.~1663960300176511~ +1 -0
- checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.query.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.query.kernel/0.1 +3 -0
- checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.query.kernel/0.2 +3 -0
- checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.query.kernel/0.3 +3 -0
- checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.query.kernel/0.4 +3 -0
- checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.query.kernel/0.5 +3 -0
- checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.query.kernel/0.6 +3 -0
- checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.query.kernel/0.7 +3 -0
- checkpoint_1007000/target.decoder.layers_6.self_attention.value.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_6.self_attention.value.kernel/.zarray.__tmp10093915599364340592.~1663960300724598~ +1 -0
- checkpoint_1007000/target.decoder.layers_6.self_attention.value.kernel/.zarray.__tmp1154904127954928177.~1663960300890722~ +1 -0
- checkpoint_1007000/target.decoder.layers_6.self_attention.value.kernel/.zarray.__tmp13521656113468784784.~1663960300602639~ +1 -0
- checkpoint_1007000/target.decoder.layers_6.self_attention.value.kernel/.zarray.__tmp15222130608404230048.~1663960300385982~ +1 -0
- checkpoint_1007000/target.decoder.layers_6.self_attention.value.kernel/.zarray.__tmp4913473462980707586.~1663960300547148~ +1 -0
- checkpoint_1007000/target.decoder.layers_6.self_attention.value.kernel/.zarray.__tmp571652921966429101.~1663960300623679~ +1 -0
- checkpoint_1007000/target.decoder.layers_6.self_attention.value.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_6.self_attention.value.kernel/0.1 +3 -0
- checkpoint_1007000/target.decoder.layers_6.self_attention.value.kernel/0.2 +3 -0
- checkpoint_1007000/target.decoder.layers_6.self_attention.value.kernel/0.3 +3 -0
- checkpoint_1007000/target.decoder.layers_6.self_attention.value.kernel/0.4 +3 -0
- checkpoint_1007000/target.decoder.layers_6.self_attention.value.kernel/0.5 +3 -0
- checkpoint_1007000/target.decoder.layers_6.self_attention.value.kernel/0.6 +3 -0
.gitattributes
CHANGED
|
@@ -503,3 +503,51 @@ checkpoint_1007000/target.encoder.layers_23.mlp.wi_1.kernel/0.1 filter=lfs diff=
|
|
| 503 |
checkpoint_1007000/target.encoder.layers_23.mlp.wi_1.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 504 |
checkpoint_1007000/target.encoder.layers_23.mlp.wi_1.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 505 |
checkpoint_1007000/target.encoder.layers_23.mlp.wi_1.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 503 |
checkpoint_1007000/target.encoder.layers_23.mlp.wi_1.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 504 |
checkpoint_1007000/target.encoder.layers_23.mlp.wi_1.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 505 |
checkpoint_1007000/target.encoder.layers_23.mlp.wi_1.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 506 |
+
checkpoint_1007000/target.encoder.layers_23.mlp.wi_1.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 507 |
+
checkpoint_1007000/target.encoder.layers_23.mlp.wi_1.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 508 |
+
checkpoint_1007000/target.encoder.layers_23.mlp.wi_1.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 509 |
+
checkpoint_1007000/target.encoder.layers_23.mlp.wi_1.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 510 |
+
checkpoint_1007000/target.decoder.layers_16.mlp.wi_0.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 511 |
+
checkpoint_1007000/target.decoder.layers_16.mlp.wi_0.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 512 |
+
checkpoint_1007000/target.decoder.layers_16.mlp.wi_0.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 513 |
+
checkpoint_1007000/target.decoder.layers_16.mlp.wi_0.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 514 |
+
checkpoint_1007000/target.decoder.layers_16.mlp.wi_0.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 515 |
+
checkpoint_1007000/target.decoder.layers_16.mlp.wi_0.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 516 |
+
checkpoint_1007000/target.decoder.layers_16.mlp.wi_0.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 517 |
+
checkpoint_1007000/target.decoder.layers_16.mlp.wi_0.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 518 |
+
checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 519 |
+
checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.query.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 520 |
+
checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 521 |
+
checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.query.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 522 |
+
checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.query.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 523 |
+
checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.query.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 524 |
+
checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.query.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 525 |
+
checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.query.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 526 |
+
checkpoint_1007000/target.encoder.layers_10.mlp.wo.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
|
| 527 |
+
checkpoint_1007000/target.encoder.layers_10.mlp.wo.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 528 |
+
checkpoint_1007000/target.encoder.layers_10.mlp.wo.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 529 |
+
checkpoint_1007000/target.encoder.layers_10.mlp.wo.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 530 |
+
checkpoint_1007000/target.encoder.layers_10.mlp.wo.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
|
| 531 |
+
checkpoint_1007000/target.encoder.layers_10.mlp.wo.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
|
| 532 |
+
checkpoint_1007000/target.encoder.layers_10.mlp.wo.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 533 |
+
checkpoint_1007000/target.encoder.layers_10.mlp.wo.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
|
| 534 |
+
checkpoint_1007000/target.decoder.layers_9.self_attention.value.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 535 |
+
checkpoint_1007000/target.decoder.layers_9.self_attention.value.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 536 |
+
checkpoint_1007000/target.decoder.layers_9.self_attention.value.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 537 |
+
checkpoint_1007000/target.decoder.layers_9.self_attention.value.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 538 |
+
checkpoint_1007000/target.decoder.layers_9.self_attention.value.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 539 |
+
checkpoint_1007000/target.decoder.layers_9.self_attention.value.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 540 |
+
checkpoint_1007000/target.decoder.layers_9.self_attention.value.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 541 |
+
checkpoint_1007000/target.decoder.layers_9.self_attention.value.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 542 |
+
checkpoint_1007000/target.decoder.layers_6.self_attention.value.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 543 |
+
checkpoint_1007000/target.decoder.layers_6.self_attention.value.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 544 |
+
checkpoint_1007000/target.decoder.layers_6.self_attention.value.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 545 |
+
checkpoint_1007000/target.decoder.layers_6.self_attention.value.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 546 |
+
checkpoint_1007000/target.decoder.layers_6.self_attention.value.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 547 |
+
checkpoint_1007000/target.decoder.layers_6.self_attention.value.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 548 |
+
checkpoint_1007000/target.decoder.layers_6.self_attention.value.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 549 |
+
checkpoint_1007000/target.decoder.layers_6.self_attention.value.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 550 |
+
checkpoint_1007000/target.encoder.layers_9.mlp.wi_1.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 551 |
+
checkpoint_1007000/target.encoder.layers_9.mlp.wi_1.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 552 |
+
checkpoint_1007000/target.encoder.layers_9.mlp.wi_1.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 553 |
+
checkpoint_1007000/target.encoder.layers_9.mlp.wi_1.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
checkpoint_1007000/state.param_states.decoder.layers_17.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/state.param_states.decoder.layers_17.pre_self_attention_layer_norm.scale.v/0
ADDED
|
Binary file (14.9 kB). View file
|
|
|
checkpoint_1007000/state.param_states.decoder.layers_22.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/state.param_states.decoder.layers_22.pre_cross_attention_layer_norm.scale.v/0
ADDED
|
Binary file (14.1 kB). View file
|
|
|
checkpoint_1007000/target.decoder.layers_16.mlp.wi_0.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_16.mlp.wi_0.kernel/.zarray.__tmp11061882100262455779.~1663960300468303~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_16.mlp.wi_0.kernel/.zarray.__tmp12404652297103653635.~1663960300421972~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_16.mlp.wi_0.kernel/.zarray.__tmp15957828040304424061.~1663960300549667~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_16.mlp.wi_0.kernel/.zarray.__tmp16708457794751892080.~1663960300823355~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_16.mlp.wi_0.kernel/.zarray.__tmp17484084605368576430.~1663960300466014~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_16.mlp.wi_0.kernel/.zarray.__tmp4338021769387984029.~1663960300779434~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_16.mlp.wi_0.kernel/.zarray.__tmp9230001793889186174.~1663960300466137~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_16.mlp.wi_0.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e23f466007f2883073d73b5a234c9ce17b1e01db636c8419367588be65f6e9ae
|
| 3 |
+
size 19532428
|
checkpoint_1007000/target.decoder.layers_16.mlp.wi_0.kernel/0.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:67653c0516732657615ec9e1de49eab96d76be7e85d3fe72ec42cb65da0429b7
|
| 3 |
+
size 19532895
|
checkpoint_1007000/target.decoder.layers_16.mlp.wi_0.kernel/0.2
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5f899fabf1b5929953bb14b4b74be66ba6c02fc9db8e4f9be5096866f3a4bc8c
|
| 3 |
+
size 19532877
|
checkpoint_1007000/target.decoder.layers_16.mlp.wi_0.kernel/0.3
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:23da18946aa1a364bd873d506a5ff093d0189bbf0400190324634f452cbbde3f
|
| 3 |
+
size 19533345
|
checkpoint_1007000/target.decoder.layers_16.mlp.wi_0.kernel/0.4
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b74b6e873ca154c6aae3a33df1f995d31cec9746be4a3014c2b8df41c51ed977
|
| 3 |
+
size 19532246
|
checkpoint_1007000/target.decoder.layers_16.mlp.wi_0.kernel/0.5
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d1c99427cb370b04272161db155e78c2a8ec26512671bdd1d6d645c5aaf6f6b6
|
| 3 |
+
size 19532905
|
checkpoint_1007000/target.decoder.layers_16.mlp.wi_0.kernel/0.6
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f5c26a0148693111163737706356599abf1983c7cd6d219b92c74e0a182365cc
|
| 3 |
+
size 19532508
|
checkpoint_1007000/target.decoder.layers_16.mlp.wi_0.kernel/0.7
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:706f93bcd08aa203e49091deb3e8d477004fe271813510b4b8b538b287b92b73
|
| 3 |
+
size 19533260
|
checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.query.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.query.kernel/.zarray.__tmp15573674163105097682.~1663960300422343~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.query.kernel/.zarray.__tmp6071354722398589434.~1663960300551684~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.query.kernel/.zarray.__tmp613296392217406530.~1663960300348204~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.query.kernel/.zarray.__tmp6341381603883440718.~1663960300607703~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.query.kernel/.zarray.__tmp6759559597614935639.~1663960300777500~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.query.kernel/.zarray.__tmp8699293708755251527.~1663960300176511~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.query.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:045baab6041f245b5f46e0b0b1a4cbc08e6d6f36e41d1bc5ca98790bd7e19d24
|
| 3 |
+
size 7815204
|
checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.query.kernel/0.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:14a7258d28f1d837b274d70e93b80db5902fb99cf70e333497df5b60eec77524
|
| 3 |
+
size 7815167
|
checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.query.kernel/0.2
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e355dd4779085a18405bb8396e59c445fb035857553f0503a5636e45e586ceb3
|
| 3 |
+
size 7812322
|
checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.query.kernel/0.3
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a9e62c70beff127862c86cc0f7c7fc650a08ff96e5e19bc54074db3f107aaa1a
|
| 3 |
+
size 7815583
|
checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.query.kernel/0.4
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:91862a589605e212065aef77e0d8347a1b22a90b23180e97db7628298ef7cf2b
|
| 3 |
+
size 7816419
|
checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.query.kernel/0.5
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:23aec16c79fde69d9e06e170348e0e09feb467c69b7819efc73f4c2359d3d854
|
| 3 |
+
size 7815160
|
checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.query.kernel/0.6
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:463551b7ca2530c1479feadc3d9369346b18490707c394439b32b0c679c57bd9
|
| 3 |
+
size 7816611
|
checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.query.kernel/0.7
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f82b614ee8f29a41885a002a3ae6947a9af12e20f0838357e768b86000eae7b6
|
| 3 |
+
size 7815301
|
checkpoint_1007000/target.decoder.layers_6.self_attention.value.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_6.self_attention.value.kernel/.zarray.__tmp10093915599364340592.~1663960300724598~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_6.self_attention.value.kernel/.zarray.__tmp1154904127954928177.~1663960300890722~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_6.self_attention.value.kernel/.zarray.__tmp13521656113468784784.~1663960300602639~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_6.self_attention.value.kernel/.zarray.__tmp15222130608404230048.~1663960300385982~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_6.self_attention.value.kernel/.zarray.__tmp4913473462980707586.~1663960300547148~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_6.self_attention.value.kernel/.zarray.__tmp571652921966429101.~1663960300623679~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_6.self_attention.value.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d364c372ffbb34dbea0a058f446da49011a5db0d6abf13dd491d2fe00783d327
|
| 3 |
+
size 7820064
|
checkpoint_1007000/target.decoder.layers_6.self_attention.value.kernel/0.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f5ded5d654b8e852f46b3b18f079d8d656a884fb5489921615a86158abfc13e7
|
| 3 |
+
size 7821409
|
checkpoint_1007000/target.decoder.layers_6.self_attention.value.kernel/0.2
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:772cdd4a7b85f47843e5ba019f71706d5ea17f2a32de431e6a94b72abdf9c693
|
| 3 |
+
size 7824680
|
checkpoint_1007000/target.decoder.layers_6.self_attention.value.kernel/0.3
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9d338325ce1036ae8c72cf1f2a3671f5456079d73c974bc756c68b61ffdcd848
|
| 3 |
+
size 7823698
|
checkpoint_1007000/target.decoder.layers_6.self_attention.value.kernel/0.4
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:deeb8f5e49e25d61b7945efb9ad2afae1b59035d5be0bc70517a4840c0668ec3
|
| 3 |
+
size 7825365
|
checkpoint_1007000/target.decoder.layers_6.self_attention.value.kernel/0.5
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:46329e2b7108ab44fbe1c45aadabc5dc183c851ee19385cc5eeee81df1ee7b05
|
| 3 |
+
size 7823158
|
checkpoint_1007000/target.decoder.layers_6.self_attention.value.kernel/0.6
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9b717cf6725538765c8fc6431f91e07250642addca497439d36b32c877f2f4c2
|
| 3 |
+
size 7823880
|