Commit
·
42371b3
1
Parent(s):
20179e4
Upload part 71
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +48 -0
- checkpoint_1007000/state.param_states.encoder.layers_4.pre_mlp_layer_norm.scale.v/.zarray +1 -0
- checkpoint_1007000/state.param_states.encoder.layers_4.pre_mlp_layer_norm.scale.v/0 +0 -0
- checkpoint_1007000/state.param_states.encoder.layers_8.pre_mlp_layer_norm.scale.v/.zarray +1 -0
- checkpoint_1007000/state.param_states.encoder.layers_8.pre_mlp_layer_norm.scale.v/0 +0 -0
- checkpoint_1007000/target.decoder.layers_1.pre_self_attention_layer_norm.scale/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_1.pre_self_attention_layer_norm.scale/0 +0 -0
- checkpoint_1007000/target.decoder.layers_18.self_attention.value.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_18.self_attention.value.kernel/.zarray.__tmp10549553869379367245.~1663960300865419~ +1 -0
- checkpoint_1007000/target.decoder.layers_18.self_attention.value.kernel/.zarray.__tmp11121093595175635601.~1663960300384125~ +1 -0
- checkpoint_1007000/target.decoder.layers_18.self_attention.value.kernel/.zarray.__tmp160614029260815911.~1663960300553404~ +1 -0
- checkpoint_1007000/target.decoder.layers_18.self_attention.value.kernel/.zarray.__tmp5834752992321814715.~1663960300776849~ +1 -0
- checkpoint_1007000/target.decoder.layers_18.self_attention.value.kernel/.zarray.__tmp700358743334726418.~1663960300468524~ +1 -0
- checkpoint_1007000/target.decoder.layers_18.self_attention.value.kernel/.zarray.__tmp7579797148608786836.~1663960300347922~ +1 -0
- checkpoint_1007000/target.decoder.layers_18.self_attention.value.kernel/.zarray.__tmp9044194797125352365.~1663960300420679~ +1 -0
- checkpoint_1007000/target.decoder.layers_18.self_attention.value.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_18.self_attention.value.kernel/0.1 +3 -0
- checkpoint_1007000/target.decoder.layers_18.self_attention.value.kernel/0.2 +3 -0
- checkpoint_1007000/target.decoder.layers_18.self_attention.value.kernel/0.3 +3 -0
- checkpoint_1007000/target.decoder.layers_18.self_attention.value.kernel/0.4 +3 -0
- checkpoint_1007000/target.decoder.layers_18.self_attention.value.kernel/0.5 +3 -0
- checkpoint_1007000/target.decoder.layers_18.self_attention.value.kernel/0.6 +3 -0
- checkpoint_1007000/target.decoder.layers_18.self_attention.value.kernel/0.7 +3 -0
- checkpoint_1007000/target.decoder.layers_20.pre_cross_attention_layer_norm.scale/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_20.pre_cross_attention_layer_norm.scale/0 +0 -0
- checkpoint_1007000/target.decoder.layers_20.pre_mlp_layer_norm.scale/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_20.pre_mlp_layer_norm.scale/0 +0 -0
- checkpoint_1007000/target.decoder.layers_21.encoder_decoder_attention.value.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_21.encoder_decoder_attention.value.kernel/.zarray.__tmp11496306268209692467.~1663960300547034~ +1 -0
- checkpoint_1007000/target.decoder.layers_21.encoder_decoder_attention.value.kernel/.zarray.__tmp12655539606937909516.~1663960300685932~ +1 -0
- checkpoint_1007000/target.decoder.layers_21.encoder_decoder_attention.value.kernel/.zarray.__tmp3544814769853161108.~1663960300728937~ +1 -0
- checkpoint_1007000/target.decoder.layers_21.encoder_decoder_attention.value.kernel/.zarray.__tmp4608099628127010795.~1663960300823469~ +1 -0
- checkpoint_1007000/target.decoder.layers_21.encoder_decoder_attention.value.kernel/.zarray.__tmp5588453964102254496.~1663960300425654~ +1 -0
- checkpoint_1007000/target.decoder.layers_21.encoder_decoder_attention.value.kernel/.zarray.__tmp7659060619832595388.~1663960300384182~ +1 -0
- checkpoint_1007000/target.decoder.layers_21.encoder_decoder_attention.value.kernel/.zarray.__tmp9264541749749270809.~1663960300775468~ +1 -0
- checkpoint_1007000/target.decoder.layers_21.encoder_decoder_attention.value.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_21.encoder_decoder_attention.value.kernel/0.1 +3 -0
- checkpoint_1007000/target.decoder.layers_21.encoder_decoder_attention.value.kernel/0.2 +3 -0
- checkpoint_1007000/target.decoder.layers_21.encoder_decoder_attention.value.kernel/0.3 +3 -0
- checkpoint_1007000/target.decoder.layers_21.encoder_decoder_attention.value.kernel/0.4 +3 -0
- checkpoint_1007000/target.decoder.layers_21.encoder_decoder_attention.value.kernel/0.5 +3 -0
- checkpoint_1007000/target.decoder.layers_21.encoder_decoder_attention.value.kernel/0.6 +3 -0
- checkpoint_1007000/target.decoder.layers_21.encoder_decoder_attention.value.kernel/0.7 +3 -0
- checkpoint_1007000/target.decoder.layers_22.encoder_decoder_attention.key.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_22.encoder_decoder_attention.key.kernel/.zarray.__tmp10728710319527467546.~1663960300471589~ +1 -0
- checkpoint_1007000/target.decoder.layers_22.encoder_decoder_attention.key.kernel/.zarray.__tmp12169895662662803389.~1663960300466249~ +1 -0
- checkpoint_1007000/target.decoder.layers_22.encoder_decoder_attention.key.kernel/.zarray.__tmp12797161462038635779.~1663960300548669~ +1 -0
- checkpoint_1007000/target.decoder.layers_22.encoder_decoder_attention.key.kernel/.zarray.__tmp1564285186274598784.~1663960300271762~ +1 -0
- checkpoint_1007000/target.decoder.layers_22.encoder_decoder_attention.key.kernel/.zarray.__tmp2668172169137704345.~1663960300495913~ +1 -0
- checkpoint_1007000/target.decoder.layers_22.encoder_decoder_attention.key.kernel/.zarray.__tmp588842737493045608.~1663960300779135~ +1 -0
.gitattributes
CHANGED
|
@@ -3507,3 +3507,51 @@ checkpoint_1007000/target.encoder.layers_13.attention.key.kernel/0.5 filter=lfs
|
|
| 3507 |
checkpoint_1007000/target.encoder.layers_13.attention.key.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 3508 |
checkpoint_1007000/target.encoder.layers_13.attention.key.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 3509 |
checkpoint_1007000/target.encoder.layers_13.attention.key.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 3507 |
checkpoint_1007000/target.encoder.layers_13.attention.key.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 3508 |
checkpoint_1007000/target.encoder.layers_13.attention.key.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 3509 |
checkpoint_1007000/target.encoder.layers_13.attention.key.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 3510 |
+
checkpoint_1007000/target.decoder.layers_21.encoder_decoder_attention.value.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 3511 |
+
checkpoint_1007000/target.decoder.layers_21.encoder_decoder_attention.value.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 3512 |
+
checkpoint_1007000/target.decoder.layers_21.encoder_decoder_attention.value.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 3513 |
+
checkpoint_1007000/target.decoder.layers_21.encoder_decoder_attention.value.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 3514 |
+
checkpoint_1007000/target.decoder.layers_21.encoder_decoder_attention.value.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 3515 |
+
checkpoint_1007000/target.decoder.layers_21.encoder_decoder_attention.value.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 3516 |
+
checkpoint_1007000/target.decoder.layers_21.encoder_decoder_attention.value.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 3517 |
+
checkpoint_1007000/target.decoder.layers_21.encoder_decoder_attention.value.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 3518 |
+
checkpoint_1007000/target.decoder.layers_8.self_attention.value.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 3519 |
+
checkpoint_1007000/target.decoder.layers_8.self_attention.value.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 3520 |
+
checkpoint_1007000/target.decoder.layers_8.self_attention.value.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 3521 |
+
checkpoint_1007000/target.decoder.layers_8.self_attention.value.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 3522 |
+
checkpoint_1007000/target.decoder.layers_8.self_attention.value.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 3523 |
+
checkpoint_1007000/target.decoder.layers_8.self_attention.value.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 3524 |
+
checkpoint_1007000/target.decoder.layers_8.self_attention.value.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 3525 |
+
checkpoint_1007000/target.decoder.layers_8.self_attention.value.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 3526 |
+
checkpoint_1007000/target.decoder.layers_18.self_attention.value.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 3527 |
+
checkpoint_1007000/target.decoder.layers_18.self_attention.value.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 3528 |
+
checkpoint_1007000/target.decoder.layers_18.self_attention.value.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 3529 |
+
checkpoint_1007000/target.decoder.layers_18.self_attention.value.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 3530 |
+
checkpoint_1007000/target.decoder.layers_18.self_attention.value.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 3531 |
+
checkpoint_1007000/target.decoder.layers_18.self_attention.value.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 3532 |
+
checkpoint_1007000/target.decoder.layers_18.self_attention.value.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 3533 |
+
checkpoint_1007000/target.decoder.layers_18.self_attention.value.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 3534 |
+
checkpoint_1007000/target.decoder.layers_22.encoder_decoder_attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 3535 |
+
checkpoint_1007000/target.decoder.layers_22.encoder_decoder_attention.key.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 3536 |
+
checkpoint_1007000/target.decoder.layers_22.encoder_decoder_attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 3537 |
+
checkpoint_1007000/target.decoder.layers_22.encoder_decoder_attention.key.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 3538 |
+
checkpoint_1007000/target.decoder.layers_22.encoder_decoder_attention.key.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 3539 |
+
checkpoint_1007000/target.decoder.layers_22.encoder_decoder_attention.key.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 3540 |
+
checkpoint_1007000/target.decoder.layers_22.encoder_decoder_attention.key.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 3541 |
+
checkpoint_1007000/target.decoder.layers_22.encoder_decoder_attention.key.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 3542 |
+
checkpoint_1007000/target.encoder.layers_5.attention.value.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 3543 |
+
checkpoint_1007000/target.encoder.layers_5.attention.value.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 3544 |
+
checkpoint_1007000/target.encoder.layers_5.attention.value.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 3545 |
+
checkpoint_1007000/target.encoder.layers_5.attention.value.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 3546 |
+
checkpoint_1007000/target.encoder.layers_5.attention.value.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 3547 |
+
checkpoint_1007000/target.encoder.layers_5.attention.value.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 3548 |
+
checkpoint_1007000/target.encoder.layers_5.attention.value.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 3549 |
+
checkpoint_1007000/target.encoder.layers_5.attention.value.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 3550 |
+
checkpoint_1007000/target.encoder.layers_0.mlp.wi_0.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 3551 |
+
checkpoint_1007000/target.encoder.layers_0.mlp.wi_0.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 3552 |
+
checkpoint_1007000/target.encoder.layers_0.mlp.wi_0.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 3553 |
+
checkpoint_1007000/target.encoder.layers_0.mlp.wi_0.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 3554 |
+
checkpoint_1007000/target.encoder.layers_0.mlp.wi_0.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 3555 |
+
checkpoint_1007000/target.encoder.layers_0.mlp.wi_0.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 3556 |
+
checkpoint_1007000/target.encoder.layers_0.mlp.wi_0.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 3557 |
+
checkpoint_1007000/target.encoder.layers_0.mlp.wi_0.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
checkpoint_1007000/state.param_states.encoder.layers_4.pre_mlp_layer_norm.scale.v/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/state.param_states.encoder.layers_4.pre_mlp_layer_norm.scale.v/0
ADDED
|
Binary file (15.3 kB). View file
|
|
|
checkpoint_1007000/state.param_states.encoder.layers_8.pre_mlp_layer_norm.scale.v/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/state.param_states.encoder.layers_8.pre_mlp_layer_norm.scale.v/0
ADDED
|
Binary file (15.3 kB). View file
|
|
|
checkpoint_1007000/target.decoder.layers_1.pre_self_attention_layer_norm.scale/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_1.pre_self_attention_layer_norm.scale/0
ADDED
|
Binary file (15.1 kB). View file
|
|
|
checkpoint_1007000/target.decoder.layers_18.self_attention.value.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_18.self_attention.value.kernel/.zarray.__tmp10549553869379367245.~1663960300865419~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_18.self_attention.value.kernel/.zarray.__tmp11121093595175635601.~1663960300384125~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_18.self_attention.value.kernel/.zarray.__tmp160614029260815911.~1663960300553404~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_18.self_attention.value.kernel/.zarray.__tmp5834752992321814715.~1663960300776849~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_18.self_attention.value.kernel/.zarray.__tmp700358743334726418.~1663960300468524~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_18.self_attention.value.kernel/.zarray.__tmp7579797148608786836.~1663960300347922~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_18.self_attention.value.kernel/.zarray.__tmp9044194797125352365.~1663960300420679~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_18.self_attention.value.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:782017b399e3b0690720b609bbe42e168b510da77955c7b6a2b58d3a48e4a96a
|
| 3 |
+
size 7806843
|
checkpoint_1007000/target.decoder.layers_18.self_attention.value.kernel/0.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ddc0831929c5877a18526d22d826c0ef7c2e995f0cb2c2db8049e81ee3a00586
|
| 3 |
+
size 7827565
|
checkpoint_1007000/target.decoder.layers_18.self_attention.value.kernel/0.2
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b05d7cba70df9a6f6ad25d889e9218a66897bacbbd556b2f259e36e69b6bea5b
|
| 3 |
+
size 7804923
|
checkpoint_1007000/target.decoder.layers_18.self_attention.value.kernel/0.3
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3bca929c5bad9a2704bf0febfb684339ae5837627ab22a47e31f612b31725c0a
|
| 3 |
+
size 7802557
|
checkpoint_1007000/target.decoder.layers_18.self_attention.value.kernel/0.4
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b067c18174ff4d4f12176be08345a2fdf80d1e6e1098db5d5aa5071a9f2e01c8
|
| 3 |
+
size 7816371
|
checkpoint_1007000/target.decoder.layers_18.self_attention.value.kernel/0.5
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:87adecab49c8a699c02ca790b4adaa6b38fa6321be245cf6151759b1daf67923
|
| 3 |
+
size 7804117
|
checkpoint_1007000/target.decoder.layers_18.self_attention.value.kernel/0.6
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c8ad04b7b2198ff8af02e7079b28af77138031b2a6a751134decb8bc9adb4cf2
|
| 3 |
+
size 7804157
|
checkpoint_1007000/target.decoder.layers_18.self_attention.value.kernel/0.7
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:654624529939948e926136a7f8ece7bc0a0cbf4b0f7dbbd90cd0f099581154a7
|
| 3 |
+
size 7811580
|
checkpoint_1007000/target.decoder.layers_20.pre_cross_attention_layer_norm.scale/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_20.pre_cross_attention_layer_norm.scale/0
ADDED
|
Binary file (14.5 kB). View file
|
|
|
checkpoint_1007000/target.decoder.layers_20.pre_mlp_layer_norm.scale/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_20.pre_mlp_layer_norm.scale/0
ADDED
|
Binary file (13.9 kB). View file
|
|
|
checkpoint_1007000/target.decoder.layers_21.encoder_decoder_attention.value.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_21.encoder_decoder_attention.value.kernel/.zarray.__tmp11496306268209692467.~1663960300547034~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_21.encoder_decoder_attention.value.kernel/.zarray.__tmp12655539606937909516.~1663960300685932~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_21.encoder_decoder_attention.value.kernel/.zarray.__tmp3544814769853161108.~1663960300728937~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_21.encoder_decoder_attention.value.kernel/.zarray.__tmp4608099628127010795.~1663960300823469~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_21.encoder_decoder_attention.value.kernel/.zarray.__tmp5588453964102254496.~1663960300425654~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_21.encoder_decoder_attention.value.kernel/.zarray.__tmp7659060619832595388.~1663960300384182~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_21.encoder_decoder_attention.value.kernel/.zarray.__tmp9264541749749270809.~1663960300775468~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_21.encoder_decoder_attention.value.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b7968b078d437966fc9854af7c8ac07e906c3be452f02105edb3d3d0c9d7298a
|
| 3 |
+
size 7806578
|
checkpoint_1007000/target.decoder.layers_21.encoder_decoder_attention.value.kernel/0.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7982a67358e2ee6e0fab2d4d193ead6c6ee0f718930a33557e22e0e7dd8a6188
|
| 3 |
+
size 7806770
|
checkpoint_1007000/target.decoder.layers_21.encoder_decoder_attention.value.kernel/0.2
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f7796a3e2c730d976095b69db803729ede20ce9ebe647d1f8350808e6ae87484
|
| 3 |
+
size 7804420
|
checkpoint_1007000/target.decoder.layers_21.encoder_decoder_attention.value.kernel/0.3
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c17dc3278387de7da12a547360f4331a066e49a89c9b10538fd16f8d315f5b64
|
| 3 |
+
size 7816022
|
checkpoint_1007000/target.decoder.layers_21.encoder_decoder_attention.value.kernel/0.4
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:429f4e80d0f835d8eb91401215511ed1d8c9eee0fa8fc6cdaf18f9be738a9ee2
|
| 3 |
+
size 7809431
|
checkpoint_1007000/target.decoder.layers_21.encoder_decoder_attention.value.kernel/0.5
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f46b3672ea395cb8c32ba65832652d12d4babc3a3511697846ecba0900fa137c
|
| 3 |
+
size 7802528
|
checkpoint_1007000/target.decoder.layers_21.encoder_decoder_attention.value.kernel/0.6
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ae8dbe18ec21a84330c5dcbda403f2329664b447ea7d0c75f9cc6c1d312603f1
|
| 3 |
+
size 7807602
|
checkpoint_1007000/target.decoder.layers_21.encoder_decoder_attention.value.kernel/0.7
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:56a29fc3bc64b295551b5bd56e48dc3656ec743e08ea4855f5978cb6f7a94620
|
| 3 |
+
size 7803910
|
checkpoint_1007000/target.decoder.layers_22.encoder_decoder_attention.key.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_22.encoder_decoder_attention.key.kernel/.zarray.__tmp10728710319527467546.~1663960300471589~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_22.encoder_decoder_attention.key.kernel/.zarray.__tmp12169895662662803389.~1663960300466249~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_22.encoder_decoder_attention.key.kernel/.zarray.__tmp12797161462038635779.~1663960300548669~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_22.encoder_decoder_attention.key.kernel/.zarray.__tmp1564285186274598784.~1663960300271762~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_22.encoder_decoder_attention.key.kernel/.zarray.__tmp2668172169137704345.~1663960300495913~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_22.encoder_decoder_attention.key.kernel/.zarray.__tmp588842737493045608.~1663960300779135~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|