Commit
·
c285da1
1
Parent(s):
6cfb111
Upload part 65
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +46 -0
- checkpoint_1007000/state.param_states.encoder.layers_11.pre_mlp_layer_norm.scale.v/.zarray +1 -0
- checkpoint_1007000/state.param_states.encoder.layers_11.pre_mlp_layer_norm.scale.v/0 +0 -0
- checkpoint_1007000/state.param_states.encoder.layers_21.pre_attention_layer_norm.scale.v/.zarray +1 -0
- checkpoint_1007000/state.param_states.encoder.layers_21.pre_attention_layer_norm.scale.v/0 +0 -0
- checkpoint_1007000/target.decoder.layers_0.pre_self_attention_layer_norm.scale/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_0.pre_self_attention_layer_norm.scale/0 +0 -0
- checkpoint_1007000/target.decoder.layers_21.self_attention.out.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_21.self_attention.out.kernel/.zarray.__tmp12063062229005786519.~1663960300686802~ +1 -0
- checkpoint_1007000/target.decoder.layers_21.self_attention.out.kernel/.zarray.__tmp12307278983738319259.~1663960300308641~ +1 -0
- checkpoint_1007000/target.decoder.layers_21.self_attention.out.kernel/.zarray.__tmp5058963194176952291.~1663960300133053~ +1 -0
- checkpoint_1007000/target.decoder.layers_21.self_attention.out.kernel/.zarray.__tmp5977200547747821933.~1663960300268308~ +1 -0
- checkpoint_1007000/target.decoder.layers_21.self_attention.out.kernel/.zarray.__tmp9689018784294402003.~1663960300422829~ +1 -0
- checkpoint_1007000/target.decoder.layers_21.self_attention.out.kernel/.zarray.__tmp992409324478886072.~1663960300384650~ +1 -0
- checkpoint_1007000/target.decoder.layers_21.self_attention.out.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_21.self_attention.out.kernel/1.0 +3 -0
- checkpoint_1007000/target.decoder.layers_21.self_attention.out.kernel/2.0 +3 -0
- checkpoint_1007000/target.decoder.layers_21.self_attention.out.kernel/3.0 +3 -0
- checkpoint_1007000/target.decoder.layers_21.self_attention.out.kernel/4.0 +3 -0
- checkpoint_1007000/target.decoder.layers_21.self_attention.out.kernel/5.0 +3 -0
- checkpoint_1007000/target.decoder.layers_21.self_attention.out.kernel/6.0 +3 -0
- checkpoint_1007000/target.decoder.layers_21.self_attention.out.kernel/7.0 +3 -0
- checkpoint_1007000/target.decoder.layers_3.self_attention.value.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_3.self_attention.value.kernel/.zarray.__tmp10058268431463911414.~1663960300730374~ +1 -0
- checkpoint_1007000/target.decoder.layers_3.self_attention.value.kernel/.zarray.__tmp13354842767530236424.~1663960300686744~ +1 -0
- checkpoint_1007000/target.decoder.layers_3.self_attention.value.kernel/.zarray.__tmp14939280105210165697.~1663960300942053~ +1 -0
- checkpoint_1007000/target.decoder.layers_3.self_attention.value.kernel/.zarray.__tmp17688027251386092614.~1663960300865438~ +1 -0
- checkpoint_1007000/target.decoder.layers_3.self_attention.value.kernel/.zarray.__tmp3830925692305029951.~1663960300627445~ +1 -0
- checkpoint_1007000/target.decoder.layers_3.self_attention.value.kernel/.zarray.__tmp536837156884482554.~1663960300501024~ +1 -0
- checkpoint_1007000/target.decoder.layers_3.self_attention.value.kernel/.zarray.__tmp9302524747060270724.~1663960301025200~ +1 -0
- checkpoint_1007000/target.decoder.layers_3.self_attention.value.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_3.self_attention.value.kernel/0.1 +3 -0
- checkpoint_1007000/target.decoder.layers_3.self_attention.value.kernel/0.2 +3 -0
- checkpoint_1007000/target.decoder.layers_3.self_attention.value.kernel/0.3 +3 -0
- checkpoint_1007000/target.decoder.layers_3.self_attention.value.kernel/0.4 +3 -0
- checkpoint_1007000/target.decoder.layers_3.self_attention.value.kernel/0.5 +3 -0
- checkpoint_1007000/target.decoder.layers_3.self_attention.value.kernel/0.6 +3 -0
- checkpoint_1007000/target.decoder.layers_3.self_attention.value.kernel/0.7 +3 -0
- checkpoint_1007000/target.decoder.layers_4.mlp.wi_1.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_4.mlp.wi_1.kernel/.zarray.__tmp10735797227639527861.~1663960300684736~ +1 -0
- checkpoint_1007000/target.decoder.layers_4.mlp.wi_1.kernel/.zarray.__tmp11225109844392461786.~1663960300774747~ +1 -0
- checkpoint_1007000/target.decoder.layers_4.mlp.wi_1.kernel/.zarray.__tmp12350913800725825337.~1663960300423436~ +1 -0
- checkpoint_1007000/target.decoder.layers_4.mlp.wi_1.kernel/.zarray.__tmp18238927269669482103.~1663960300348437~ +1 -0
- checkpoint_1007000/target.decoder.layers_4.mlp.wi_1.kernel/.zarray.__tmp5281722543268233658.~1663960300551891~ +1 -0
- checkpoint_1007000/target.decoder.layers_4.mlp.wi_1.kernel/.zarray.__tmp703045921884514821.~1663960300600889~ +1 -0
- checkpoint_1007000/target.decoder.layers_4.mlp.wi_1.kernel/.zarray.__tmp8849042923007444349.~1663960300550553~ +1 -0
- checkpoint_1007000/target.decoder.layers_4.mlp.wi_1.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_4.mlp.wi_1.kernel/0.1 +3 -0
- checkpoint_1007000/target.decoder.layers_4.mlp.wi_1.kernel/0.2 +3 -0
- checkpoint_1007000/target.decoder.layers_4.mlp.wi_1.kernel/0.3 +3 -0
.gitattributes
CHANGED
|
@@ -3235,3 +3235,49 @@ checkpoint_1007000/target.decoder.layers_7.self_attention.out.kernel/7.0 filter=
|
|
| 3235 |
checkpoint_1007000/target.decoder.layers_7.self_attention.out.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
|
| 3236 |
checkpoint_1007000/target.decoder.layers_7.self_attention.out.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 3237 |
checkpoint_1007000/target.decoder.layers_7.self_attention.out.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 3235 |
checkpoint_1007000/target.decoder.layers_7.self_attention.out.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
|
| 3236 |
checkpoint_1007000/target.decoder.layers_7.self_attention.out.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 3237 |
checkpoint_1007000/target.decoder.layers_7.self_attention.out.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
|
| 3238 |
+
checkpoint_1007000/target.encoder.layers_9.attention.value.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 3239 |
+
checkpoint_1007000/target.encoder.layers_9.attention.value.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 3240 |
+
checkpoint_1007000/target.encoder.layers_9.attention.value.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 3241 |
+
checkpoint_1007000/target.encoder.layers_9.attention.value.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 3242 |
+
checkpoint_1007000/target.encoder.layers_9.attention.value.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 3243 |
+
checkpoint_1007000/target.encoder.layers_9.attention.value.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 3244 |
+
checkpoint_1007000/target.encoder.layers_9.attention.value.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 3245 |
+
checkpoint_1007000/target.encoder.layers_9.attention.value.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 3246 |
+
checkpoint_1007000/target.decoder.layers_6.encoder_decoder_attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 3247 |
+
checkpoint_1007000/target.decoder.layers_6.encoder_decoder_attention.key.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 3248 |
+
checkpoint_1007000/target.decoder.layers_6.encoder_decoder_attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 3249 |
+
checkpoint_1007000/target.decoder.layers_6.encoder_decoder_attention.key.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 3250 |
+
checkpoint_1007000/target.decoder.layers_6.encoder_decoder_attention.key.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 3251 |
+
checkpoint_1007000/target.decoder.layers_6.encoder_decoder_attention.key.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 3252 |
+
checkpoint_1007000/target.decoder.layers_6.encoder_decoder_attention.key.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 3253 |
+
checkpoint_1007000/target.decoder.layers_6.encoder_decoder_attention.key.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 3254 |
+
checkpoint_1007000/target.decoder.layers_3.self_attention.value.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 3255 |
+
checkpoint_1007000/target.decoder.layers_3.self_attention.value.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 3256 |
+
checkpoint_1007000/target.decoder.layers_3.self_attention.value.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 3257 |
+
checkpoint_1007000/target.decoder.layers_3.self_attention.value.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 3258 |
+
checkpoint_1007000/target.decoder.layers_3.self_attention.value.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 3259 |
+
checkpoint_1007000/target.decoder.layers_3.self_attention.value.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 3260 |
+
checkpoint_1007000/target.decoder.layers_3.self_attention.value.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 3261 |
+
checkpoint_1007000/target.decoder.layers_3.self_attention.value.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 3262 |
+
checkpoint_1007000/target.decoder.layers_4.mlp.wi_1.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 3263 |
+
checkpoint_1007000/target.decoder.layers_4.mlp.wi_1.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 3264 |
+
checkpoint_1007000/target.decoder.layers_4.mlp.wi_1.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 3265 |
+
checkpoint_1007000/target.decoder.layers_4.mlp.wi_1.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 3266 |
+
checkpoint_1007000/target.decoder.layers_4.mlp.wi_1.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 3267 |
+
checkpoint_1007000/target.decoder.layers_4.mlp.wi_1.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 3268 |
+
checkpoint_1007000/target.decoder.layers_4.mlp.wi_1.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 3269 |
+
checkpoint_1007000/target.decoder.layers_4.mlp.wi_1.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 3270 |
+
checkpoint_1007000/target.decoder.layers_21.self_attention.out.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
|
| 3271 |
+
checkpoint_1007000/target.decoder.layers_21.self_attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 3272 |
+
checkpoint_1007000/target.decoder.layers_21.self_attention.out.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 3273 |
+
checkpoint_1007000/target.decoder.layers_21.self_attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 3274 |
+
checkpoint_1007000/target.decoder.layers_21.self_attention.out.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
|
| 3275 |
+
checkpoint_1007000/target.decoder.layers_21.self_attention.out.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
|
| 3276 |
+
checkpoint_1007000/target.decoder.layers_21.self_attention.out.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 3277 |
+
checkpoint_1007000/target.decoder.layers_21.self_attention.out.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
|
| 3278 |
+
checkpoint_1007000/target.encoder.layers_17.attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 3279 |
+
checkpoint_1007000/target.encoder.layers_17.attention.query.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 3280 |
+
checkpoint_1007000/target.encoder.layers_17.attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 3281 |
+
checkpoint_1007000/target.encoder.layers_17.attention.query.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 3282 |
+
checkpoint_1007000/target.encoder.layers_17.attention.query.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 3283 |
+
checkpoint_1007000/target.encoder.layers_17.attention.query.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
checkpoint_1007000/state.param_states.encoder.layers_11.pre_mlp_layer_norm.scale.v/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/state.param_states.encoder.layers_11.pre_mlp_layer_norm.scale.v/0
ADDED
|
Binary file (15.3 kB). View file
|
|
|
checkpoint_1007000/state.param_states.encoder.layers_21.pre_attention_layer_norm.scale.v/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/state.param_states.encoder.layers_21.pre_attention_layer_norm.scale.v/0
ADDED
|
Binary file (14.7 kB). View file
|
|
|
checkpoint_1007000/target.decoder.layers_0.pre_self_attention_layer_norm.scale/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_0.pre_self_attention_layer_norm.scale/0
ADDED
|
Binary file (14.7 kB). View file
|
|
|
checkpoint_1007000/target.decoder.layers_21.self_attention.out.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_21.self_attention.out.kernel/.zarray.__tmp12063062229005786519.~1663960300686802~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_21.self_attention.out.kernel/.zarray.__tmp12307278983738319259.~1663960300308641~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_21.self_attention.out.kernel/.zarray.__tmp5058963194176952291.~1663960300133053~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_21.self_attention.out.kernel/.zarray.__tmp5977200547747821933.~1663960300268308~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_21.self_attention.out.kernel/.zarray.__tmp9689018784294402003.~1663960300422829~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_21.self_attention.out.kernel/.zarray.__tmp992409324478886072.~1663960300384650~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_21.self_attention.out.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2f80599baf4db6cae318d67990cf4db8b965d048caaaf63bdf95fa2bc64a28af
|
| 3 |
+
size 7799722
|
checkpoint_1007000/target.decoder.layers_21.self_attention.out.kernel/1.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c9b787c5a7e85de26fa45970f0f5806421775a9e6586b3e49d8a666b4249d4ec
|
| 3 |
+
size 7801313
|
checkpoint_1007000/target.decoder.layers_21.self_attention.out.kernel/2.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e11c3ceb62fcef7d64b9de4f72d96dc9c5afc2adc12e6a9c2d03a8134b8cca82
|
| 3 |
+
size 7801180
|
checkpoint_1007000/target.decoder.layers_21.self_attention.out.kernel/3.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:dc41fc1e4cd29490b65ad073ae69b379ce5a7907074837cb4d1dc81d717bb1b5
|
| 3 |
+
size 7799131
|
checkpoint_1007000/target.decoder.layers_21.self_attention.out.kernel/4.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:08ce4266e66607c6eac269ba5705ec77ec29a4dd5aa794fcfebd79be0a7a78a3
|
| 3 |
+
size 7800397
|
checkpoint_1007000/target.decoder.layers_21.self_attention.out.kernel/5.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:353d4dd940a5d2594765b77c82b88069c3efce2138222e2f200dc7053dba0c20
|
| 3 |
+
size 7800162
|
checkpoint_1007000/target.decoder.layers_21.self_attention.out.kernel/6.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:044160f5088a9dddb12363dc59ecb3c965e618fbb79b52356fe466b8cefb76e7
|
| 3 |
+
size 7799455
|
checkpoint_1007000/target.decoder.layers_21.self_attention.out.kernel/7.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a8e67bd4f562d07464aa01a30c991431b29ed6169c429059359514a50e02574a
|
| 3 |
+
size 7798274
|
checkpoint_1007000/target.decoder.layers_3.self_attention.value.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_3.self_attention.value.kernel/.zarray.__tmp10058268431463911414.~1663960300730374~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_3.self_attention.value.kernel/.zarray.__tmp13354842767530236424.~1663960300686744~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_3.self_attention.value.kernel/.zarray.__tmp14939280105210165697.~1663960300942053~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_3.self_attention.value.kernel/.zarray.__tmp17688027251386092614.~1663960300865438~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_3.self_attention.value.kernel/.zarray.__tmp3830925692305029951.~1663960300627445~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_3.self_attention.value.kernel/.zarray.__tmp536837156884482554.~1663960300501024~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_3.self_attention.value.kernel/.zarray.__tmp9302524747060270724.~1663960301025200~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_3.self_attention.value.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2dc3538d721df73402a216ee99aa426fe9ce4d5a4eab7a0eaa0c0c1011a25859
|
| 3 |
+
size 7823209
|
checkpoint_1007000/target.decoder.layers_3.self_attention.value.kernel/0.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7bf0c7e73d7ff3bb7b778d0e220ef0abefcef34b0a8990004df4068437e3fd31
|
| 3 |
+
size 7822150
|
checkpoint_1007000/target.decoder.layers_3.self_attention.value.kernel/0.2
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:18fdcb54b823835969e8c17809ea78b77ca108ed940c5c91ccad477188c3414e
|
| 3 |
+
size 7819731
|
checkpoint_1007000/target.decoder.layers_3.self_attention.value.kernel/0.3
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0d1a0fcc9c7fff9d4dcc79f4381f977479f59c380f358f1e544099de92223c8e
|
| 3 |
+
size 7820801
|
checkpoint_1007000/target.decoder.layers_3.self_attention.value.kernel/0.4
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c64f41beae3922a79a1cbada90ba096fb66aa621569a282766809202c096da29
|
| 3 |
+
size 7823925
|
checkpoint_1007000/target.decoder.layers_3.self_attention.value.kernel/0.5
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3bc3e102fa9204a0490b65a53003cedcd63a762a39f0aff9048429c5170cf1bf
|
| 3 |
+
size 7821268
|
checkpoint_1007000/target.decoder.layers_3.self_attention.value.kernel/0.6
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c902c46923bc6a386091a50f3b00c07b698fd7de9b9dfa3dba8cb07b24e85285
|
| 3 |
+
size 7821659
|
checkpoint_1007000/target.decoder.layers_3.self_attention.value.kernel/0.7
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:df024f96a48c0fb347283360e2b92c2bcf8c40a5169960d6a452609b1f881d0c
|
| 3 |
+
size 7824710
|
checkpoint_1007000/target.decoder.layers_4.mlp.wi_1.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_4.mlp.wi_1.kernel/.zarray.__tmp10735797227639527861.~1663960300684736~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_4.mlp.wi_1.kernel/.zarray.__tmp11225109844392461786.~1663960300774747~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_4.mlp.wi_1.kernel/.zarray.__tmp12350913800725825337.~1663960300423436~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_4.mlp.wi_1.kernel/.zarray.__tmp18238927269669482103.~1663960300348437~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_4.mlp.wi_1.kernel/.zarray.__tmp5281722543268233658.~1663960300551891~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_4.mlp.wi_1.kernel/.zarray.__tmp703045921884514821.~1663960300600889~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_4.mlp.wi_1.kernel/.zarray.__tmp8849042923007444349.~1663960300550553~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_4.mlp.wi_1.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a1e737aa0c902137364f61d0758ebcd730e762549d699825af3bc5baecc893a4
|
| 3 |
+
size 19542114
|
checkpoint_1007000/target.decoder.layers_4.mlp.wi_1.kernel/0.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a294763ac0b5545790eb62bbef17e818695bd020fb7435cdbc7e53a4d49c1fe2
|
| 3 |
+
size 19542449
|
checkpoint_1007000/target.decoder.layers_4.mlp.wi_1.kernel/0.2
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:df987cee688129f92d9aae6b6abe81e1df52a7b1bc9100f6755eb024abf8272d
|
| 3 |
+
size 19542725
|
checkpoint_1007000/target.decoder.layers_4.mlp.wi_1.kernel/0.3
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a07b1efc576f5b6999ed726d67ad282f5191c4687f5241da0b3aebbbf7cc7763
|
| 3 |
+
size 19541115
|