Commit
·
6cfb111
1
Parent(s):
824ee4f
Upload part 64
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +48 -0
- checkpoint_1007000/state.param_states.decoder.layers_21.pre_mlp_layer_norm.scale.v/.zarray +1 -0
- checkpoint_1007000/state.param_states.decoder.layers_21.pre_mlp_layer_norm.scale.v/0 +0 -0
- checkpoint_1007000/state.param_states.decoder.layers_7.pre_cross_attention_layer_norm.scale.v/.zarray +1 -0
- checkpoint_1007000/state.param_states.decoder.layers_7.pre_cross_attention_layer_norm.scale.v/0 +0 -0
- checkpoint_1007000/state.param_states.encoder.layers_19.pre_attention_layer_norm.scale.v/.zarray +1 -0
- checkpoint_1007000/state.param_states.encoder.layers_19.pre_attention_layer_norm.scale.v/0 +0 -0
- checkpoint_1007000/target.decoder.layers_11.mlp.wi_1.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_11.mlp.wi_1.kernel/.zarray.__tmp12181212485329137517.~1663960300826378~ +1 -0
- checkpoint_1007000/target.decoder.layers_11.mlp.wi_1.kernel/.zarray.__tmp17790706748405652845.~1663960300688192~ +1 -0
- checkpoint_1007000/target.decoder.layers_11.mlp.wi_1.kernel/.zarray.__tmp18195175323702989595.~1663960300090157~ +1 -0
- checkpoint_1007000/target.decoder.layers_11.mlp.wi_1.kernel/.zarray.__tmp4865545297524934550.~1663960300307608~ +1 -0
- checkpoint_1007000/target.decoder.layers_11.mlp.wi_1.kernel/.zarray.__tmp8183705587183143898.~1663960300726035~ +1 -0
- checkpoint_1007000/target.decoder.layers_11.mlp.wi_1.kernel/.zarray.__tmp9199685975903289795.~1663960300351135~ +1 -0
- checkpoint_1007000/target.decoder.layers_11.mlp.wi_1.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_11.mlp.wi_1.kernel/0.1 +3 -0
- checkpoint_1007000/target.decoder.layers_11.mlp.wi_1.kernel/0.2 +3 -0
- checkpoint_1007000/target.decoder.layers_11.mlp.wi_1.kernel/0.3 +3 -0
- checkpoint_1007000/target.decoder.layers_11.mlp.wi_1.kernel/0.4 +3 -0
- checkpoint_1007000/target.decoder.layers_11.mlp.wi_1.kernel/0.5 +3 -0
- checkpoint_1007000/target.decoder.layers_11.mlp.wi_1.kernel/0.6 +3 -0
- checkpoint_1007000/target.decoder.layers_11.mlp.wi_1.kernel/0.7 +3 -0
- checkpoint_1007000/target.decoder.layers_17.self_attention.query.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_17.self_attention.query.kernel/.zarray.__tmp123133317181209426.~1663960300865681~ +1 -0
- checkpoint_1007000/target.decoder.layers_17.self_attention.query.kernel/.zarray.__tmp12829050581861680553.~1663960300728711~ +1 -0
- checkpoint_1007000/target.decoder.layers_17.self_attention.query.kernel/.zarray.__tmp12983276121360685771.~1663960300500371~ +1 -0
- checkpoint_1007000/target.decoder.layers_17.self_attention.query.kernel/.zarray.__tmp1528149515108167277.~1663960300777568~ +1 -0
- checkpoint_1007000/target.decoder.layers_17.self_attention.query.kernel/.zarray.__tmp1687850696384403133.~1663960300313523~ +1 -0
- checkpoint_1007000/target.decoder.layers_17.self_attention.query.kernel/.zarray.__tmp4591981584490319116.~1663960300421486~ +1 -0
- checkpoint_1007000/target.decoder.layers_17.self_attention.query.kernel/.zarray.__tmp7033595672112296407.~1663960300384128~ +1 -0
- checkpoint_1007000/target.decoder.layers_17.self_attention.query.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_17.self_attention.query.kernel/0.1 +3 -0
- checkpoint_1007000/target.decoder.layers_17.self_attention.query.kernel/0.2 +3 -0
- checkpoint_1007000/target.decoder.layers_17.self_attention.query.kernel/0.3 +3 -0
- checkpoint_1007000/target.decoder.layers_17.self_attention.query.kernel/0.4 +3 -0
- checkpoint_1007000/target.decoder.layers_17.self_attention.query.kernel/0.5 +3 -0
- checkpoint_1007000/target.decoder.layers_17.self_attention.query.kernel/0.6 +3 -0
- checkpoint_1007000/target.decoder.layers_17.self_attention.query.kernel/0.7 +3 -0
- checkpoint_1007000/target.decoder.layers_22.encoder_decoder_attention.query.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_22.encoder_decoder_attention.query.kernel/.zarray.__tmp13412709914363784685.~1663960300601562~ +1 -0
- checkpoint_1007000/target.decoder.layers_22.encoder_decoder_attention.query.kernel/.zarray.__tmp14980511374361568976.~1663960300421148~ +1 -0
- checkpoint_1007000/target.decoder.layers_22.encoder_decoder_attention.query.kernel/.zarray.__tmp16452437899863196389.~1663960300501046~ +1 -0
- checkpoint_1007000/target.decoder.layers_22.encoder_decoder_attention.query.kernel/.zarray.__tmp2798774854545907582.~1663960300941517~ +1 -0
- checkpoint_1007000/target.decoder.layers_22.encoder_decoder_attention.query.kernel/.zarray.__tmp6451480922883845549.~1663960300546575~ +1 -0
- checkpoint_1007000/target.decoder.layers_22.encoder_decoder_attention.query.kernel/.zarray.__tmp7083799652499692707.~1663960300686230~ +1 -0
- checkpoint_1007000/target.decoder.layers_22.encoder_decoder_attention.query.kernel/.zarray.__tmp7360943157167004366.~1663960300627130~ +1 -0
- checkpoint_1007000/target.decoder.layers_22.encoder_decoder_attention.query.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_22.encoder_decoder_attention.query.kernel/0.1 +3 -0
- checkpoint_1007000/target.decoder.layers_22.encoder_decoder_attention.query.kernel/0.2 +3 -0
- checkpoint_1007000/target.decoder.layers_22.encoder_decoder_attention.query.kernel/0.3 +3 -0
.gitattributes
CHANGED
|
@@ -3187,3 +3187,51 @@ checkpoint_1007000/target.encoder.layers_6.attention.key.kernel/0.5 filter=lfs d
|
|
| 3187 |
checkpoint_1007000/target.encoder.layers_6.attention.key.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 3188 |
checkpoint_1007000/target.encoder.layers_6.attention.key.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 3189 |
checkpoint_1007000/target.encoder.layers_6.attention.key.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 3187 |
checkpoint_1007000/target.encoder.layers_6.attention.key.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 3188 |
checkpoint_1007000/target.encoder.layers_6.attention.key.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 3189 |
checkpoint_1007000/target.encoder.layers_6.attention.key.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 3190 |
+
checkpoint_1007000/target.encoder.layers_5.attention.out.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
|
| 3191 |
+
checkpoint_1007000/target.encoder.layers_5.attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 3192 |
+
checkpoint_1007000/target.encoder.layers_5.attention.out.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 3193 |
+
checkpoint_1007000/target.encoder.layers_5.attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 3194 |
+
checkpoint_1007000/target.encoder.layers_5.attention.out.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
|
| 3195 |
+
checkpoint_1007000/target.encoder.layers_5.attention.out.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
|
| 3196 |
+
checkpoint_1007000/target.encoder.layers_5.attention.out.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 3197 |
+
checkpoint_1007000/target.encoder.layers_5.attention.out.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
|
| 3198 |
+
checkpoint_1007000/target.decoder.layers_17.self_attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 3199 |
+
checkpoint_1007000/target.decoder.layers_17.self_attention.query.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 3200 |
+
checkpoint_1007000/target.decoder.layers_17.self_attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 3201 |
+
checkpoint_1007000/target.decoder.layers_17.self_attention.query.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 3202 |
+
checkpoint_1007000/target.decoder.layers_17.self_attention.query.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 3203 |
+
checkpoint_1007000/target.decoder.layers_17.self_attention.query.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 3204 |
+
checkpoint_1007000/target.decoder.layers_17.self_attention.query.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 3205 |
+
checkpoint_1007000/target.decoder.layers_17.self_attention.query.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 3206 |
+
checkpoint_1007000/target.encoder.layers_11.attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 3207 |
+
checkpoint_1007000/target.encoder.layers_11.attention.key.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 3208 |
+
checkpoint_1007000/target.encoder.layers_11.attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 3209 |
+
checkpoint_1007000/target.encoder.layers_11.attention.key.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 3210 |
+
checkpoint_1007000/target.encoder.layers_11.attention.key.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 3211 |
+
checkpoint_1007000/target.encoder.layers_11.attention.key.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 3212 |
+
checkpoint_1007000/target.encoder.layers_11.attention.key.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 3213 |
+
checkpoint_1007000/target.encoder.layers_11.attention.key.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 3214 |
+
checkpoint_1007000/target.decoder.layers_11.mlp.wi_1.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 3215 |
+
checkpoint_1007000/target.decoder.layers_11.mlp.wi_1.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 3216 |
+
checkpoint_1007000/target.decoder.layers_11.mlp.wi_1.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 3217 |
+
checkpoint_1007000/target.decoder.layers_11.mlp.wi_1.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 3218 |
+
checkpoint_1007000/target.decoder.layers_11.mlp.wi_1.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 3219 |
+
checkpoint_1007000/target.decoder.layers_11.mlp.wi_1.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 3220 |
+
checkpoint_1007000/target.decoder.layers_11.mlp.wi_1.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 3221 |
+
checkpoint_1007000/target.decoder.layers_11.mlp.wi_1.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 3222 |
+
checkpoint_1007000/target.decoder.layers_22.encoder_decoder_attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 3223 |
+
checkpoint_1007000/target.decoder.layers_22.encoder_decoder_attention.query.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 3224 |
+
checkpoint_1007000/target.decoder.layers_22.encoder_decoder_attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 3225 |
+
checkpoint_1007000/target.decoder.layers_22.encoder_decoder_attention.query.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 3226 |
+
checkpoint_1007000/target.decoder.layers_22.encoder_decoder_attention.query.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 3227 |
+
checkpoint_1007000/target.decoder.layers_22.encoder_decoder_attention.query.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 3228 |
+
checkpoint_1007000/target.decoder.layers_22.encoder_decoder_attention.query.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 3229 |
+
checkpoint_1007000/target.decoder.layers_22.encoder_decoder_attention.query.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 3230 |
+
checkpoint_1007000/target.decoder.layers_7.self_attention.out.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
|
| 3231 |
+
checkpoint_1007000/target.decoder.layers_7.self_attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 3232 |
+
checkpoint_1007000/target.decoder.layers_7.self_attention.out.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 3233 |
+
checkpoint_1007000/target.decoder.layers_7.self_attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 3234 |
+
checkpoint_1007000/target.decoder.layers_7.self_attention.out.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
|
| 3235 |
+
checkpoint_1007000/target.decoder.layers_7.self_attention.out.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
|
| 3236 |
+
checkpoint_1007000/target.decoder.layers_7.self_attention.out.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 3237 |
+
checkpoint_1007000/target.decoder.layers_7.self_attention.out.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
|
checkpoint_1007000/state.param_states.decoder.layers_21.pre_mlp_layer_norm.scale.v/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/state.param_states.decoder.layers_21.pre_mlp_layer_norm.scale.v/0
ADDED
|
Binary file (14.1 kB). View file
|
|
|
checkpoint_1007000/state.param_states.decoder.layers_7.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/state.param_states.decoder.layers_7.pre_cross_attention_layer_norm.scale.v/0
ADDED
|
Binary file (14.9 kB). View file
|
|
|
checkpoint_1007000/state.param_states.encoder.layers_19.pre_attention_layer_norm.scale.v/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/state.param_states.encoder.layers_19.pre_attention_layer_norm.scale.v/0
ADDED
|
Binary file (15 kB). View file
|
|
|
checkpoint_1007000/target.decoder.layers_11.mlp.wi_1.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_11.mlp.wi_1.kernel/.zarray.__tmp12181212485329137517.~1663960300826378~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_11.mlp.wi_1.kernel/.zarray.__tmp17790706748405652845.~1663960300688192~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_11.mlp.wi_1.kernel/.zarray.__tmp18195175323702989595.~1663960300090157~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_11.mlp.wi_1.kernel/.zarray.__tmp4865545297524934550.~1663960300307608~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_11.mlp.wi_1.kernel/.zarray.__tmp8183705587183143898.~1663960300726035~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_11.mlp.wi_1.kernel/.zarray.__tmp9199685975903289795.~1663960300351135~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_11.mlp.wi_1.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bb0068fc004323a8b8c099b11fe03c6d93741de29296628303175441b4f711f3
|
| 3 |
+
size 19536103
|
checkpoint_1007000/target.decoder.layers_11.mlp.wi_1.kernel/0.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7bf698efca02ab098b65cc9d97466a849598f152ff9da3df775e9fce3e214146
|
| 3 |
+
size 19537137
|
checkpoint_1007000/target.decoder.layers_11.mlp.wi_1.kernel/0.2
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0591d702feb3807a84f0a883e4cdf548f85d52be16d81b45d88a6ba593346678
|
| 3 |
+
size 19536569
|
checkpoint_1007000/target.decoder.layers_11.mlp.wi_1.kernel/0.3
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6b7d09c5058adbc0964f40989c39fd51541adab854b31189cb6b3c186a896694
|
| 3 |
+
size 19535962
|
checkpoint_1007000/target.decoder.layers_11.mlp.wi_1.kernel/0.4
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5f821b90457e2882f364c392c13c5df9e5ae84a2966f8efb597f545d0157d252
|
| 3 |
+
size 19535786
|
checkpoint_1007000/target.decoder.layers_11.mlp.wi_1.kernel/0.5
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:01b4e4b73b6b28d21fc50c55b5d618e5d6b1f58ab2ad3c6a54d1cbc204f4a714
|
| 3 |
+
size 19537357
|
checkpoint_1007000/target.decoder.layers_11.mlp.wi_1.kernel/0.6
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:35bac1a6352cec8add1af27b8d61837eeefb822017ad694598b336022c42b860
|
| 3 |
+
size 19536466
|
checkpoint_1007000/target.decoder.layers_11.mlp.wi_1.kernel/0.7
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d787db36dadb6389880c7cac33fa333833838bec32937ca4a18092399a72b16c
|
| 3 |
+
size 19536420
|
checkpoint_1007000/target.decoder.layers_17.self_attention.query.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_17.self_attention.query.kernel/.zarray.__tmp123133317181209426.~1663960300865681~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_17.self_attention.query.kernel/.zarray.__tmp12829050581861680553.~1663960300728711~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_17.self_attention.query.kernel/.zarray.__tmp12983276121360685771.~1663960300500371~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_17.self_attention.query.kernel/.zarray.__tmp1528149515108167277.~1663960300777568~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_17.self_attention.query.kernel/.zarray.__tmp1687850696384403133.~1663960300313523~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_17.self_attention.query.kernel/.zarray.__tmp4591981584490319116.~1663960300421486~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_17.self_attention.query.kernel/.zarray.__tmp7033595672112296407.~1663960300384128~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_17.self_attention.query.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b42e1209b30c1c4efe33d264d090e55a9e20a477979994a874a661b2cf4f04bf
|
| 3 |
+
size 7806367
|
checkpoint_1007000/target.decoder.layers_17.self_attention.query.kernel/0.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e305fae3f56bd6e7c79693f66855806c6a144aea71eefd030bb9623be6da44e8
|
| 3 |
+
size 7809933
|
checkpoint_1007000/target.decoder.layers_17.self_attention.query.kernel/0.2
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:70faa1bdd0905a8331aba675289662407c80a04787460af3132207c89eb9da90
|
| 3 |
+
size 7816973
|
checkpoint_1007000/target.decoder.layers_17.self_attention.query.kernel/0.3
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c8bb788e5dc063088f2c6f457567ece64cfce724555c53ebddd77f31a0cbc94c
|
| 3 |
+
size 7808948
|
checkpoint_1007000/target.decoder.layers_17.self_attention.query.kernel/0.4
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a38019968be55403626f53c94953aa3b9e5183045d35ce7dcd9f0dc27a7f1b00
|
| 3 |
+
size 7811372
|
checkpoint_1007000/target.decoder.layers_17.self_attention.query.kernel/0.5
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:785c2e5d2be2dfbc2611dfd3e26998714671af6d421fe7b9af30c1f8593cbf4e
|
| 3 |
+
size 7808858
|
checkpoint_1007000/target.decoder.layers_17.self_attention.query.kernel/0.6
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6a5cb21640e9444724f299c8480ed796fa36182d3a1f382567194e92b0b2194d
|
| 3 |
+
size 7809894
|
checkpoint_1007000/target.decoder.layers_17.self_attention.query.kernel/0.7
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:97e00157e2b5473f653bf983af13e988a75598c684434a30cab8c65278271e96
|
| 3 |
+
size 7810759
|
checkpoint_1007000/target.decoder.layers_22.encoder_decoder_attention.query.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_22.encoder_decoder_attention.query.kernel/.zarray.__tmp13412709914363784685.~1663960300601562~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_22.encoder_decoder_attention.query.kernel/.zarray.__tmp14980511374361568976.~1663960300421148~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_22.encoder_decoder_attention.query.kernel/.zarray.__tmp16452437899863196389.~1663960300501046~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_22.encoder_decoder_attention.query.kernel/.zarray.__tmp2798774854545907582.~1663960300941517~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_22.encoder_decoder_attention.query.kernel/.zarray.__tmp6451480922883845549.~1663960300546575~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_22.encoder_decoder_attention.query.kernel/.zarray.__tmp7083799652499692707.~1663960300686230~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_22.encoder_decoder_attention.query.kernel/.zarray.__tmp7360943157167004366.~1663960300627130~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_22.encoder_decoder_attention.query.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e1bce25ad9db8bcf39f7922b82d165a67912ff0ea10bb01bbe97862de21de62f
|
| 3 |
+
size 7818065
|
checkpoint_1007000/target.decoder.layers_22.encoder_decoder_attention.query.kernel/0.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:13804b5d74b8e238869a326563bb5619e7a9501ae03a66b0c41ed63928dbd5a6
|
| 3 |
+
size 7817552
|
checkpoint_1007000/target.decoder.layers_22.encoder_decoder_attention.query.kernel/0.2
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5456f72755b5c2d5fefff105711bf90556c8ac380c9cd534e4b081984be8d661
|
| 3 |
+
size 7816066
|
checkpoint_1007000/target.decoder.layers_22.encoder_decoder_attention.query.kernel/0.3
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8da7dbb9774bfba01a4e072867151d563a9f45c5c1b1fd2f7772efd520d9ae25
|
| 3 |
+
size 7815808
|