Commit
·
595b88f
1
Parent(s):
0e11993
Upload part 4
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +47 -0
- checkpoint_1007000/state.param_states.encoder.layers_16.pre_mlp_layer_norm.scale.v/.zarray +1 -0
- checkpoint_1007000/state.param_states.encoder.layers_16.pre_mlp_layer_norm.scale.v/0 +0 -0
- checkpoint_1007000/target.decoder.layers_0.mlp.wi_1.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_0.mlp.wi_1.kernel/.zarray.__tmp1051907682360705039.~1663960300129366~ +1 -0
- checkpoint_1007000/target.decoder.layers_0.mlp.wi_1.kernel/.zarray.__tmp12964120561355800237.~1663960299930878~ +1 -0
- checkpoint_1007000/target.decoder.layers_0.mlp.wi_1.kernel/.zarray.__tmp14120820778061497317.~1663960300020900~ +1 -0
- checkpoint_1007000/target.decoder.layers_0.mlp.wi_1.kernel/.zarray.__tmp14913800401621094618.~1663960301029013~ +1 -0
- checkpoint_1007000/target.decoder.layers_0.mlp.wi_1.kernel/.zarray.__tmp17456560980651184125.~1663960300548641~ +1 -0
- checkpoint_1007000/target.decoder.layers_0.mlp.wi_1.kernel/.zarray.__tmp7104034003937207927.~1663960300550773~ +1 -0
- checkpoint_1007000/target.decoder.layers_0.mlp.wi_1.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_0.mlp.wi_1.kernel/0.1 +3 -0
- checkpoint_1007000/target.decoder.layers_0.mlp.wi_1.kernel/0.2 +3 -0
- checkpoint_1007000/target.decoder.layers_0.mlp.wi_1.kernel/0.3 +3 -0
- checkpoint_1007000/target.decoder.layers_0.mlp.wi_1.kernel/0.4 +3 -0
- checkpoint_1007000/target.decoder.layers_0.mlp.wi_1.kernel/0.5 +3 -0
- checkpoint_1007000/target.decoder.layers_0.mlp.wi_1.kernel/0.6 +3 -0
- checkpoint_1007000/target.decoder.layers_0.mlp.wi_1.kernel/0.7 +3 -0
- checkpoint_1007000/target.decoder.layers_12.pre_self_attention_layer_norm.scale/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_12.pre_self_attention_layer_norm.scale/0 +0 -0
- checkpoint_1007000/target.decoder.layers_13.encoder_decoder_attention.out.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_13.encoder_decoder_attention.out.kernel/.zarray.__tmp13618632258628998883.~1663960300385308~ +1 -0
- checkpoint_1007000/target.decoder.layers_13.encoder_decoder_attention.out.kernel/.zarray.__tmp13883755724312397014.~1663960300885805~ +1 -0
- checkpoint_1007000/target.decoder.layers_13.encoder_decoder_attention.out.kernel/.zarray.__tmp15466256357474120295.~1663960300873100~ +1 -0
- checkpoint_1007000/target.decoder.layers_13.encoder_decoder_attention.out.kernel/.zarray.__tmp2035038049991381250.~1663960300550968~ +1 -0
- checkpoint_1007000/target.decoder.layers_13.encoder_decoder_attention.out.kernel/.zarray.__tmp2929896088676765696.~1663960300890288~ +1 -0
- checkpoint_1007000/target.decoder.layers_13.encoder_decoder_attention.out.kernel/.zarray.__tmp3206404155680097865.~1663960300468388~ +1 -0
- checkpoint_1007000/target.decoder.layers_13.encoder_decoder_attention.out.kernel/.zarray.__tmp9272383110870212341.~1663960300685356~ +1 -0
- checkpoint_1007000/target.decoder.layers_13.encoder_decoder_attention.out.kernel/2.0 +3 -0
- checkpoint_1007000/target.decoder.layers_13.encoder_decoder_attention.out.kernel/4.0 +3 -0
- checkpoint_1007000/target.decoder.layers_13.encoder_decoder_attention.out.kernel/5.0 +3 -0
- checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.value.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.value.kernel/.zarray.__tmp11100819509893764503.~1663960300549218~ +1 -0
- checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.value.kernel/.zarray.__tmp1371689890356389666.~1663960300546815~ +1 -0
- checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.value.kernel/.zarray.__tmp17200304346770231764.~1663960300554326~ +1 -0
- checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.value.kernel/.zarray.__tmp3012749623555417058.~1663960300683754~ +1 -0
- checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.value.kernel/.zarray.__tmp6162242579562817252.~1663960300872989~ +1 -0
- checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.value.kernel/.zarray.__tmp7494574353364699209.~1663960300780189~ +1 -0
- checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.value.kernel/.zarray.__tmp7720999365442451709.~1663960300312377~ +1 -0
- checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.value.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.value.kernel/0.1 +3 -0
- checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.value.kernel/0.2 +3 -0
- checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.value.kernel/0.3 +3 -0
- checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.value.kernel/0.4 +3 -0
- checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.value.kernel/0.5 +3 -0
- checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.value.kernel/0.6 +3 -0
- checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.value.kernel/0.7 +3 -0
- checkpoint_1007000/target.decoder.layers_18.self_attention.out.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_18.self_attention.out.kernel/.zarray.__tmp12023918215551030991.~1663960300467063~ +1 -0
- checkpoint_1007000/target.decoder.layers_18.self_attention.out.kernel/.zarray.__tmp13670210875818371004.~1663960300632918~ +1 -0
.gitattributes
CHANGED
|
@@ -224,3 +224,50 @@ checkpoint_1007000/target.decoder.layers_13.encoder_decoder_attention.out.kernel
|
|
| 224 |
checkpoint_1007000/target.decoder.layers_13.encoder_decoder_attention.out.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 225 |
checkpoint_1007000/target.decoder.layers_13.encoder_decoder_attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 226 |
checkpoint_1007000/target.decoder.layers_13.encoder_decoder_attention.out.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 224 |
checkpoint_1007000/target.decoder.layers_13.encoder_decoder_attention.out.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 225 |
checkpoint_1007000/target.decoder.layers_13.encoder_decoder_attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 226 |
checkpoint_1007000/target.decoder.layers_13.encoder_decoder_attention.out.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
|
| 227 |
+
checkpoint_1007000/target.decoder.layers_13.encoder_decoder_attention.out.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
|
| 228 |
+
checkpoint_1007000/target.decoder.layers_13.encoder_decoder_attention.out.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 229 |
+
checkpoint_1007000/target.decoder.layers_13.encoder_decoder_attention.out.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
|
| 230 |
+
checkpoint_1007000/target.encoder.layers_9.attention.out.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
|
| 231 |
+
checkpoint_1007000/target.encoder.layers_9.attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 232 |
+
checkpoint_1007000/target.encoder.layers_9.attention.out.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 233 |
+
checkpoint_1007000/target.encoder.layers_9.attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 234 |
+
checkpoint_1007000/target.encoder.layers_9.attention.out.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
|
| 235 |
+
checkpoint_1007000/target.encoder.layers_9.attention.out.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
|
| 236 |
+
checkpoint_1007000/target.encoder.layers_9.attention.out.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 237 |
+
checkpoint_1007000/target.encoder.layers_9.attention.out.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
|
| 238 |
+
checkpoint_1007000/target.decoder.layers_0.mlp.wi_1.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 239 |
+
checkpoint_1007000/target.decoder.layers_0.mlp.wi_1.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 240 |
+
checkpoint_1007000/target.decoder.layers_0.mlp.wi_1.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 241 |
+
checkpoint_1007000/target.decoder.layers_0.mlp.wi_1.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 242 |
+
checkpoint_1007000/target.decoder.layers_0.mlp.wi_1.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 243 |
+
checkpoint_1007000/target.decoder.layers_0.mlp.wi_1.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 244 |
+
checkpoint_1007000/target.decoder.layers_0.mlp.wi_1.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 245 |
+
checkpoint_1007000/target.decoder.layers_0.mlp.wi_1.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 246 |
+
checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.value.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 247 |
+
checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.value.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 248 |
+
checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.value.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 249 |
+
checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.value.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 250 |
+
checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.value.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 251 |
+
checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.value.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 252 |
+
checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.value.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 253 |
+
checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.value.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 254 |
+
checkpoint_1007000/target.decoder.layers_18.self_attention.out.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
|
| 255 |
+
checkpoint_1007000/target.decoder.layers_18.self_attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 256 |
+
checkpoint_1007000/target.decoder.layers_18.self_attention.out.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 257 |
+
checkpoint_1007000/target.decoder.layers_18.self_attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 258 |
+
checkpoint_1007000/target.decoder.layers_18.self_attention.out.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
|
| 259 |
+
checkpoint_1007000/target.decoder.layers_18.self_attention.out.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
|
| 260 |
+
checkpoint_1007000/target.decoder.layers_18.self_attention.out.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 261 |
+
checkpoint_1007000/target.decoder.layers_18.self_attention.out.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
|
| 262 |
+
checkpoint_1007000/target.decoder.layers_19.encoder_decoder_attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 263 |
+
checkpoint_1007000/target.decoder.layers_19.encoder_decoder_attention.query.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 264 |
+
checkpoint_1007000/target.decoder.layers_19.encoder_decoder_attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 265 |
+
checkpoint_1007000/target.decoder.layers_19.encoder_decoder_attention.query.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 266 |
+
checkpoint_1007000/target.decoder.layers_19.encoder_decoder_attention.query.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 267 |
+
checkpoint_1007000/target.decoder.layers_19.encoder_decoder_attention.query.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 268 |
+
checkpoint_1007000/target.decoder.layers_19.encoder_decoder_attention.query.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 269 |
+
checkpoint_1007000/target.decoder.layers_19.encoder_decoder_attention.query.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 270 |
+
checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.value.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 271 |
+
checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.value.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 272 |
+
checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.value.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 273 |
+
checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.value.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
checkpoint_1007000/state.param_states.encoder.layers_16.pre_mlp_layer_norm.scale.v/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/state.param_states.encoder.layers_16.pre_mlp_layer_norm.scale.v/0
ADDED
|
Binary file (15.1 kB). View file
|
|
|
checkpoint_1007000/target.decoder.layers_0.mlp.wi_1.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_0.mlp.wi_1.kernel/.zarray.__tmp1051907682360705039.~1663960300129366~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_0.mlp.wi_1.kernel/.zarray.__tmp12964120561355800237.~1663960299930878~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_0.mlp.wi_1.kernel/.zarray.__tmp14120820778061497317.~1663960300020900~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_0.mlp.wi_1.kernel/.zarray.__tmp14913800401621094618.~1663960301029013~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_0.mlp.wi_1.kernel/.zarray.__tmp17456560980651184125.~1663960300548641~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_0.mlp.wi_1.kernel/.zarray.__tmp7104034003937207927.~1663960300550773~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_0.mlp.wi_1.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:14bef27d700692b45804a4cdd0fa1a743af0ba53872a8f191e0c0d1db9103e40
|
| 3 |
+
size 19530340
|
checkpoint_1007000/target.decoder.layers_0.mlp.wi_1.kernel/0.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:50fd221c85e54c3bc1120680891ec50bbe06c0f7bd7b3ce5d4086c8168645aad
|
| 3 |
+
size 19529694
|
checkpoint_1007000/target.decoder.layers_0.mlp.wi_1.kernel/0.2
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7392a9eb8b5ebaa3493931f8c5fa3cca990bd78067e838706dc6684fd6a6d207
|
| 3 |
+
size 19530942
|
checkpoint_1007000/target.decoder.layers_0.mlp.wi_1.kernel/0.3
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f46dbebd25bc48cee7a0afeb9c4127cb40600f4e8547243d4145f03a8fa0ec4d
|
| 3 |
+
size 19531273
|
checkpoint_1007000/target.decoder.layers_0.mlp.wi_1.kernel/0.4
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ec91873c4f00d584d120d138519b23db73f2e9924a0c63d24932983dc1923f62
|
| 3 |
+
size 19530299
|
checkpoint_1007000/target.decoder.layers_0.mlp.wi_1.kernel/0.5
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e14b66d2deb01f4ccc91b68d2f04eaf5d17ad30b29d67a32fe841cf2be0f1ffb
|
| 3 |
+
size 19529876
|
checkpoint_1007000/target.decoder.layers_0.mlp.wi_1.kernel/0.6
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fd18ef041fb1d5bd1bc4f5a83b8a2949002a1f8a13f3faa295ec4fc54d750e98
|
| 3 |
+
size 19529774
|
checkpoint_1007000/target.decoder.layers_0.mlp.wi_1.kernel/0.7
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ac01ca9ed39333903ef9ec4ba7ec1d6835a5155f5dc53ab924c7b1d405e4ecc4
|
| 3 |
+
size 19529798
|
checkpoint_1007000/target.decoder.layers_12.pre_self_attention_layer_norm.scale/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_12.pre_self_attention_layer_norm.scale/0
ADDED
|
Binary file (14.7 kB). View file
|
|
|
checkpoint_1007000/target.decoder.layers_13.encoder_decoder_attention.out.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_13.encoder_decoder_attention.out.kernel/.zarray.__tmp13618632258628998883.~1663960300385308~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_13.encoder_decoder_attention.out.kernel/.zarray.__tmp13883755724312397014.~1663960300885805~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_13.encoder_decoder_attention.out.kernel/.zarray.__tmp15466256357474120295.~1663960300873100~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_13.encoder_decoder_attention.out.kernel/.zarray.__tmp2035038049991381250.~1663960300550968~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_13.encoder_decoder_attention.out.kernel/.zarray.__tmp2929896088676765696.~1663960300890288~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_13.encoder_decoder_attention.out.kernel/.zarray.__tmp3206404155680097865.~1663960300468388~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_13.encoder_decoder_attention.out.kernel/.zarray.__tmp9272383110870212341.~1663960300685356~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_13.encoder_decoder_attention.out.kernel/2.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2909bc3d5db25afb1377ffac466fac467e5149cba4abe41519ab690738d3429c
|
| 3 |
+
size 7820248
|
checkpoint_1007000/target.decoder.layers_13.encoder_decoder_attention.out.kernel/4.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7551f95f0b9eb6428e3110878daeded88160d7e2dfcfd5514ef5889875f0a25b
|
| 3 |
+
size 7819611
|
checkpoint_1007000/target.decoder.layers_13.encoder_decoder_attention.out.kernel/5.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c26ec4d87a9a4a459414ae8d92e4df29ae74a4056500d8b3402a250216219814
|
| 3 |
+
size 7818781
|
checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.value.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.value.kernel/.zarray.__tmp11100819509893764503.~1663960300549218~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.value.kernel/.zarray.__tmp1371689890356389666.~1663960300546815~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.value.kernel/.zarray.__tmp17200304346770231764.~1663960300554326~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.value.kernel/.zarray.__tmp3012749623555417058.~1663960300683754~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.value.kernel/.zarray.__tmp6162242579562817252.~1663960300872989~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.value.kernel/.zarray.__tmp7494574353364699209.~1663960300780189~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.value.kernel/.zarray.__tmp7720999365442451709.~1663960300312377~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.value.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a7cd24297e97a4d384164c2997a585e79a63e2901cb9c676b3a54dd38ca23405
|
| 3 |
+
size 7821761
|
checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.value.kernel/0.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:940710026e40c6675f887fcc4b119cb03cdc38b48c8509dee0e101205875d287
|
| 3 |
+
size 7819900
|
checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.value.kernel/0.2
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:92af55ec67a23e5459fbbf85a7eb300f5f5b7a6bae4867a1bab3aa5ad386934d
|
| 3 |
+
size 7819637
|
checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.value.kernel/0.3
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c417eb254d04edcaae7f08577ef82f1696fd696ec4ac51c8b76d2b360d969544
|
| 3 |
+
size 7820625
|
checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.value.kernel/0.4
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:713792a1b9ec558587b827d3e0a7df08be0351114316c915b1df138d313ac344
|
| 3 |
+
size 7820300
|
checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.value.kernel/0.5
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:22553541501c405f7b384978b380de10ce681e814230593a4e568d7ff8d93615
|
| 3 |
+
size 7821657
|
checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.value.kernel/0.6
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9a9eef31dfdfbe0fc758a31e6c4e176c71e1e203eaed0432d42c076a22b4f827
|
| 3 |
+
size 7817956
|
checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.value.kernel/0.7
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9f19304b834586663c2509c2bf46010adc9195fd8e3092b27b09a9e20c4ca1ba
|
| 3 |
+
size 7819409
|
checkpoint_1007000/target.decoder.layers_18.self_attention.out.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_18.self_attention.out.kernel/.zarray.__tmp12023918215551030991.~1663960300467063~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_18.self_attention.out.kernel/.zarray.__tmp13670210875818371004.~1663960300632918~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|