Commit
·
e236c2e
1
Parent(s):
595b88f
Upload part 5
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +51 -0
- checkpoint_1007000/target.decoder.layers_14.encoder_decoder_attention.value.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_14.encoder_decoder_attention.value.kernel/.zarray.__tmp1139061284186010554.~1663960300553745~ +1 -0
- checkpoint_1007000/target.decoder.layers_14.encoder_decoder_attention.value.kernel/.zarray.__tmp13471597155206017405.~1663960300471944~ +1 -0
- checkpoint_1007000/target.decoder.layers_14.encoder_decoder_attention.value.kernel/.zarray.__tmp4440907516384387589.~1663960300310075~ +1 -0
- checkpoint_1007000/target.decoder.layers_14.encoder_decoder_attention.value.kernel/.zarray.__tmp480985462762398571.~1663960300307791~ +1 -0
- checkpoint_1007000/target.decoder.layers_14.encoder_decoder_attention.value.kernel/.zarray.__tmp5911277395789222629.~1663960300423841~ +1 -0
- checkpoint_1007000/target.decoder.layers_14.encoder_decoder_attention.value.kernel/.zarray.__tmp7796493714814977216.~1663960300611255~ +1 -0
- checkpoint_1007000/target.decoder.layers_14.encoder_decoder_attention.value.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_14.encoder_decoder_attention.value.kernel/0.1 +3 -0
- checkpoint_1007000/target.decoder.layers_14.encoder_decoder_attention.value.kernel/0.2 +3 -0
- checkpoint_1007000/target.decoder.layers_14.encoder_decoder_attention.value.kernel/0.3 +3 -0
- checkpoint_1007000/target.decoder.layers_14.encoder_decoder_attention.value.kernel/0.4 +3 -0
- checkpoint_1007000/target.decoder.layers_14.encoder_decoder_attention.value.kernel/0.5 +3 -0
- checkpoint_1007000/target.decoder.layers_14.encoder_decoder_attention.value.kernel/0.6 +3 -0
- checkpoint_1007000/target.decoder.layers_14.encoder_decoder_attention.value.kernel/0.7 +3 -0
- checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.value.kernel/.zarray.__tmp10703318555379806604.~1663960300824228~ +1 -0
- checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.value.kernel/.zarray.__tmp14290873638833964418.~1663960300496122~ +1 -0
- checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.value.kernel/.zarray.__tmp1703848661665708881.~1663960300776834~ +1 -0
- checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.value.kernel/.zarray.__tmp5914603630166378899.~1663960300685977~ +1 -0
- checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.value.kernel/.zarray.__tmp8596125325754350577.~1663960301025800~ +1 -0
- checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.value.kernel/0.2 +3 -0
- checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.value.kernel/0.3 +3 -0
- checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.value.kernel/0.4 +3 -0
- checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.value.kernel/0.5 +3 -0
- checkpoint_1007000/target.decoder.layers_21.mlp.wo.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_21.mlp.wo.kernel/.zarray.__tmp12603200558239592285.~1663960300550168~ +1 -0
- checkpoint_1007000/target.decoder.layers_21.mlp.wo.kernel/.zarray.__tmp12839819994061784785.~1663960300425252~ +1 -0
- checkpoint_1007000/target.decoder.layers_21.mlp.wo.kernel/.zarray.__tmp16053894777534944423.~1663960300632211~ +1 -0
- checkpoint_1007000/target.decoder.layers_21.mlp.wo.kernel/.zarray.__tmp2878207316635960913.~1663960301069204~ +1 -0
- checkpoint_1007000/target.decoder.layers_21.mlp.wo.kernel/.zarray.__tmp3241036210249371302.~1663960300472378~ +1 -0
- checkpoint_1007000/target.decoder.layers_21.mlp.wo.kernel/.zarray.__tmp6214888084836174430.~1663960300176598~ +1 -0
- checkpoint_1007000/target.decoder.layers_21.mlp.wo.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_21.mlp.wo.kernel/1.0 +3 -0
- checkpoint_1007000/target.decoder.layers_21.mlp.wo.kernel/2.0 +3 -0
- checkpoint_1007000/target.decoder.layers_21.mlp.wo.kernel/3.0 +3 -0
- checkpoint_1007000/target.decoder.layers_21.mlp.wo.kernel/4.0 +3 -0
- checkpoint_1007000/target.decoder.layers_21.mlp.wo.kernel/5.0 +3 -0
- checkpoint_1007000/target.decoder.layers_21.mlp.wo.kernel/6.0 +3 -0
- checkpoint_1007000/target.decoder.layers_21.mlp.wo.kernel/7.0 +3 -0
- checkpoint_1007000/target.decoder.layers_21.self_attention.key.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_21.self_attention.key.kernel/.zarray.__tmp1231035134384504446.~1663960300385649~ +1 -0
- checkpoint_1007000/target.decoder.layers_21.self_attention.key.kernel/.zarray.__tmp14133491419075121412.~1663960300777355~ +1 -0
- checkpoint_1007000/target.decoder.layers_21.self_attention.key.kernel/.zarray.__tmp1652523638248181532.~1663960300622085~ +1 -0
- checkpoint_1007000/target.decoder.layers_21.self_attention.key.kernel/.zarray.__tmp5460461977166351782.~1663960301029540~ +1 -0
- checkpoint_1007000/target.decoder.layers_21.self_attention.key.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_21.self_attention.key.kernel/0.1 +3 -0
- checkpoint_1007000/target.decoder.layers_21.self_attention.key.kernel/0.2 +3 -0
- checkpoint_1007000/target.decoder.layers_21.self_attention.key.kernel/0.3 +3 -0
- checkpoint_1007000/target.decoder.layers_21.self_attention.key.kernel/0.5 +3 -0
.gitattributes
CHANGED
|
@@ -271,3 +271,54 @@ checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.value.kern
|
|
| 271 |
checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.value.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 272 |
checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.value.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 273 |
checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.value.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 271 |
checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.value.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 272 |
checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.value.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 273 |
checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.value.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 274 |
+
checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.value.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 275 |
+
checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.value.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 276 |
+
checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.value.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 277 |
+
checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.value.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 278 |
+
checkpoint_1007000/target.decoder.layers_3.self_attention.out.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
|
| 279 |
+
checkpoint_1007000/target.decoder.layers_3.self_attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 280 |
+
checkpoint_1007000/target.decoder.layers_3.self_attention.out.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 281 |
+
checkpoint_1007000/target.decoder.layers_3.self_attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 282 |
+
checkpoint_1007000/target.decoder.layers_3.self_attention.out.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
|
| 283 |
+
checkpoint_1007000/target.decoder.layers_3.self_attention.out.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
|
| 284 |
+
checkpoint_1007000/target.decoder.layers_3.self_attention.out.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 285 |
+
checkpoint_1007000/target.decoder.layers_3.self_attention.out.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
|
| 286 |
+
checkpoint_1007000/target.decoder.layers_14.encoder_decoder_attention.value.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 287 |
+
checkpoint_1007000/target.decoder.layers_14.encoder_decoder_attention.value.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 288 |
+
checkpoint_1007000/target.decoder.layers_14.encoder_decoder_attention.value.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 289 |
+
checkpoint_1007000/target.decoder.layers_14.encoder_decoder_attention.value.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 290 |
+
checkpoint_1007000/target.decoder.layers_14.encoder_decoder_attention.value.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 291 |
+
checkpoint_1007000/target.decoder.layers_14.encoder_decoder_attention.value.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 292 |
+
checkpoint_1007000/target.decoder.layers_14.encoder_decoder_attention.value.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 293 |
+
checkpoint_1007000/target.decoder.layers_14.encoder_decoder_attention.value.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 294 |
+
checkpoint_1007000/target.encoder.layers_2.mlp.wi_1.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 295 |
+
checkpoint_1007000/target.encoder.layers_2.mlp.wi_1.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 296 |
+
checkpoint_1007000/target.encoder.layers_2.mlp.wi_1.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 297 |
+
checkpoint_1007000/target.encoder.layers_2.mlp.wi_1.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 298 |
+
checkpoint_1007000/target.encoder.layers_2.mlp.wi_1.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 299 |
+
checkpoint_1007000/target.encoder.layers_2.mlp.wi_1.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 300 |
+
checkpoint_1007000/target.encoder.layers_2.mlp.wi_1.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 301 |
+
checkpoint_1007000/target.encoder.layers_2.mlp.wi_1.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 302 |
+
checkpoint_1007000/target.encoder.layers_15.attention.value.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 303 |
+
checkpoint_1007000/target.encoder.layers_15.attention.value.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 304 |
+
checkpoint_1007000/target.encoder.layers_15.attention.value.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 305 |
+
checkpoint_1007000/target.encoder.layers_15.attention.value.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 306 |
+
checkpoint_1007000/target.encoder.layers_15.attention.value.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 307 |
+
checkpoint_1007000/target.encoder.layers_15.attention.value.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 308 |
+
checkpoint_1007000/target.encoder.layers_15.attention.value.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 309 |
+
checkpoint_1007000/target.encoder.layers_15.attention.value.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 310 |
+
checkpoint_1007000/target.decoder.layers_21.mlp.wo.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
|
| 311 |
+
checkpoint_1007000/target.decoder.layers_21.mlp.wo.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 312 |
+
checkpoint_1007000/target.decoder.layers_21.mlp.wo.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 313 |
+
checkpoint_1007000/target.decoder.layers_21.mlp.wo.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 314 |
+
checkpoint_1007000/target.decoder.layers_21.mlp.wo.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
|
| 315 |
+
checkpoint_1007000/target.decoder.layers_21.mlp.wo.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
|
| 316 |
+
checkpoint_1007000/target.decoder.layers_21.mlp.wo.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 317 |
+
checkpoint_1007000/target.decoder.layers_21.mlp.wo.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
|
| 318 |
+
checkpoint_1007000/target.decoder.layers_21.self_attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 319 |
+
checkpoint_1007000/target.decoder.layers_21.self_attention.key.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 320 |
+
checkpoint_1007000/target.decoder.layers_21.self_attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 321 |
+
checkpoint_1007000/target.decoder.layers_21.self_attention.key.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 322 |
+
checkpoint_1007000/target.decoder.layers_21.self_attention.key.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 323 |
+
checkpoint_1007000/target.decoder.layers_21.self_attention.key.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 324 |
+
checkpoint_1007000/target.decoder.layers_21.self_attention.key.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
checkpoint_1007000/target.decoder.layers_14.encoder_decoder_attention.value.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_14.encoder_decoder_attention.value.kernel/.zarray.__tmp1139061284186010554.~1663960300553745~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_14.encoder_decoder_attention.value.kernel/.zarray.__tmp13471597155206017405.~1663960300471944~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_14.encoder_decoder_attention.value.kernel/.zarray.__tmp4440907516384387589.~1663960300310075~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_14.encoder_decoder_attention.value.kernel/.zarray.__tmp480985462762398571.~1663960300307791~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_14.encoder_decoder_attention.value.kernel/.zarray.__tmp5911277395789222629.~1663960300423841~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_14.encoder_decoder_attention.value.kernel/.zarray.__tmp7796493714814977216.~1663960300611255~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_14.encoder_decoder_attention.value.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2262645582d02f027689b262997c58e0f0f49b8e9516eafcf9e66e016089f787
|
| 3 |
+
size 7796450
|
checkpoint_1007000/target.decoder.layers_14.encoder_decoder_attention.value.kernel/0.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:70b9012e0e2422286740b4c24b149b8e38955536d778543c33b69d1793d4da3a
|
| 3 |
+
size 7804207
|
checkpoint_1007000/target.decoder.layers_14.encoder_decoder_attention.value.kernel/0.2
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:03f373ccce06abda15353aeeeba002e93ec7b34137227e305da2f06fdd299225
|
| 3 |
+
size 7806291
|
checkpoint_1007000/target.decoder.layers_14.encoder_decoder_attention.value.kernel/0.3
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0983b793cf4bcc7d484ced533cf2338b417cc9898f10ddc5eb01899e474f7430
|
| 3 |
+
size 7808741
|
checkpoint_1007000/target.decoder.layers_14.encoder_decoder_attention.value.kernel/0.4
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7e81ddd372f7d835bb72b222d6ecff0a453bb0d23b16f2bffe3f4e54a66e459a
|
| 3 |
+
size 7808536
|
checkpoint_1007000/target.decoder.layers_14.encoder_decoder_attention.value.kernel/0.5
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9124d4dfc21c5f87c5018d0b246c096fdfe2715819e5b25dc127bbf599f68dbf
|
| 3 |
+
size 7804442
|
checkpoint_1007000/target.decoder.layers_14.encoder_decoder_attention.value.kernel/0.6
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:29069e74dc413e14419e8097b79bd8866ca0e852759f49602679eb3d043c02fe
|
| 3 |
+
size 7798807
|
checkpoint_1007000/target.decoder.layers_14.encoder_decoder_attention.value.kernel/0.7
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a7dbd616f8bbd32185331b0977f28d5cf8378d5d6d5be922d74a61caa540bba4
|
| 3 |
+
size 7805480
|
checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.value.kernel/.zarray.__tmp10703318555379806604.~1663960300824228~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.value.kernel/.zarray.__tmp14290873638833964418.~1663960300496122~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.value.kernel/.zarray.__tmp1703848661665708881.~1663960300776834~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.value.kernel/.zarray.__tmp5914603630166378899.~1663960300685977~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.value.kernel/.zarray.__tmp8596125325754350577.~1663960301025800~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.value.kernel/0.2
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a586bc15574db56a90d199d597cc545c4e7c9b553088cda1884a3662601cb3b0
|
| 3 |
+
size 7809186
|
checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.value.kernel/0.3
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d036931f79032e53d16ccff0013cfd6f7ea308bac44ba25a4d62944741a27af7
|
| 3 |
+
size 7807707
|
checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.value.kernel/0.4
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3146dacd8c7ba6949e55845c5126b77eb1716589468e721eb148886d4bdd7863
|
| 3 |
+
size 7812090
|
checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.value.kernel/0.5
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:95b8d2c21f09c318e1bc0720b20fe4c01d0089025b4a3ad0123d1788f55d5d64
|
| 3 |
+
size 7806309
|
checkpoint_1007000/target.decoder.layers_21.mlp.wo.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_21.mlp.wo.kernel/.zarray.__tmp12603200558239592285.~1663960300550168~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_21.mlp.wo.kernel/.zarray.__tmp12839819994061784785.~1663960300425252~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_21.mlp.wo.kernel/.zarray.__tmp16053894777534944423.~1663960300632211~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_21.mlp.wo.kernel/.zarray.__tmp2878207316635960913.~1663960301069204~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_21.mlp.wo.kernel/.zarray.__tmp3241036210249371302.~1663960300472378~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_21.mlp.wo.kernel/.zarray.__tmp6214888084836174430.~1663960300176598~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_21.mlp.wo.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c6e33663abaa51418f510945d89bf5175391266f6f76b1f6515a2026f567ff7b
|
| 3 |
+
size 19536392
|
checkpoint_1007000/target.decoder.layers_21.mlp.wo.kernel/1.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8ab282060e89384ecd9081eeab29e217092231bfaab1d59db81c8f029478b7e6
|
| 3 |
+
size 19534648
|
checkpoint_1007000/target.decoder.layers_21.mlp.wo.kernel/2.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d5b5a912124e32e88d7694c5a83b2cace1aaa6d285c6bcf040110ce7b5248393
|
| 3 |
+
size 19535385
|
checkpoint_1007000/target.decoder.layers_21.mlp.wo.kernel/3.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6a6ce63df51ca18154c501424f7a29af495c11cd31ce8609c42bb6a6adee577f
|
| 3 |
+
size 19535860
|
checkpoint_1007000/target.decoder.layers_21.mlp.wo.kernel/4.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:335ff5f78e8804235c441a367cc3b31e3cde1c25e54f0d7478d647f230dcfa3c
|
| 3 |
+
size 19536246
|
checkpoint_1007000/target.decoder.layers_21.mlp.wo.kernel/5.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7bb0905a03fdc64846ec670f3c65db0ce8df9cbb2024b8462ce095fb93a86b9c
|
| 3 |
+
size 19536148
|
checkpoint_1007000/target.decoder.layers_21.mlp.wo.kernel/6.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:10a0ab66f7eb6e7fcf7b6ab861c3b148cbd5254bc97589e443ce7a70b23dd67e
|
| 3 |
+
size 19535348
|
checkpoint_1007000/target.decoder.layers_21.mlp.wo.kernel/7.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8620648da0ef5d58404728d7cf213f7569f86701f6474da9af804142b139ab52
|
| 3 |
+
size 19535299
|
checkpoint_1007000/target.decoder.layers_21.self_attention.key.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_21.self_attention.key.kernel/.zarray.__tmp1231035134384504446.~1663960300385649~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_21.self_attention.key.kernel/.zarray.__tmp14133491419075121412.~1663960300777355~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_21.self_attention.key.kernel/.zarray.__tmp1652523638248181532.~1663960300622085~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_21.self_attention.key.kernel/.zarray.__tmp5460461977166351782.~1663960301029540~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_21.self_attention.key.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0cb761afe1ebbca9bcbc8b2a74ee5cc53b871d98508e409fca22864e57c5d529
|
| 3 |
+
size 7809485
|
checkpoint_1007000/target.decoder.layers_21.self_attention.key.kernel/0.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bbd0b3570fa5cfb2c5e6546760344a2ff65aa42fe98e7eb8cfa5c00ff23d7f14
|
| 3 |
+
size 7821547
|
checkpoint_1007000/target.decoder.layers_21.self_attention.key.kernel/0.2
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8bfeaeca59f8e1b09a6239e8c9055f29cbedf394a5dedaaa1bc96ec211e55777
|
| 3 |
+
size 7818791
|
checkpoint_1007000/target.decoder.layers_21.self_attention.key.kernel/0.3
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fcc10612e6720bcdc118ea313415454a5df77d99604e3eeff110520aae5f3277
|
| 3 |
+
size 7813356
|
checkpoint_1007000/target.decoder.layers_21.self_attention.key.kernel/0.5
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d651586841dad03ff0720071d1788fef226a2127b3e7e92a2687eadaf39e598f
|
| 3 |
+
size 7809624
|