Commit
·
97cbfe7
1
Parent(s):
60f6115
Upload part 50
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +48 -0
- checkpoint_1007000/state.param_states.decoder.layers_4.pre_cross_attention_layer_norm.scale.v/.zarray +1 -0
- checkpoint_1007000/state.param_states.decoder.layers_4.pre_cross_attention_layer_norm.scale.v/0 +0 -0
- checkpoint_1007000/state.param_states.encoder.layers_10.pre_attention_layer_norm.scale.v/.zarray +1 -0
- checkpoint_1007000/state.param_states.encoder.layers_10.pre_attention_layer_norm.scale.v/0 +0 -0
- checkpoint_1007000/state.param_states.encoder.layers_13.pre_attention_layer_norm.scale.v/.zarray +1 -0
- checkpoint_1007000/state.param_states.encoder.layers_13.pre_attention_layer_norm.scale.v/0 +0 -0
- checkpoint_1007000/target.decoder.layers_13.mlp.wi_1.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_13.mlp.wi_1.kernel/.zarray.__tmp11765571810778950051.~1663960300383759~ +1 -0
- checkpoint_1007000/target.decoder.layers_13.mlp.wi_1.kernel/.zarray.__tmp12912070580570867986.~1663960300500833~ +1 -0
- checkpoint_1007000/target.decoder.layers_13.mlp.wi_1.kernel/.zarray.__tmp1514902467801034416.~1663960300780080~ +1 -0
- checkpoint_1007000/target.decoder.layers_13.mlp.wi_1.kernel/.zarray.__tmp8901551791242477798.~1663960300683632~ +1 -0
- checkpoint_1007000/target.decoder.layers_13.mlp.wi_1.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_13.mlp.wi_1.kernel/0.1 +3 -0
- checkpoint_1007000/target.decoder.layers_13.mlp.wi_1.kernel/0.6 +3 -0
- checkpoint_1007000/target.decoder.layers_13.mlp.wi_1.kernel/0.7 +3 -0
- checkpoint_1007000/target.decoder.layers_13.self_attention.key.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_13.self_attention.key.kernel/.zarray.__tmp10324667221790502572.~1663960300499537~ +1 -0
- checkpoint_1007000/target.decoder.layers_13.self_attention.key.kernel/.zarray.__tmp10538194903622094863.~1663960300728954~ +1 -0
- checkpoint_1007000/target.decoder.layers_13.self_attention.key.kernel/.zarray.__tmp11940870617194847787.~1663960300686060~ +1 -0
- checkpoint_1007000/target.decoder.layers_13.self_attention.key.kernel/.zarray.__tmp12433849344879772157.~1663960300271694~ +1 -0
- checkpoint_1007000/target.decoder.layers_13.self_attention.key.kernel/.zarray.__tmp13999437852346953159.~1663960300090637~ +1 -0
- checkpoint_1007000/target.decoder.layers_13.self_attention.key.kernel/.zarray.__tmp18183955016099952054.~1663960300502067~ +1 -0
- checkpoint_1007000/target.decoder.layers_13.self_attention.key.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_13.self_attention.key.kernel/0.1 +3 -0
- checkpoint_1007000/target.decoder.layers_13.self_attention.key.kernel/0.2 +3 -0
- checkpoint_1007000/target.decoder.layers_13.self_attention.key.kernel/0.3 +3 -0
- checkpoint_1007000/target.decoder.layers_13.self_attention.key.kernel/0.4 +3 -0
- checkpoint_1007000/target.decoder.layers_13.self_attention.key.kernel/0.5 +3 -0
- checkpoint_1007000/target.decoder.layers_13.self_attention.key.kernel/0.6 +3 -0
- checkpoint_1007000/target.decoder.layers_13.self_attention.key.kernel/0.7 +3 -0
- checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/.zarray.__tmp12802281532173975450.~1663960300548609~ +1 -0
- checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/.zarray.__tmp14103607313915582811.~1663960300685478~ +1 -0
- checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/.zarray.__tmp16104034802188478716.~1663960300551451~ +1 -0
- checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/.zarray.__tmp1667756116761455245.~1663960300823209~ +1 -0
- checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/.zarray.__tmp17875011171297452638.~1663960300466131~ +1 -0
- checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/.zarray.__tmp6087844182203796233.~1663960300731622~ +1 -0
- checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/.zarray.__tmp9039702464578184575.~1663960300468210~ +1 -0
- checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/0.1 +3 -0
- checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/0.2 +3 -0
- checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/0.3 +3 -0
- checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/0.4 +3 -0
- checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/0.5 +3 -0
- checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/0.6 +3 -0
- checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/0.7 +3 -0
- checkpoint_1007000/target.decoder.layers_21.encoder_decoder_attention.key.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_21.encoder_decoder_attention.key.kernel/.zarray.__tmp3372111309395329355.~1663960300601058~ +1 -0
- checkpoint_1007000/target.decoder.layers_21.encoder_decoder_attention.key.kernel/.zarray.__tmp8212117750309176957.~1663960300308686~ +1 -0
.gitattributes
CHANGED
|
@@ -2527,3 +2527,51 @@ checkpoint_1007000/target.decoder.layers_3.mlp.wi_1.kernel/0.1 filter=lfs diff=l
|
|
| 2527 |
checkpoint_1007000/target.decoder.layers_3.mlp.wi_1.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 2528 |
checkpoint_1007000/target.decoder.layers_3.mlp.wi_1.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 2529 |
checkpoint_1007000/target.decoder.layers_3.mlp.wi_1.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 2527 |
checkpoint_1007000/target.decoder.layers_3.mlp.wi_1.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 2528 |
checkpoint_1007000/target.decoder.layers_3.mlp.wi_1.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 2529 |
checkpoint_1007000/target.decoder.layers_3.mlp.wi_1.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 2530 |
+
checkpoint_1007000/target.decoder.layers_3.mlp.wi_1.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 2531 |
+
checkpoint_1007000/target.decoder.layers_3.mlp.wi_1.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 2532 |
+
checkpoint_1007000/target.decoder.layers_3.mlp.wi_1.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 2533 |
+
checkpoint_1007000/target.decoder.layers_3.mlp.wi_1.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 2534 |
+
checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 2535 |
+
checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 2536 |
+
checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 2537 |
+
checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 2538 |
+
checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 2539 |
+
checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 2540 |
+
checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 2541 |
+
checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 2542 |
+
checkpoint_1007000/target.encoder.layers_20.mlp.wo.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
|
| 2543 |
+
checkpoint_1007000/target.encoder.layers_20.mlp.wo.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 2544 |
+
checkpoint_1007000/target.encoder.layers_20.mlp.wo.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 2545 |
+
checkpoint_1007000/target.encoder.layers_20.mlp.wo.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 2546 |
+
checkpoint_1007000/target.encoder.layers_20.mlp.wo.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
|
| 2547 |
+
checkpoint_1007000/target.encoder.layers_20.mlp.wo.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
|
| 2548 |
+
checkpoint_1007000/target.encoder.layers_20.mlp.wo.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 2549 |
+
checkpoint_1007000/target.encoder.layers_20.mlp.wo.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
|
| 2550 |
+
checkpoint_1007000/target.decoder.layers_21.encoder_decoder_attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 2551 |
+
checkpoint_1007000/target.decoder.layers_21.encoder_decoder_attention.key.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 2552 |
+
checkpoint_1007000/target.decoder.layers_21.encoder_decoder_attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 2553 |
+
checkpoint_1007000/target.decoder.layers_21.encoder_decoder_attention.key.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 2554 |
+
checkpoint_1007000/target.decoder.layers_21.encoder_decoder_attention.key.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 2555 |
+
checkpoint_1007000/target.decoder.layers_21.encoder_decoder_attention.key.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 2556 |
+
checkpoint_1007000/target.decoder.layers_21.encoder_decoder_attention.key.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 2557 |
+
checkpoint_1007000/target.decoder.layers_21.encoder_decoder_attention.key.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 2558 |
+
checkpoint_1007000/target.decoder.layers_23.mlp.wo.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
|
| 2559 |
+
checkpoint_1007000/target.decoder.layers_23.mlp.wo.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 2560 |
+
checkpoint_1007000/target.decoder.layers_23.mlp.wo.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 2561 |
+
checkpoint_1007000/target.decoder.layers_23.mlp.wo.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 2562 |
+
checkpoint_1007000/target.decoder.layers_23.mlp.wo.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
|
| 2563 |
+
checkpoint_1007000/target.decoder.layers_23.mlp.wo.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
|
| 2564 |
+
checkpoint_1007000/target.decoder.layers_23.mlp.wo.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 2565 |
+
checkpoint_1007000/target.decoder.layers_23.mlp.wo.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
|
| 2566 |
+
checkpoint_1007000/target.decoder.layers_13.self_attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 2567 |
+
checkpoint_1007000/target.decoder.layers_13.self_attention.key.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 2568 |
+
checkpoint_1007000/target.decoder.layers_13.self_attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 2569 |
+
checkpoint_1007000/target.decoder.layers_13.self_attention.key.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 2570 |
+
checkpoint_1007000/target.decoder.layers_13.self_attention.key.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 2571 |
+
checkpoint_1007000/target.decoder.layers_13.self_attention.key.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 2572 |
+
checkpoint_1007000/target.decoder.layers_13.self_attention.key.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 2573 |
+
checkpoint_1007000/target.decoder.layers_13.self_attention.key.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 2574 |
+
checkpoint_1007000/target.decoder.layers_13.mlp.wi_1.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 2575 |
+
checkpoint_1007000/target.decoder.layers_13.mlp.wi_1.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 2576 |
+
checkpoint_1007000/target.decoder.layers_13.mlp.wi_1.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 2577 |
+
checkpoint_1007000/target.decoder.layers_13.mlp.wi_1.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
checkpoint_1007000/state.param_states.decoder.layers_4.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/state.param_states.decoder.layers_4.pre_cross_attention_layer_norm.scale.v/0
ADDED
|
Binary file (14.8 kB). View file
|
|
|
checkpoint_1007000/state.param_states.encoder.layers_10.pre_attention_layer_norm.scale.v/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/state.param_states.encoder.layers_10.pre_attention_layer_norm.scale.v/0
ADDED
|
Binary file (15.3 kB). View file
|
|
|
checkpoint_1007000/state.param_states.encoder.layers_13.pre_attention_layer_norm.scale.v/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/state.param_states.encoder.layers_13.pre_attention_layer_norm.scale.v/0
ADDED
|
Binary file (15.2 kB). View file
|
|
|
checkpoint_1007000/target.decoder.layers_13.mlp.wi_1.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_13.mlp.wi_1.kernel/.zarray.__tmp11765571810778950051.~1663960300383759~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_13.mlp.wi_1.kernel/.zarray.__tmp12912070580570867986.~1663960300500833~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_13.mlp.wi_1.kernel/.zarray.__tmp1514902467801034416.~1663960300780080~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_13.mlp.wi_1.kernel/.zarray.__tmp8901551791242477798.~1663960300683632~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_13.mlp.wi_1.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:797652dd19b6a7d15d232e8308c2b2c728c50055b92292dd99b66bfa3a180fa1
|
| 3 |
+
size 19515855
|
checkpoint_1007000/target.decoder.layers_13.mlp.wi_1.kernel/0.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:dc64d1eb358ab1930c54c69cc757c1658ac355b449f42b923b50e195c7001a16
|
| 3 |
+
size 19517652
|
checkpoint_1007000/target.decoder.layers_13.mlp.wi_1.kernel/0.6
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2860ac818f2adb26c364ba03a9092c48033432ab678dfc4c546695b38046a210
|
| 3 |
+
size 19516865
|
checkpoint_1007000/target.decoder.layers_13.mlp.wi_1.kernel/0.7
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8062c3038efb769e01665d46ef76e493681012dbebc840d69d0e389dfcdafd5a
|
| 3 |
+
size 19517069
|
checkpoint_1007000/target.decoder.layers_13.self_attention.key.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_13.self_attention.key.kernel/.zarray.__tmp10324667221790502572.~1663960300499537~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_13.self_attention.key.kernel/.zarray.__tmp10538194903622094863.~1663960300728954~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_13.self_attention.key.kernel/.zarray.__tmp11940870617194847787.~1663960300686060~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_13.self_attention.key.kernel/.zarray.__tmp12433849344879772157.~1663960300271694~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_13.self_attention.key.kernel/.zarray.__tmp13999437852346953159.~1663960300090637~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_13.self_attention.key.kernel/.zarray.__tmp18183955016099952054.~1663960300502067~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_13.self_attention.key.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:76c57762aa9b527b2f57ebc464adef65af11e134ac7a08cd38db9fb5d28e64b5
|
| 3 |
+
size 7823817
|
checkpoint_1007000/target.decoder.layers_13.self_attention.key.kernel/0.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4ebf5e734977623ae92fb7d7097f7a53af720cc81ea1339af16d7082eba52343
|
| 3 |
+
size 7837991
|
checkpoint_1007000/target.decoder.layers_13.self_attention.key.kernel/0.2
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d9b6688ec136d0784a2ba199fb59c43eda4b6c511a7213826b6a0c53685faabf
|
| 3 |
+
size 7825347
|
checkpoint_1007000/target.decoder.layers_13.self_attention.key.kernel/0.3
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:94d8deb95897b6233f6dbc675420b8bef25306d558c22aa1e588130993583d74
|
| 3 |
+
size 7819281
|
checkpoint_1007000/target.decoder.layers_13.self_attention.key.kernel/0.4
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1f490c7434d964f1102e06c0df9e029ed0650e2a7467deca384aa28441a6b97a
|
| 3 |
+
size 7824657
|
checkpoint_1007000/target.decoder.layers_13.self_attention.key.kernel/0.5
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2253532a4110268abe70f7ee95e4e6dfb95ec76c27bb06a5f522422456fdee58
|
| 3 |
+
size 7828966
|
checkpoint_1007000/target.decoder.layers_13.self_attention.key.kernel/0.6
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8faecf863edf6ae66baa97e378df7e0a44ed0acc3ac512fa1b5422111ad8dc09
|
| 3 |
+
size 7827872
|
checkpoint_1007000/target.decoder.layers_13.self_attention.key.kernel/0.7
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:357fd023b070e3e6ef85f997f3f6a4ecaaec2c934545a979535662414a5c2a2d
|
| 3 |
+
size 7820282
|
checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/.zarray.__tmp12802281532173975450.~1663960300548609~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/.zarray.__tmp14103607313915582811.~1663960300685478~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/.zarray.__tmp16104034802188478716.~1663960300551451~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/.zarray.__tmp1667756116761455245.~1663960300823209~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/.zarray.__tmp17875011171297452638.~1663960300466131~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/.zarray.__tmp6087844182203796233.~1663960300731622~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/.zarray.__tmp9039702464578184575.~1663960300468210~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d4162852f71226fb6e7354171f8211586e69011528c437ecb30922e96b8dfdb1
|
| 3 |
+
size 7818932
|
checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/0.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fda52e13947e30ccb5e51a4db493cc43ec2ad0c07dd97bcb60f35b6f492ca5da
|
| 3 |
+
size 7812725
|
checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/0.2
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:95077a967d79730722a94abe247249d206a61684180e38380de8b8b6abd71ecb
|
| 3 |
+
size 7803585
|
checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/0.3
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bcc1a839c32af04f551f74bf959bf8eb7d8916ccef815e0f808d35e17055a470
|
| 3 |
+
size 7812503
|
checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/0.4
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a0440b48df7d5da20a81dc188a83c1e6708e3a4f2eadb66f615fea284bf668f9
|
| 3 |
+
size 7816813
|
checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/0.5
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7ed5cc904e6ab8c263bf30ad7169a485a48be167d03f347669f8e527f1f813ce
|
| 3 |
+
size 7801610
|
checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/0.6
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4cda6ccbafa682fa7ad71455efec4e68bb215038dbd57e95af254093866fe418
|
| 3 |
+
size 7821553
|
checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/0.7
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4bff8760a1d5c453e4ceedaaee643cb422656a3f19b7d0f0650a9d22c7c75f9d
|
| 3 |
+
size 7814083
|
checkpoint_1007000/target.decoder.layers_21.encoder_decoder_attention.key.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_21.encoder_decoder_attention.key.kernel/.zarray.__tmp3372111309395329355.~1663960300601058~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_21.encoder_decoder_attention.key.kernel/.zarray.__tmp8212117750309176957.~1663960300308686~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|