Commit
·
e4b46a6
1
Parent(s):
fde254a
Upload part 54
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +52 -0
- checkpoint_1007000/state.param_states.decoder.layers_19.pre_cross_attention_layer_norm.scale.v/.zarray +1 -0
- checkpoint_1007000/state.param_states.decoder.layers_19.pre_cross_attention_layer_norm.scale.v/0 +0 -0
- checkpoint_1007000/state.param_states.decoder.layers_5.pre_cross_attention_layer_norm.scale.v/.zarray +1 -0
- checkpoint_1007000/state.param_states.decoder.layers_5.pre_cross_attention_layer_norm.scale.v/0 +0 -0
- checkpoint_1007000/target.decoder.layers_10.mlp.wo.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_10.mlp.wo.kernel/.zarray.__tmp12556689117730967044.~1663960300067269~ +1 -0
- checkpoint_1007000/target.decoder.layers_10.mlp.wo.kernel/.zarray.__tmp2198192486624046698.~1663960301112693~ +1 -0
- checkpoint_1007000/target.decoder.layers_10.mlp.wo.kernel/.zarray.__tmp4289778998305236925.~1663960300016046~ +1 -0
- checkpoint_1007000/target.decoder.layers_10.mlp.wo.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_10.mlp.wo.kernel/1.0 +3 -0
- checkpoint_1007000/target.decoder.layers_10.mlp.wo.kernel/2.0 +3 -0
- checkpoint_1007000/target.decoder.layers_10.mlp.wo.kernel/3.0 +3 -0
- checkpoint_1007000/target.decoder.layers_10.mlp.wo.kernel/4.0 +3 -0
- checkpoint_1007000/target.decoder.layers_10.mlp.wo.kernel/5.0 +3 -0
- checkpoint_1007000/target.decoder.layers_10.mlp.wo.kernel/6.0 +3 -0
- checkpoint_1007000/target.decoder.layers_10.mlp.wo.kernel/7.0 +3 -0
- checkpoint_1007000/target.decoder.layers_11.mlp.wi_0.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_11.mlp.wi_0.kernel/.zarray.__tmp10770559433335723149.~1663960300550170~ +1 -0
- checkpoint_1007000/target.decoder.layers_11.mlp.wi_0.kernel/.zarray.__tmp12608879935475681094.~1663960300728156~ +1 -0
- checkpoint_1007000/target.decoder.layers_11.mlp.wi_0.kernel/.zarray.__tmp18328120602218273837.~1663960300471175~ +1 -0
- checkpoint_1007000/target.decoder.layers_11.mlp.wi_0.kernel/.zarray.__tmp2623057869094272155.~1663960300493629~ +1 -0
- checkpoint_1007000/target.decoder.layers_11.mlp.wi_0.kernel/.zarray.__tmp4168994715625229474.~1663960300989987~ +1 -0
- checkpoint_1007000/target.decoder.layers_11.mlp.wi_0.kernel/.zarray.__tmp5600032214776525345.~1663960300420545~ +1 -0
- checkpoint_1007000/target.decoder.layers_11.mlp.wi_0.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_11.mlp.wi_0.kernel/0.1 +3 -0
- checkpoint_1007000/target.decoder.layers_11.mlp.wi_0.kernel/0.2 +3 -0
- checkpoint_1007000/target.decoder.layers_11.mlp.wi_0.kernel/0.3 +3 -0
- checkpoint_1007000/target.decoder.layers_11.mlp.wi_0.kernel/0.4 +3 -0
- checkpoint_1007000/target.decoder.layers_11.mlp.wi_0.kernel/0.5 +3 -0
- checkpoint_1007000/target.decoder.layers_11.mlp.wi_0.kernel/0.6 +3 -0
- checkpoint_1007000/target.decoder.layers_11.mlp.wi_0.kernel/0.7 +3 -0
- checkpoint_1007000/target.decoder.layers_11.pre_mlp_layer_norm.scale/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_11.pre_mlp_layer_norm.scale/0 +0 -0
- checkpoint_1007000/target.decoder.layers_12.mlp.wi_0.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_12.mlp.wi_0.kernel/.zarray.__tmp17477021328867075685.~1663960300307643~ +1 -0
- checkpoint_1007000/target.decoder.layers_12.mlp.wi_0.kernel/.zarray.__tmp8601028490451669708.~1663960300312763~ +1 -0
- checkpoint_1007000/target.decoder.layers_12.mlp.wi_0.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_12.mlp.wi_0.kernel/0.1 +3 -0
- checkpoint_1007000/target.decoder.layers_12.mlp.wi_0.kernel/0.2 +3 -0
- checkpoint_1007000/target.decoder.layers_12.mlp.wi_0.kernel/0.3 +3 -0
- checkpoint_1007000/target.decoder.layers_12.mlp.wi_0.kernel/0.4 +3 -0
- checkpoint_1007000/target.decoder.layers_12.mlp.wi_0.kernel/0.5 +3 -0
- checkpoint_1007000/target.decoder.layers_12.mlp.wi_0.kernel/0.6 +3 -0
- checkpoint_1007000/target.decoder.layers_12.mlp.wi_0.kernel/0.7 +3 -0
- checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.out.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.out.kernel/.zarray.__tmp11103892762810324551.~1663960300272621~ +1 -0
- checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.out.kernel/.zarray.__tmp1294020699136088639.~1663960300885466~ +1 -0
- checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.out.kernel/.zarray.__tmp13195707986353451157.~1663960300549776~ +1 -0
- checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.out.kernel/.zarray.__tmp16486626858036458649.~1663960300423204~ +1 -0
.gitattributes
CHANGED
|
@@ -2721,3 +2721,55 @@ checkpoint_1007000/target.encoder.layers_19.attention.out.kernel/3.0 filter=lfs
|
|
| 2721 |
checkpoint_1007000/target.encoder.layers_19.attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 2722 |
checkpoint_1007000/target.encoder.layers_19.attention.out.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
|
| 2723 |
checkpoint_1007000/target.encoder.layers_19.attention.out.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 2721 |
checkpoint_1007000/target.encoder.layers_19.attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 2722 |
checkpoint_1007000/target.encoder.layers_19.attention.out.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
|
| 2723 |
checkpoint_1007000/target.encoder.layers_19.attention.out.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
|
| 2724 |
+
checkpoint_1007000/target.encoder.layers_19.attention.out.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 2725 |
+
checkpoint_1007000/target.encoder.layers_19.attention.out.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
|
| 2726 |
+
checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.out.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
|
| 2727 |
+
checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 2728 |
+
checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.out.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 2729 |
+
checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 2730 |
+
checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.out.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
|
| 2731 |
+
checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.out.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
|
| 2732 |
+
checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.out.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 2733 |
+
checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.out.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
|
| 2734 |
+
checkpoint_1007000/target.encoder.layers_7.mlp.wi_1.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 2735 |
+
checkpoint_1007000/target.encoder.layers_7.mlp.wi_1.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 2736 |
+
checkpoint_1007000/target.encoder.layers_7.mlp.wi_1.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 2737 |
+
checkpoint_1007000/target.encoder.layers_7.mlp.wi_1.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 2738 |
+
checkpoint_1007000/target.encoder.layers_7.mlp.wi_1.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 2739 |
+
checkpoint_1007000/target.encoder.layers_7.mlp.wi_1.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 2740 |
+
checkpoint_1007000/target.encoder.layers_7.mlp.wi_1.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 2741 |
+
checkpoint_1007000/target.encoder.layers_7.mlp.wi_1.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 2742 |
+
checkpoint_1007000/target.decoder.layers_10.mlp.wo.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
|
| 2743 |
+
checkpoint_1007000/target.decoder.layers_10.mlp.wo.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 2744 |
+
checkpoint_1007000/target.decoder.layers_10.mlp.wo.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 2745 |
+
checkpoint_1007000/target.decoder.layers_10.mlp.wo.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 2746 |
+
checkpoint_1007000/target.decoder.layers_10.mlp.wo.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
|
| 2747 |
+
checkpoint_1007000/target.decoder.layers_10.mlp.wo.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
|
| 2748 |
+
checkpoint_1007000/target.decoder.layers_10.mlp.wo.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 2749 |
+
checkpoint_1007000/target.decoder.layers_10.mlp.wo.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
|
| 2750 |
+
checkpoint_1007000/target.decoder.layers_12.mlp.wi_0.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 2751 |
+
checkpoint_1007000/target.decoder.layers_12.mlp.wi_0.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 2752 |
+
checkpoint_1007000/target.decoder.layers_12.mlp.wi_0.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 2753 |
+
checkpoint_1007000/target.decoder.layers_12.mlp.wi_0.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 2754 |
+
checkpoint_1007000/target.decoder.layers_12.mlp.wi_0.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 2755 |
+
checkpoint_1007000/target.decoder.layers_12.mlp.wi_0.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 2756 |
+
checkpoint_1007000/target.decoder.layers_12.mlp.wi_0.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 2757 |
+
checkpoint_1007000/target.decoder.layers_12.mlp.wi_0.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 2758 |
+
checkpoint_1007000/target.decoder.layers_11.mlp.wi_0.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 2759 |
+
checkpoint_1007000/target.decoder.layers_11.mlp.wi_0.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 2760 |
+
checkpoint_1007000/target.decoder.layers_11.mlp.wi_0.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 2761 |
+
checkpoint_1007000/target.decoder.layers_11.mlp.wi_0.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 2762 |
+
checkpoint_1007000/target.decoder.layers_11.mlp.wi_0.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 2763 |
+
checkpoint_1007000/target.decoder.layers_11.mlp.wi_0.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 2764 |
+
checkpoint_1007000/target.decoder.layers_11.mlp.wi_0.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 2765 |
+
checkpoint_1007000/target.decoder.layers_11.mlp.wi_0.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 2766 |
+
checkpoint_1007000/target.encoder.layers_13.mlp.wi_0.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 2767 |
+
checkpoint_1007000/target.encoder.layers_13.mlp.wi_0.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 2768 |
+
checkpoint_1007000/target.encoder.layers_13.mlp.wi_0.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 2769 |
+
checkpoint_1007000/target.encoder.layers_13.mlp.wi_0.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 2770 |
+
checkpoint_1007000/target.encoder.layers_13.mlp.wi_0.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 2771 |
+
checkpoint_1007000/target.encoder.layers_13.mlp.wi_0.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 2772 |
+
checkpoint_1007000/target.encoder.layers_13.mlp.wi_0.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 2773 |
+
checkpoint_1007000/target.encoder.layers_13.mlp.wi_0.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 2774 |
+
checkpoint_1007000/target.decoder.layers_19.self_attention.out.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
|
| 2775 |
+
checkpoint_1007000/target.decoder.layers_19.self_attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
checkpoint_1007000/state.param_states.decoder.layers_19.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/state.param_states.decoder.layers_19.pre_cross_attention_layer_norm.scale.v/0
ADDED
|
Binary file (14.6 kB). View file
|
|
|
checkpoint_1007000/state.param_states.decoder.layers_5.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/state.param_states.decoder.layers_5.pre_cross_attention_layer_norm.scale.v/0
ADDED
|
Binary file (15 kB). View file
|
|
|
checkpoint_1007000/target.decoder.layers_10.mlp.wo.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_10.mlp.wo.kernel/.zarray.__tmp12556689117730967044.~1663960300067269~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_10.mlp.wo.kernel/.zarray.__tmp2198192486624046698.~1663960301112693~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_10.mlp.wo.kernel/.zarray.__tmp4289778998305236925.~1663960300016046~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_10.mlp.wo.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4871fadfd724ae526ac399f41461dc64e6b800d40e92c5374cd0a5ee6f73270e
|
| 3 |
+
size 19546237
|
checkpoint_1007000/target.decoder.layers_10.mlp.wo.kernel/1.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d1fd2862e3b98615aa920829cb9b36ae279b26cb8c42dfa3f14b97c25e579ca9
|
| 3 |
+
size 19546822
|
checkpoint_1007000/target.decoder.layers_10.mlp.wo.kernel/2.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7cba1c05bff1419ab92ce02e9fa53119d2e70f1224481d34e47f7a19479b016b
|
| 3 |
+
size 19546486
|
checkpoint_1007000/target.decoder.layers_10.mlp.wo.kernel/3.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b355a32ca184ce9421536e5778a138837aa4c11c31d1f6a84750de5f90a08f7e
|
| 3 |
+
size 19546009
|
checkpoint_1007000/target.decoder.layers_10.mlp.wo.kernel/4.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b6b5972ce171633cdf3c344d530907031e71a803269d29dc5fa0169afdd552a0
|
| 3 |
+
size 19546921
|
checkpoint_1007000/target.decoder.layers_10.mlp.wo.kernel/5.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d542314d533f9d257f3ef36c61646e72722226e132d420a46d923f7e93193a6b
|
| 3 |
+
size 19547266
|
checkpoint_1007000/target.decoder.layers_10.mlp.wo.kernel/6.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a112c1adbb586f74a2affe0bf83f00795abea744b57cbcbbc41dce416ac08c03
|
| 3 |
+
size 19546485
|
checkpoint_1007000/target.decoder.layers_10.mlp.wo.kernel/7.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a476bcabe007fc01135991cfc8b67de0aab86f026bd67df9c0a50f073e0e8ccd
|
| 3 |
+
size 19546869
|
checkpoint_1007000/target.decoder.layers_11.mlp.wi_0.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_11.mlp.wi_0.kernel/.zarray.__tmp10770559433335723149.~1663960300550170~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_11.mlp.wi_0.kernel/.zarray.__tmp12608879935475681094.~1663960300728156~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_11.mlp.wi_0.kernel/.zarray.__tmp18328120602218273837.~1663960300471175~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_11.mlp.wi_0.kernel/.zarray.__tmp2623057869094272155.~1663960300493629~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_11.mlp.wi_0.kernel/.zarray.__tmp4168994715625229474.~1663960300989987~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_11.mlp.wi_0.kernel/.zarray.__tmp5600032214776525345.~1663960300420545~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_11.mlp.wi_0.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0763e03b25b5d9c9a079fb7da87b0e5ad381f71e901f80ac7d880dbc9fb8477f
|
| 3 |
+
size 19537386
|
checkpoint_1007000/target.decoder.layers_11.mlp.wi_0.kernel/0.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:160c0a13cbafadcad8662236599609e17bc5aa89d7cf11ff1bd65d87d2e00b5b
|
| 3 |
+
size 19537978
|
checkpoint_1007000/target.decoder.layers_11.mlp.wi_0.kernel/0.2
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1734d29b6b1f6eccecc8c8687d2cb25b9c5a941594ff283daff044f9b04398de
|
| 3 |
+
size 19537869
|
checkpoint_1007000/target.decoder.layers_11.mlp.wi_0.kernel/0.3
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c52f154fdf3447d5b385c4a2c447aafe9154d10c63850999ff9a128d7f9f0a9a
|
| 3 |
+
size 19537563
|
checkpoint_1007000/target.decoder.layers_11.mlp.wi_0.kernel/0.4
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3f21e317c04b90080e6a83e669df3cfb56398bf1c70a35da7f3b5cbb3c024ba5
|
| 3 |
+
size 19536732
|
checkpoint_1007000/target.decoder.layers_11.mlp.wi_0.kernel/0.5
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:523b1998241d63cb669f588b6502f0656ef722117ab00b9612513b043dcce54e
|
| 3 |
+
size 19538457
|
checkpoint_1007000/target.decoder.layers_11.mlp.wi_0.kernel/0.6
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d50a6456885c58171e331f0bc727d4a7909e1600cd4e150c4b3169a9965d3efe
|
| 3 |
+
size 19537378
|
checkpoint_1007000/target.decoder.layers_11.mlp.wi_0.kernel/0.7
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:42bdb34c089ea9007ea23a08d1bc618a7d0a080fa110c3cd0d0fb72b5c977b9d
|
| 3 |
+
size 19537214
|
checkpoint_1007000/target.decoder.layers_11.pre_mlp_layer_norm.scale/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_11.pre_mlp_layer_norm.scale/0
ADDED
|
Binary file (14.8 kB). View file
|
|
|
checkpoint_1007000/target.decoder.layers_12.mlp.wi_0.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_12.mlp.wi_0.kernel/.zarray.__tmp17477021328867075685.~1663960300307643~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_12.mlp.wi_0.kernel/.zarray.__tmp8601028490451669708.~1663960300312763~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_12.mlp.wi_0.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:423dc9b3a2988ffa86e9dc8934c7827c9a4d674dfe3587ca961d4cd3efac2d42
|
| 3 |
+
size 19535427
|
checkpoint_1007000/target.decoder.layers_12.mlp.wi_0.kernel/0.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4508366ddbb72d6aafde91161bfe228372df6e176db6d38e1438915fda4f4a25
|
| 3 |
+
size 19534271
|
checkpoint_1007000/target.decoder.layers_12.mlp.wi_0.kernel/0.2
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:929f13a291e155b63bc522b7d33f2693631766a3dba6e1eb13aa01fabd0ea5f2
|
| 3 |
+
size 19533620
|
checkpoint_1007000/target.decoder.layers_12.mlp.wi_0.kernel/0.3
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4551e2915c52ebffe717ac7a14d4bff0e565cf1ee201926971e1d2284ea4e7f8
|
| 3 |
+
size 19534262
|
checkpoint_1007000/target.decoder.layers_12.mlp.wi_0.kernel/0.4
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f5adfe4b57f43f75ee97dbf036921f77b43257e27e011944a37578c3765314ec
|
| 3 |
+
size 19534040
|
checkpoint_1007000/target.decoder.layers_12.mlp.wi_0.kernel/0.5
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c11d423d8196f6097ec998703bd41c4253127a92b3595b30cff9fc1118f01023
|
| 3 |
+
size 19534504
|
checkpoint_1007000/target.decoder.layers_12.mlp.wi_0.kernel/0.6
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:122f8a68622afc7481c9d515bcc7c59657a74e70318e51a18443a5d1db24d2c8
|
| 3 |
+
size 19533720
|
checkpoint_1007000/target.decoder.layers_12.mlp.wi_0.kernel/0.7
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ac5e0e10ea7a0a9c7d03e17b6dae865036023e3615ff30beadf2bbe2d9be70b4
|
| 3 |
+
size 19534123
|
checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.out.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.out.kernel/.zarray.__tmp11103892762810324551.~1663960300272621~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.out.kernel/.zarray.__tmp1294020699136088639.~1663960300885466~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.out.kernel/.zarray.__tmp13195707986353451157.~1663960300549776~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.out.kernel/.zarray.__tmp16486626858036458649.~1663960300423204~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|