Commit
·
02a5523
1
Parent(s):
ffa5744
Upload part 61
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +45 -0
- checkpoint_1007000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/.zarray +1 -0
- checkpoint_1007000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/0 +0 -0
- checkpoint_1007000/state.param_states.decoder.layers_12.pre_self_attention_layer_norm.scale.v/.zarray +1 -0
- checkpoint_1007000/state.param_states.decoder.layers_12.pre_self_attention_layer_norm.scale.v/0 +0 -0
- checkpoint_1007000/state.param_states.decoder.layers_18.pre_mlp_layer_norm.scale.v/.zarray +1 -0
- checkpoint_1007000/state.param_states.decoder.layers_18.pre_mlp_layer_norm.scale.v/0 +0 -0
- checkpoint_1007000/state.param_states.decoder.layers_3.pre_cross_attention_layer_norm.scale.v/.zarray +1 -0
- checkpoint_1007000/state.param_states.decoder.layers_3.pre_cross_attention_layer_norm.scale.v/0 +0 -0
- checkpoint_1007000/state.param_states.encoder.layers_16.pre_attention_layer_norm.scale.v/.zarray +1 -0
- checkpoint_1007000/state.param_states.encoder.layers_16.pre_attention_layer_norm.scale.v/0 +0 -0
- checkpoint_1007000/target.decoder.layers_1.mlp.wi_1.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_1.mlp.wi_1.kernel/.zarray.__tmp10517390467754450665.~1663960300551712~ +1 -0
- checkpoint_1007000/target.decoder.layers_1.mlp.wi_1.kernel/.zarray.__tmp11150637201827260636.~1663960299931181~ +1 -0
- checkpoint_1007000/target.decoder.layers_1.mlp.wi_1.kernel/.zarray.__tmp13682278226412302013.~1663960300351390~ +1 -0
- checkpoint_1007000/target.decoder.layers_1.mlp.wi_1.kernel/.zarray.__tmp15470470356051346968.~1663960300466733~ +1 -0
- checkpoint_1007000/target.decoder.layers_1.mlp.wi_1.kernel/.zarray.__tmp16070463848400767033.~1663960300725298~ +1 -0
- checkpoint_1007000/target.decoder.layers_1.mlp.wi_1.kernel/.zarray.__tmp4715606895551759948.~1663960301026880~ +1 -0
- checkpoint_1007000/target.decoder.layers_1.mlp.wi_1.kernel/.zarray.__tmp6990172224503877914.~1663960300312662~ +1 -0
- checkpoint_1007000/target.decoder.layers_1.mlp.wi_1.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_1.mlp.wi_1.kernel/0.1 +3 -0
- checkpoint_1007000/target.decoder.layers_1.mlp.wi_1.kernel/0.2 +3 -0
- checkpoint_1007000/target.decoder.layers_1.mlp.wi_1.kernel/0.3 +3 -0
- checkpoint_1007000/target.decoder.layers_1.mlp.wi_1.kernel/0.4 +3 -0
- checkpoint_1007000/target.decoder.layers_1.mlp.wi_1.kernel/0.5 +3 -0
- checkpoint_1007000/target.decoder.layers_1.mlp.wi_1.kernel/0.6 +3 -0
- checkpoint_1007000/target.decoder.layers_1.mlp.wi_1.kernel/0.7 +3 -0
- checkpoint_1007000/target.decoder.layers_23.mlp.wi_0.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_23.mlp.wi_0.kernel/.zarray.__tmp1205921361634409564.~1663960300983122~ +1 -0
- checkpoint_1007000/target.decoder.layers_23.mlp.wi_0.kernel/.zarray.__tmp14490137502884448524.~1663960300686127~ +1 -0
- checkpoint_1007000/target.decoder.layers_23.mlp.wi_0.kernel/.zarray.__tmp15544941891285971030.~1663960300986688~ +1 -0
- checkpoint_1007000/target.decoder.layers_23.mlp.wi_0.kernel/.zarray.__tmp17118588101480905845.~1663960300775461~ +1 -0
- checkpoint_1007000/target.decoder.layers_23.mlp.wi_0.kernel/.zarray.__tmp395293112486858167.~1663960300611240~ +1 -0
- checkpoint_1007000/target.decoder.layers_23.mlp.wi_0.kernel/.zarray.__tmp4344476625017950312.~1663960300550364~ +1 -0
- checkpoint_1007000/target.decoder.layers_23.mlp.wi_0.kernel/.zarray.__tmp6123013506858204450.~1663960300467733~ +1 -0
- checkpoint_1007000/target.decoder.layers_23.mlp.wi_0.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_23.mlp.wi_0.kernel/0.1 +3 -0
- checkpoint_1007000/target.decoder.layers_23.mlp.wi_0.kernel/0.2 +3 -0
- checkpoint_1007000/target.decoder.layers_23.mlp.wi_0.kernel/0.3 +3 -0
- checkpoint_1007000/target.decoder.layers_23.mlp.wi_0.kernel/0.4 +3 -0
- checkpoint_1007000/target.decoder.layers_23.mlp.wi_0.kernel/0.5 +3 -0
- checkpoint_1007000/target.decoder.layers_23.mlp.wi_0.kernel/0.6 +3 -0
- checkpoint_1007000/target.decoder.layers_23.mlp.wi_0.kernel/0.7 +3 -0
- checkpoint_1007000/target.decoder.layers_8.mlp.wi_0.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_8.mlp.wi_0.kernel/.zarray.__tmp13237028885599976962.~1663960300501371~ +1 -0
- checkpoint_1007000/target.decoder.layers_8.mlp.wi_0.kernel/.zarray.__tmp13643889958327600749.~1663960300821896~ +1 -0
- checkpoint_1007000/target.decoder.layers_8.mlp.wi_0.kernel/.zarray.__tmp15168251722097899504.~1663960300688295~ +1 -0
- checkpoint_1007000/target.decoder.layers_8.mlp.wi_0.kernel/.zarray.__tmp17964654552989045865.~1663960301113138~ +1 -0
- checkpoint_1007000/target.decoder.layers_8.mlp.wi_0.kernel/.zarray.__tmp18083641489968413635.~1663960300628382~ +1 -0
- checkpoint_1007000/target.decoder.layers_8.mlp.wi_0.kernel/.zarray.__tmp7637522368554115615.~1663960300467550~ +1 -0
.gitattributes
CHANGED
|
@@ -3056,3 +3056,48 @@ checkpoint_1007000/target.encoder.layers_22.mlp.wo.kernel/1.0 filter=lfs diff=lf
|
|
| 3056 |
checkpoint_1007000/target.encoder.layers_22.mlp.wo.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 3057 |
checkpoint_1007000/target.encoder.layers_22.mlp.wo.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 3058 |
checkpoint_1007000/target.encoder.layers_22.mlp.wo.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 3056 |
checkpoint_1007000/target.encoder.layers_22.mlp.wo.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 3057 |
checkpoint_1007000/target.encoder.layers_22.mlp.wo.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 3058 |
checkpoint_1007000/target.encoder.layers_22.mlp.wo.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
|
| 3059 |
+
checkpoint_1007000/target.encoder.layers_22.mlp.wo.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
|
| 3060 |
+
checkpoint_1007000/target.encoder.layers_22.mlp.wo.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 3061 |
+
checkpoint_1007000/target.encoder.layers_22.mlp.wo.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
|
| 3062 |
+
checkpoint_1007000/target.decoder.layers_23.mlp.wi_0.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 3063 |
+
checkpoint_1007000/target.decoder.layers_23.mlp.wi_0.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 3064 |
+
checkpoint_1007000/target.decoder.layers_23.mlp.wi_0.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 3065 |
+
checkpoint_1007000/target.decoder.layers_23.mlp.wi_0.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 3066 |
+
checkpoint_1007000/target.decoder.layers_23.mlp.wi_0.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 3067 |
+
checkpoint_1007000/target.decoder.layers_23.mlp.wi_0.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 3068 |
+
checkpoint_1007000/target.decoder.layers_23.mlp.wi_0.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 3069 |
+
checkpoint_1007000/target.decoder.layers_23.mlp.wi_0.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 3070 |
+
checkpoint_1007000/target.decoder.layers_8.mlp.wi_0.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 3071 |
+
checkpoint_1007000/target.decoder.layers_8.mlp.wi_0.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 3072 |
+
checkpoint_1007000/target.decoder.layers_8.mlp.wi_0.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 3073 |
+
checkpoint_1007000/target.decoder.layers_8.mlp.wi_0.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 3074 |
+
checkpoint_1007000/target.decoder.layers_8.mlp.wi_0.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 3075 |
+
checkpoint_1007000/target.decoder.layers_8.mlp.wi_0.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 3076 |
+
checkpoint_1007000/target.decoder.layers_8.mlp.wi_0.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 3077 |
+
checkpoint_1007000/target.decoder.layers_8.mlp.wi_0.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 3078 |
+
checkpoint_1007000/target.encoder.layers_19.attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 3079 |
+
checkpoint_1007000/target.encoder.layers_19.attention.key.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 3080 |
+
checkpoint_1007000/target.encoder.layers_19.attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 3081 |
+
checkpoint_1007000/target.encoder.layers_19.attention.key.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 3082 |
+
checkpoint_1007000/target.encoder.layers_19.attention.key.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 3083 |
+
checkpoint_1007000/target.encoder.layers_19.attention.key.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 3084 |
+
checkpoint_1007000/target.encoder.layers_19.attention.key.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 3085 |
+
checkpoint_1007000/target.encoder.layers_19.attention.key.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 3086 |
+
checkpoint_1007000/target.encoder.layers_13.attention.value.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 3087 |
+
checkpoint_1007000/target.encoder.layers_13.attention.value.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 3088 |
+
checkpoint_1007000/target.encoder.layers_13.attention.value.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 3089 |
+
checkpoint_1007000/target.encoder.layers_13.attention.value.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 3090 |
+
checkpoint_1007000/target.encoder.layers_13.attention.value.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 3091 |
+
checkpoint_1007000/target.encoder.layers_13.attention.value.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 3092 |
+
checkpoint_1007000/target.encoder.layers_13.attention.value.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 3093 |
+
checkpoint_1007000/target.encoder.layers_13.attention.value.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 3094 |
+
checkpoint_1007000/target.decoder.layers_1.mlp.wi_1.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 3095 |
+
checkpoint_1007000/target.decoder.layers_1.mlp.wi_1.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 3096 |
+
checkpoint_1007000/target.decoder.layers_1.mlp.wi_1.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 3097 |
+
checkpoint_1007000/target.decoder.layers_1.mlp.wi_1.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 3098 |
+
checkpoint_1007000/target.decoder.layers_1.mlp.wi_1.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 3099 |
+
checkpoint_1007000/target.decoder.layers_1.mlp.wi_1.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 3100 |
+
checkpoint_1007000/target.decoder.layers_1.mlp.wi_1.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 3101 |
+
checkpoint_1007000/target.decoder.layers_1.mlp.wi_1.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 3102 |
+
checkpoint_1007000/target.encoder.layers_11.mlp.wi_1.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 3103 |
+
checkpoint_1007000/target.encoder.layers_11.mlp.wi_1.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
checkpoint_1007000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/0
ADDED
|
Binary file (14.7 kB). View file
|
|
|
checkpoint_1007000/state.param_states.decoder.layers_12.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/state.param_states.decoder.layers_12.pre_self_attention_layer_norm.scale.v/0
ADDED
|
Binary file (15 kB). View file
|
|
|
checkpoint_1007000/state.param_states.decoder.layers_18.pre_mlp_layer_norm.scale.v/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/state.param_states.decoder.layers_18.pre_mlp_layer_norm.scale.v/0
ADDED
|
Binary file (14.7 kB). View file
|
|
|
checkpoint_1007000/state.param_states.decoder.layers_3.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/state.param_states.decoder.layers_3.pre_cross_attention_layer_norm.scale.v/0
ADDED
|
Binary file (14.8 kB). View file
|
|
|
checkpoint_1007000/state.param_states.encoder.layers_16.pre_attention_layer_norm.scale.v/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/state.param_states.encoder.layers_16.pre_attention_layer_norm.scale.v/0
ADDED
|
Binary file (15.1 kB). View file
|
|
|
checkpoint_1007000/target.decoder.layers_1.mlp.wi_1.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_1.mlp.wi_1.kernel/.zarray.__tmp10517390467754450665.~1663960300551712~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_1.mlp.wi_1.kernel/.zarray.__tmp11150637201827260636.~1663960299931181~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_1.mlp.wi_1.kernel/.zarray.__tmp13682278226412302013.~1663960300351390~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_1.mlp.wi_1.kernel/.zarray.__tmp15470470356051346968.~1663960300466733~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_1.mlp.wi_1.kernel/.zarray.__tmp16070463848400767033.~1663960300725298~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_1.mlp.wi_1.kernel/.zarray.__tmp4715606895551759948.~1663960301026880~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_1.mlp.wi_1.kernel/.zarray.__tmp6990172224503877914.~1663960300312662~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_1.mlp.wi_1.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b9e4faaffefa68d0753e03fc5dd2add117dafbf4cba53d4bf5faff4d3cc784f4
|
| 3 |
+
size 19551416
|
checkpoint_1007000/target.decoder.layers_1.mlp.wi_1.kernel/0.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:125ca94584e43a23ff5ba638737336c0e846db1354397db5c5aaa6d746bf5352
|
| 3 |
+
size 19553386
|
checkpoint_1007000/target.decoder.layers_1.mlp.wi_1.kernel/0.2
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:33a855a902087dca244634db728891cb3daed423328cb871a9bc56e6df8bf358
|
| 3 |
+
size 19550112
|
checkpoint_1007000/target.decoder.layers_1.mlp.wi_1.kernel/0.3
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c981cfd3877b71f030e8b3289b293f6a104ad7926d718113afeb38fe26b6767a
|
| 3 |
+
size 19548468
|
checkpoint_1007000/target.decoder.layers_1.mlp.wi_1.kernel/0.4
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8202531e39c0a6c13024489a34244e8ce7301a222d638de251435d4fa2161c0e
|
| 3 |
+
size 19554293
|
checkpoint_1007000/target.decoder.layers_1.mlp.wi_1.kernel/0.5
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5dd3cdc538c0928eb56e401c0db5652b5e5156919431cc9ab99a32c72c646801
|
| 3 |
+
size 19551504
|
checkpoint_1007000/target.decoder.layers_1.mlp.wi_1.kernel/0.6
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b04f458b7a967d094514abbd273acb2942908f70a94b19b6f54dc79338438eaf
|
| 3 |
+
size 19552201
|
checkpoint_1007000/target.decoder.layers_1.mlp.wi_1.kernel/0.7
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:60d76da189edf5507d59f20c12e78b64fa3e88355e1bf184b47c42aa2e7830cd
|
| 3 |
+
size 19549034
|
checkpoint_1007000/target.decoder.layers_23.mlp.wi_0.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_23.mlp.wi_0.kernel/.zarray.__tmp1205921361634409564.~1663960300983122~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_23.mlp.wi_0.kernel/.zarray.__tmp14490137502884448524.~1663960300686127~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_23.mlp.wi_0.kernel/.zarray.__tmp15544941891285971030.~1663960300986688~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_23.mlp.wi_0.kernel/.zarray.__tmp17118588101480905845.~1663960300775461~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_23.mlp.wi_0.kernel/.zarray.__tmp395293112486858167.~1663960300611240~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_23.mlp.wi_0.kernel/.zarray.__tmp4344476625017950312.~1663960300550364~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_23.mlp.wi_0.kernel/.zarray.__tmp6123013506858204450.~1663960300467733~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_23.mlp.wi_0.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:397a3400fc4aa96af7ddf04278f44969348df657de4cf6f5b8f10e1a75305268
|
| 3 |
+
size 19510734
|
checkpoint_1007000/target.decoder.layers_23.mlp.wi_0.kernel/0.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:000dd2446172b8d366481ade78170fd6f9f3056c82070ac068a709d0865b74e4
|
| 3 |
+
size 19511520
|
checkpoint_1007000/target.decoder.layers_23.mlp.wi_0.kernel/0.2
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:242d070bc64c9cac51ee565e7fb41d4bdaaa63161bcdc111f9ec74b33a9c6db5
|
| 3 |
+
size 19511365
|
checkpoint_1007000/target.decoder.layers_23.mlp.wi_0.kernel/0.3
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a8353b30b4b0edcf86f4732a3bf3756bc6c3c5ac4fd1d4dca8e73a815dd4ce5e
|
| 3 |
+
size 19511543
|
checkpoint_1007000/target.decoder.layers_23.mlp.wi_0.kernel/0.4
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2723e2b2f8580cb6dcab13d114ba5fd495222ba43a3542160fb79b5390091294
|
| 3 |
+
size 19510496
|
checkpoint_1007000/target.decoder.layers_23.mlp.wi_0.kernel/0.5
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:726083799b011d8463da02395f290d1dff448abc7d8b578e31861129565b4df5
|
| 3 |
+
size 19511750
|
checkpoint_1007000/target.decoder.layers_23.mlp.wi_0.kernel/0.6
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:09373a51b94ad4759a12f3ea9d78451b05bf077d6e6dd4811ebce8cd84b7b499
|
| 3 |
+
size 19511508
|
checkpoint_1007000/target.decoder.layers_23.mlp.wi_0.kernel/0.7
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4472dc90739c8ab991963969a82b08f03f766bb6e7fe803af295161188dc976d
|
| 3 |
+
size 19511126
|
checkpoint_1007000/target.decoder.layers_8.mlp.wi_0.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_8.mlp.wi_0.kernel/.zarray.__tmp13237028885599976962.~1663960300501371~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_8.mlp.wi_0.kernel/.zarray.__tmp13643889958327600749.~1663960300821896~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_8.mlp.wi_0.kernel/.zarray.__tmp15168251722097899504.~1663960300688295~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_8.mlp.wi_0.kernel/.zarray.__tmp17964654552989045865.~1663960301113138~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_8.mlp.wi_0.kernel/.zarray.__tmp18083641489968413635.~1663960300628382~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_8.mlp.wi_0.kernel/.zarray.__tmp7637522368554115615.~1663960300467550~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|