Commit
·
eeee4a0
1
Parent(s):
0f3aef5
Upload part 40
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +48 -0
- checkpoint_1007000/state.param_states.encoder.layers_12.pre_attention_layer_norm.scale.v/.zarray +1 -0
- checkpoint_1007000/state.param_states.encoder.layers_12.pre_attention_layer_norm.scale.v/0 +0 -0
- checkpoint_1007000/state.param_states.encoder.layers_19.pre_mlp_layer_norm.scale.v/.zarray +1 -0
- checkpoint_1007000/state.param_states.encoder.layers_19.pre_mlp_layer_norm.scale.v/0 +0 -0
- checkpoint_1007000/target.decoder.decoder_norm.scale/.zarray +1 -0
- checkpoint_1007000/target.decoder.decoder_norm.scale/0 +0 -0
- checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/.zarray.__tmp15590069018174250927.~1663960300308256~ +1 -0
- checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/.zarray.__tmp15744899109354973635.~1663960300421932~ +1 -0
- checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/.zarray.__tmp18375236708728796867.~1663960300688867~ +1 -0
- checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/.zarray.__tmp2103911721188231572.~1663960300822920~ +1 -0
- checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/.zarray.__tmp4333629875821823980.~1663960300551128~ +1 -0
- checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/.zarray.__tmp7696852913333449298.~1663960300272803~ +1 -0
- checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/.zarray.__tmp9885211211724445706.~1663960300632501~ +1 -0
- checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/0.1 +3 -0
- checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/0.2 +3 -0
- checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/0.3 +3 -0
- checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/0.4 +3 -0
- checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/0.5 +3 -0
- checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/0.6 +3 -0
- checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/0.7 +3 -0
- checkpoint_1007000/target.decoder.layers_16.encoder_decoder_attention.query.kernel/.zarray.__tmp14275400193037987122.~1663960300384017~ +1 -0
- checkpoint_1007000/target.decoder.layers_16.encoder_decoder_attention.query.kernel/.zarray.__tmp5453924144578779166.~1663960300467517~ +1 -0
- checkpoint_1007000/target.decoder.layers_16.encoder_decoder_attention.query.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_16.encoder_decoder_attention.query.kernel/0.1 +3 -0
- checkpoint_1007000/target.decoder.layers_16.encoder_decoder_attention.query.kernel/0.6 +3 -0
- checkpoint_1007000/target.decoder.layers_16.encoder_decoder_attention.query.kernel/0.7 +3 -0
- checkpoint_1007000/target.decoder.layers_2.self_attention.value.kernel/.zarray.__tmp14805654823044195203.~1663960300941182~ +1 -0
- checkpoint_1007000/target.decoder.layers_2.self_attention.value.kernel/.zarray.__tmp18402290304374832220.~1663960300610766~ +1 -0
- checkpoint_1007000/target.decoder.layers_2.self_attention.value.kernel/.zarray.__tmp6102370472552948078.~1663960300501139~ +1 -0
- checkpoint_1007000/target.decoder.layers_2.self_attention.value.kernel/.zarray.__tmp6369220955053798728.~1663960300890367~ +1 -0
- checkpoint_1007000/target.decoder.layers_2.self_attention.value.kernel/.zarray.__tmp7004825582130560441.~1663960300601053~ +1 -0
- checkpoint_1007000/target.decoder.layers_2.self_attention.value.kernel/0.2 +3 -0
- checkpoint_1007000/target.decoder.layers_2.self_attention.value.kernel/0.3 +3 -0
- checkpoint_1007000/target.decoder.layers_2.self_attention.value.kernel/0.4 +3 -0
- checkpoint_1007000/target.decoder.layers_2.self_attention.value.kernel/0.5 +3 -0
- checkpoint_1007000/target.decoder.layers_21.mlp.wi_1.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_21.mlp.wi_1.kernel/.zarray.__tmp13176058321298810016.~1663960300549058~ +1 -0
- checkpoint_1007000/target.decoder.layers_21.mlp.wi_1.kernel/.zarray.__tmp1715683602810787734.~1663960300986925~ +1 -0
- checkpoint_1007000/target.decoder.layers_21.mlp.wi_1.kernel/.zarray.__tmp1806355867141919373.~1663960300862420~ +1 -0
- checkpoint_1007000/target.decoder.layers_21.mlp.wi_1.kernel/.zarray.__tmp18355203970343633918.~1663960300466384~ +1 -0
- checkpoint_1007000/target.decoder.layers_21.mlp.wi_1.kernel/.zarray.__tmp18395826612412633390.~1663960300551073~ +1 -0
- checkpoint_1007000/target.decoder.layers_21.mlp.wi_1.kernel/.zarray.__tmp8508567864372588290.~1663960300472419~ +1 -0
- checkpoint_1007000/target.decoder.layers_21.mlp.wi_1.kernel/.zarray.__tmp9748784751914184662.~1663960300602153~ +1 -0
- checkpoint_1007000/target.decoder.layers_21.mlp.wi_1.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_21.mlp.wi_1.kernel/0.1 +3 -0
- checkpoint_1007000/target.decoder.layers_21.mlp.wi_1.kernel/0.2 +3 -0
- checkpoint_1007000/target.decoder.layers_21.mlp.wi_1.kernel/0.3 +3 -0
.gitattributes
CHANGED
|
@@ -2039,3 +2039,51 @@ checkpoint_1007000/target.decoder.layers_2.self_attention.value.kernel/0.1 filte
|
|
| 2039 |
checkpoint_1007000/target.decoder.layers_2.self_attention.value.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 2040 |
checkpoint_1007000/target.decoder.layers_2.self_attention.value.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 2041 |
checkpoint_1007000/target.decoder.layers_2.self_attention.value.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 2039 |
checkpoint_1007000/target.decoder.layers_2.self_attention.value.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 2040 |
checkpoint_1007000/target.decoder.layers_2.self_attention.value.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 2041 |
checkpoint_1007000/target.decoder.layers_2.self_attention.value.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 2042 |
+
checkpoint_1007000/target.decoder.layers_2.self_attention.value.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 2043 |
+
checkpoint_1007000/target.decoder.layers_2.self_attention.value.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 2044 |
+
checkpoint_1007000/target.decoder.layers_2.self_attention.value.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 2045 |
+
checkpoint_1007000/target.decoder.layers_2.self_attention.value.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 2046 |
+
checkpoint_1007000/target.encoder.layers_18.mlp.wi_0.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 2047 |
+
checkpoint_1007000/target.encoder.layers_18.mlp.wi_0.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 2048 |
+
checkpoint_1007000/target.encoder.layers_18.mlp.wi_0.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 2049 |
+
checkpoint_1007000/target.encoder.layers_18.mlp.wi_0.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 2050 |
+
checkpoint_1007000/target.encoder.layers_18.mlp.wi_0.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 2051 |
+
checkpoint_1007000/target.encoder.layers_18.mlp.wi_0.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 2052 |
+
checkpoint_1007000/target.encoder.layers_18.mlp.wi_0.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 2053 |
+
checkpoint_1007000/target.encoder.layers_18.mlp.wi_0.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 2054 |
+
checkpoint_1007000/target.decoder.layers_21.mlp.wi_1.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 2055 |
+
checkpoint_1007000/target.decoder.layers_21.mlp.wi_1.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 2056 |
+
checkpoint_1007000/target.decoder.layers_21.mlp.wi_1.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 2057 |
+
checkpoint_1007000/target.decoder.layers_21.mlp.wi_1.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 2058 |
+
checkpoint_1007000/target.decoder.layers_21.mlp.wi_1.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 2059 |
+
checkpoint_1007000/target.decoder.layers_21.mlp.wi_1.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 2060 |
+
checkpoint_1007000/target.decoder.layers_21.mlp.wi_1.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 2061 |
+
checkpoint_1007000/target.decoder.layers_21.mlp.wi_1.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 2062 |
+
checkpoint_1007000/target.encoder.layers_4.mlp.wo.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
|
| 2063 |
+
checkpoint_1007000/target.encoder.layers_4.mlp.wo.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 2064 |
+
checkpoint_1007000/target.encoder.layers_4.mlp.wo.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 2065 |
+
checkpoint_1007000/target.encoder.layers_4.mlp.wo.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 2066 |
+
checkpoint_1007000/target.encoder.layers_4.mlp.wo.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
|
| 2067 |
+
checkpoint_1007000/target.encoder.layers_4.mlp.wo.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
|
| 2068 |
+
checkpoint_1007000/target.encoder.layers_4.mlp.wo.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 2069 |
+
checkpoint_1007000/target.encoder.layers_4.mlp.wo.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
|
| 2070 |
+
checkpoint_1007000/target.decoder.layers_9.encoder_decoder_attention.value.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 2071 |
+
checkpoint_1007000/target.decoder.layers_9.encoder_decoder_attention.value.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 2072 |
+
checkpoint_1007000/target.decoder.layers_9.encoder_decoder_attention.value.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 2073 |
+
checkpoint_1007000/target.decoder.layers_9.encoder_decoder_attention.value.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 2074 |
+
checkpoint_1007000/target.decoder.layers_9.encoder_decoder_attention.value.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 2075 |
+
checkpoint_1007000/target.decoder.layers_9.encoder_decoder_attention.value.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 2076 |
+
checkpoint_1007000/target.decoder.layers_9.encoder_decoder_attention.value.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 2077 |
+
checkpoint_1007000/target.decoder.layers_9.encoder_decoder_attention.value.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 2078 |
+
checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 2079 |
+
checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 2080 |
+
checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 2081 |
+
checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 2082 |
+
checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 2083 |
+
checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 2084 |
+
checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 2085 |
+
checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 2086 |
+
checkpoint_1007000/target.decoder.layers_16.encoder_decoder_attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 2087 |
+
checkpoint_1007000/target.decoder.layers_16.encoder_decoder_attention.query.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 2088 |
+
checkpoint_1007000/target.decoder.layers_16.encoder_decoder_attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 2089 |
+
checkpoint_1007000/target.decoder.layers_16.encoder_decoder_attention.query.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
checkpoint_1007000/state.param_states.encoder.layers_12.pre_attention_layer_norm.scale.v/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/state.param_states.encoder.layers_12.pre_attention_layer_norm.scale.v/0
ADDED
|
Binary file (15.3 kB). View file
|
|
|
checkpoint_1007000/state.param_states.encoder.layers_19.pre_mlp_layer_norm.scale.v/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/state.param_states.encoder.layers_19.pre_mlp_layer_norm.scale.v/0
ADDED
|
Binary file (14.9 kB). View file
|
|
|
checkpoint_1007000/target.decoder.decoder_norm.scale/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.decoder_norm.scale/0
ADDED
|
Binary file (14.3 kB). View file
|
|
|
checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/.zarray.__tmp15590069018174250927.~1663960300308256~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/.zarray.__tmp15744899109354973635.~1663960300421932~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/.zarray.__tmp18375236708728796867.~1663960300688867~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/.zarray.__tmp2103911721188231572.~1663960300822920~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/.zarray.__tmp4333629875821823980.~1663960300551128~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/.zarray.__tmp7696852913333449298.~1663960300272803~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/.zarray.__tmp9885211211724445706.~1663960300632501~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:45ebfd0c4619eabdf9d89d4b4d4ca63be84cef787c197f35104910d2b96c1eb0
|
| 3 |
+
size 19499409
|
checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/0.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:86bb7fb122a44e6a1626d0a228a3b16a73fd8733d882b16d7ea13ae71f669335
|
| 3 |
+
size 19499699
|
checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/0.2
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:735386322dd1ca5a92f9ec8be01acd5f8bd440a63824c4d7e866cde0e7250f19
|
| 3 |
+
size 19499040
|
checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/0.3
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0aae8a586369c2f5662ddbd2070c629eebb94005dc0c61880be17eda15621d26
|
| 3 |
+
size 19499866
|
checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/0.4
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f2856535b155eb66ef1bb6a9a80aee5e8d7a23cc0b1352de5324af33bcde7c01
|
| 3 |
+
size 19500203
|
checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/0.5
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9346c213d864a83e8b7c893834c5489aaa770ade387930c9a9a26fa71a4a4e4a
|
| 3 |
+
size 19499283
|
checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/0.6
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b6c2de7332788264bc0cabe6465a6748c9b378a4eb961a7965d42059a58a0212
|
| 3 |
+
size 19499187
|
checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/0.7
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b0923a051abb9de18aa5b6ecb18d9eb8278e79d17ec5ef71b12c8193c8594915
|
| 3 |
+
size 19499839
|
checkpoint_1007000/target.decoder.layers_16.encoder_decoder_attention.query.kernel/.zarray.__tmp14275400193037987122.~1663960300384017~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_16.encoder_decoder_attention.query.kernel/.zarray.__tmp5453924144578779166.~1663960300467517~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_16.encoder_decoder_attention.query.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2df3c7ee498018ada3395244f5cd966c96cfc36723a0170b446d5014ffc94a6e
|
| 3 |
+
size 7829506
|
checkpoint_1007000/target.decoder.layers_16.encoder_decoder_attention.query.kernel/0.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:846e55aa07403ec56feadbf63d504abb5486d9fa81b54a835aae87c970a90f0b
|
| 3 |
+
size 7817548
|
checkpoint_1007000/target.decoder.layers_16.encoder_decoder_attention.query.kernel/0.6
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:421ff9ef3aa7a31215303afde29fa305259111bfa93a74a9d8da996364a591ba
|
| 3 |
+
size 7817345
|
checkpoint_1007000/target.decoder.layers_16.encoder_decoder_attention.query.kernel/0.7
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8a24e3541ef54848bdd17cdf7301eb78109d3190dc5e5d938e28162f6021b72e
|
| 3 |
+
size 7818318
|
checkpoint_1007000/target.decoder.layers_2.self_attention.value.kernel/.zarray.__tmp14805654823044195203.~1663960300941182~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_2.self_attention.value.kernel/.zarray.__tmp18402290304374832220.~1663960300610766~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_2.self_attention.value.kernel/.zarray.__tmp6102370472552948078.~1663960300501139~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_2.self_attention.value.kernel/.zarray.__tmp6369220955053798728.~1663960300890367~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_2.self_attention.value.kernel/.zarray.__tmp7004825582130560441.~1663960300601053~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_2.self_attention.value.kernel/0.2
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2ab5a5157075ef0c92909267349a61d6aeaf4fd4d5dcb109c9410424b5075450
|
| 3 |
+
size 7815895
|
checkpoint_1007000/target.decoder.layers_2.self_attention.value.kernel/0.3
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1f2ccd22a40964baef1ed5a3ef1326f9a1a22436a2fc864a380269e328621512
|
| 3 |
+
size 7820427
|
checkpoint_1007000/target.decoder.layers_2.self_attention.value.kernel/0.4
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:584cfb0f56c6ebf2e9c2052d064b3b30a4e6de3dac3a16e5d9d1548fcbfcaa6c
|
| 3 |
+
size 7820338
|
checkpoint_1007000/target.decoder.layers_2.self_attention.value.kernel/0.5
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0f3959986e249abe9d5710ce77d2c294658b4c04951bfa49526e69a9d1f6495a
|
| 3 |
+
size 7820664
|
checkpoint_1007000/target.decoder.layers_21.mlp.wi_1.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_21.mlp.wi_1.kernel/.zarray.__tmp13176058321298810016.~1663960300549058~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_21.mlp.wi_1.kernel/.zarray.__tmp1715683602810787734.~1663960300986925~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_21.mlp.wi_1.kernel/.zarray.__tmp1806355867141919373.~1663960300862420~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_21.mlp.wi_1.kernel/.zarray.__tmp18355203970343633918.~1663960300466384~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_21.mlp.wi_1.kernel/.zarray.__tmp18395826612412633390.~1663960300551073~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_21.mlp.wi_1.kernel/.zarray.__tmp8508567864372588290.~1663960300472419~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_21.mlp.wi_1.kernel/.zarray.__tmp9748784751914184662.~1663960300602153~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_21.mlp.wi_1.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:81df7532ad11ecf0d825d107031c39b8bf566a2ef3564613c8f3f62d41ef1a7a
|
| 3 |
+
size 19498750
|
checkpoint_1007000/target.decoder.layers_21.mlp.wi_1.kernel/0.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5fd3fc124140dbd91842bd576c901cc6e858e15b06345bf2b28b4ae8c36185bf
|
| 3 |
+
size 19497807
|
checkpoint_1007000/target.decoder.layers_21.mlp.wi_1.kernel/0.2
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ef77f53082e13c6251d79725fe4283fe250ed0b42babd8461dd9baa7d0733a94
|
| 3 |
+
size 19498545
|
checkpoint_1007000/target.decoder.layers_21.mlp.wi_1.kernel/0.3
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:70f7ee4713350e57aa976c9faf964a9884e8334bd5f4253afc82a68a71aa3e34
|
| 3 |
+
size 19498564
|