Commit ·
0e11993
1
Parent(s): 340102f
Upload part 3
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +53 -0
- checkpoint_1007000/state.param_states.decoder.layers_15.pre_mlp_layer_norm.scale.v/.zarray +1 -0
- checkpoint_1007000/state.param_states.decoder.layers_15.pre_mlp_layer_norm.scale.v/0 +0 -0
- checkpoint_1007000/state.param_states.decoder.layers_2.pre_self_attention_layer_norm.scale.v/.zarray +1 -0
- checkpoint_1007000/state.param_states.decoder.layers_2.pre_self_attention_layer_norm.scale.v/0 +0 -0
- checkpoint_1007000/state.param_states.encoder.layers_4.pre_attention_layer_norm.scale.v/.zarray +1 -0
- checkpoint_1007000/state.param_states.encoder.layers_4.pre_attention_layer_norm.scale.v/0 +0 -0
- checkpoint_1007000/target.decoder.layers_11.encoder_decoder_attention.value.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_11.encoder_decoder_attention.value.kernel/.zarray.__tmp10961565108918062831.~1663960300886268~ +1 -0
- checkpoint_1007000/target.decoder.layers_11.encoder_decoder_attention.value.kernel/.zarray.__tmp11793943505122929052.~1663960300505221~ +1 -0
- checkpoint_1007000/target.decoder.layers_11.encoder_decoder_attention.value.kernel/.zarray.__tmp1440098945699490157.~1663960300551568~ +1 -0
- checkpoint_1007000/target.decoder.layers_11.encoder_decoder_attention.value.kernel/.zarray.__tmp14628425770511553113.~1663960300312599~ +1 -0
- checkpoint_1007000/target.decoder.layers_11.encoder_decoder_attention.value.kernel/.zarray.__tmp18297844883934390469.~1663960300494925~ +1 -0
- checkpoint_1007000/target.decoder.layers_11.encoder_decoder_attention.value.kernel/.zarray.__tmp5864613505269189558.~1663960300425303~ +1 -0
- checkpoint_1007000/target.decoder.layers_11.encoder_decoder_attention.value.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_11.encoder_decoder_attention.value.kernel/0.1 +3 -0
- checkpoint_1007000/target.decoder.layers_11.encoder_decoder_attention.value.kernel/0.2 +3 -0
- checkpoint_1007000/target.decoder.layers_11.encoder_decoder_attention.value.kernel/0.3 +3 -0
- checkpoint_1007000/target.decoder.layers_11.encoder_decoder_attention.value.kernel/0.4 +3 -0
- checkpoint_1007000/target.decoder.layers_11.encoder_decoder_attention.value.kernel/0.5 +3 -0
- checkpoint_1007000/target.decoder.layers_11.encoder_decoder_attention.value.kernel/0.6 +3 -0
- checkpoint_1007000/target.decoder.layers_11.encoder_decoder_attention.value.kernel/0.7 +3 -0
- checkpoint_1007000/target.decoder.layers_13.encoder_decoder_attention.out.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_13.encoder_decoder_attention.out.kernel/1.0 +3 -0
- checkpoint_1007000/target.decoder.layers_13.encoder_decoder_attention.out.kernel/3.0 +3 -0
- checkpoint_1007000/target.decoder.layers_13.encoder_decoder_attention.out.kernel/6.0 +3 -0
- checkpoint_1007000/target.decoder.layers_13.encoder_decoder_attention.out.kernel/7.0 +3 -0
- checkpoint_1007000/target.decoder.layers_22.pre_cross_attention_layer_norm.scale/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_22.pre_cross_attention_layer_norm.scale/0 +0 -0
- checkpoint_1007000/target.decoder.layers_23.self_attention.out.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_23.self_attention.out.kernel/.zarray.__tmp12830070173218396735.~1663960300549727~ +1 -0
- checkpoint_1007000/target.decoder.layers_23.self_attention.out.kernel/.zarray.__tmp13183448119106705620.~1663960300385289~ +1 -0
- checkpoint_1007000/target.decoder.layers_23.self_attention.out.kernel/.zarray.__tmp15752704559821348252.~1663960300686341~ +1 -0
- checkpoint_1007000/target.decoder.layers_23.self_attention.out.kernel/.zarray.__tmp464211840814670155.~1663960300776596~ +1 -0
- checkpoint_1007000/target.decoder.layers_23.self_attention.out.kernel/.zarray.__tmp6750169135918407256.~1663960300872835~ +1 -0
- checkpoint_1007000/target.decoder.layers_23.self_attention.out.kernel/.zarray.__tmp7187338248637227935.~1663960300886001~ +1 -0
- checkpoint_1007000/target.decoder.layers_23.self_attention.out.kernel/.zarray.__tmp9319007599745864122.~1663960300351256~ +1 -0
- checkpoint_1007000/target.decoder.layers_23.self_attention.out.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_23.self_attention.out.kernel/1.0 +3 -0
- checkpoint_1007000/target.decoder.layers_23.self_attention.out.kernel/2.0 +3 -0
- checkpoint_1007000/target.decoder.layers_23.self_attention.out.kernel/3.0 +3 -0
- checkpoint_1007000/target.decoder.layers_23.self_attention.out.kernel/4.0 +3 -0
- checkpoint_1007000/target.decoder.layers_23.self_attention.out.kernel/5.0 +3 -0
- checkpoint_1007000/target.decoder.layers_23.self_attention.out.kernel/6.0 +3 -0
- checkpoint_1007000/target.decoder.layers_23.self_attention.out.kernel/7.0 +3 -0
- checkpoint_1007000/target.decoder.layers_3.encoder_decoder_attention.value.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_3.encoder_decoder_attention.value.kernel/.zarray.__tmp11933270201289857914.~1663960300307662~ +1 -0
- checkpoint_1007000/target.decoder.layers_3.encoder_decoder_attention.value.kernel/.zarray.__tmp1696731562003538842.~1663960300312759~ +1 -0
- checkpoint_1007000/target.decoder.layers_3.encoder_decoder_attention.value.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_3.encoder_decoder_attention.value.kernel/0.1 +3 -0
.gitattributes
CHANGED
|
@@ -171,3 +171,56 @@ checkpoint_1007000/target.decoder.layers_15.mlp.wi_0.kernel/0.5 filter=lfs diff=
|
|
| 171 |
checkpoint_1007000/target.decoder.layers_15.mlp.wi_0.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 172 |
checkpoint_1007000/target.decoder.layers_15.mlp.wi_0.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 173 |
checkpoint_1007000/target.decoder.layers_15.mlp.wi_0.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 171 |
checkpoint_1007000/target.decoder.layers_15.mlp.wi_0.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 172 |
checkpoint_1007000/target.decoder.layers_15.mlp.wi_0.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 173 |
checkpoint_1007000/target.decoder.layers_15.mlp.wi_0.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 174 |
+
checkpoint_1007000/target.encoder.layers_17.mlp.wi_0.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 175 |
+
checkpoint_1007000/target.encoder.layers_17.mlp.wi_0.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 176 |
+
checkpoint_1007000/target.encoder.layers_17.mlp.wi_0.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 177 |
+
checkpoint_1007000/target.encoder.layers_17.mlp.wi_0.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 178 |
+
checkpoint_1007000/target.encoder.layers_17.mlp.wi_0.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 179 |
+
checkpoint_1007000/target.encoder.layers_17.mlp.wi_0.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 180 |
+
checkpoint_1007000/target.encoder.layers_17.mlp.wi_0.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 181 |
+
checkpoint_1007000/target.encoder.layers_17.mlp.wi_0.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 182 |
+
checkpoint_1007000/target.decoder.layers_4.encoder_decoder_attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 183 |
+
checkpoint_1007000/target.decoder.layers_4.encoder_decoder_attention.key.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 184 |
+
checkpoint_1007000/target.decoder.layers_4.encoder_decoder_attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 185 |
+
checkpoint_1007000/target.decoder.layers_4.encoder_decoder_attention.key.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 186 |
+
checkpoint_1007000/target.decoder.layers_4.encoder_decoder_attention.key.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 187 |
+
checkpoint_1007000/target.decoder.layers_4.encoder_decoder_attention.key.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 188 |
+
checkpoint_1007000/target.decoder.layers_4.encoder_decoder_attention.key.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 189 |
+
checkpoint_1007000/target.decoder.layers_4.encoder_decoder_attention.key.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 190 |
+
checkpoint_1007000/target.decoder.layers_11.encoder_decoder_attention.value.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 191 |
+
checkpoint_1007000/target.decoder.layers_11.encoder_decoder_attention.value.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 192 |
+
checkpoint_1007000/target.decoder.layers_11.encoder_decoder_attention.value.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 193 |
+
checkpoint_1007000/target.decoder.layers_11.encoder_decoder_attention.value.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 194 |
+
checkpoint_1007000/target.decoder.layers_11.encoder_decoder_attention.value.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 195 |
+
checkpoint_1007000/target.decoder.layers_11.encoder_decoder_attention.value.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 196 |
+
checkpoint_1007000/target.decoder.layers_11.encoder_decoder_attention.value.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 197 |
+
checkpoint_1007000/target.decoder.layers_11.encoder_decoder_attention.value.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 198 |
+
checkpoint_1007000/target.decoder.layers_23.self_attention.out.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
|
| 199 |
+
checkpoint_1007000/target.decoder.layers_23.self_attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 200 |
+
checkpoint_1007000/target.decoder.layers_23.self_attention.out.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 201 |
+
checkpoint_1007000/target.decoder.layers_23.self_attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 202 |
+
checkpoint_1007000/target.decoder.layers_23.self_attention.out.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
|
| 203 |
+
checkpoint_1007000/target.decoder.layers_23.self_attention.out.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
|
| 204 |
+
checkpoint_1007000/target.decoder.layers_23.self_attention.out.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 205 |
+
checkpoint_1007000/target.decoder.layers_23.self_attention.out.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
|
| 206 |
+
checkpoint_1007000/target.encoder.layers_18.mlp.wi_1.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 207 |
+
checkpoint_1007000/target.encoder.layers_18.mlp.wi_1.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 208 |
+
checkpoint_1007000/target.encoder.layers_18.mlp.wi_1.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 209 |
+
checkpoint_1007000/target.encoder.layers_18.mlp.wi_1.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 210 |
+
checkpoint_1007000/target.encoder.layers_18.mlp.wi_1.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 211 |
+
checkpoint_1007000/target.encoder.layers_18.mlp.wi_1.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 212 |
+
checkpoint_1007000/target.encoder.layers_18.mlp.wi_1.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 213 |
+
checkpoint_1007000/target.encoder.layers_18.mlp.wi_1.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 214 |
+
checkpoint_1007000/target.decoder.layers_3.encoder_decoder_attention.value.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 215 |
+
checkpoint_1007000/target.decoder.layers_3.encoder_decoder_attention.value.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 216 |
+
checkpoint_1007000/target.decoder.layers_3.encoder_decoder_attention.value.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 217 |
+
checkpoint_1007000/target.decoder.layers_3.encoder_decoder_attention.value.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 218 |
+
checkpoint_1007000/target.decoder.layers_3.encoder_decoder_attention.value.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 219 |
+
checkpoint_1007000/target.decoder.layers_3.encoder_decoder_attention.value.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 220 |
+
checkpoint_1007000/target.decoder.layers_3.encoder_decoder_attention.value.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 221 |
+
checkpoint_1007000/target.decoder.layers_3.encoder_decoder_attention.value.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 222 |
+
checkpoint_1007000/target.decoder.layers_13.encoder_decoder_attention.out.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
|
| 223 |
+
checkpoint_1007000/target.decoder.layers_13.encoder_decoder_attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 224 |
+
checkpoint_1007000/target.decoder.layers_13.encoder_decoder_attention.out.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 225 |
+
checkpoint_1007000/target.decoder.layers_13.encoder_decoder_attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 226 |
+
checkpoint_1007000/target.decoder.layers_13.encoder_decoder_attention.out.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
|
checkpoint_1007000/state.param_states.decoder.layers_15.pre_mlp_layer_norm.scale.v/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/state.param_states.decoder.layers_15.pre_mlp_layer_norm.scale.v/0
ADDED
|
Binary file (14.9 kB). View file
|
|
|
checkpoint_1007000/state.param_states.decoder.layers_2.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/state.param_states.decoder.layers_2.pre_self_attention_layer_norm.scale.v/0
ADDED
|
Binary file (14.9 kB). View file
|
|
|
checkpoint_1007000/state.param_states.encoder.layers_4.pre_attention_layer_norm.scale.v/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/state.param_states.encoder.layers_4.pre_attention_layer_norm.scale.v/0
ADDED
|
Binary file (15.3 kB). View file
|
|
|
checkpoint_1007000/target.decoder.layers_11.encoder_decoder_attention.value.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_11.encoder_decoder_attention.value.kernel/.zarray.__tmp10961565108918062831.~1663960300886268~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_11.encoder_decoder_attention.value.kernel/.zarray.__tmp11793943505122929052.~1663960300505221~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_11.encoder_decoder_attention.value.kernel/.zarray.__tmp1440098945699490157.~1663960300551568~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_11.encoder_decoder_attention.value.kernel/.zarray.__tmp14628425770511553113.~1663960300312599~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_11.encoder_decoder_attention.value.kernel/.zarray.__tmp18297844883934390469.~1663960300494925~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_11.encoder_decoder_attention.value.kernel/.zarray.__tmp5864613505269189558.~1663960300425303~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_11.encoder_decoder_attention.value.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:90c9202ca5e5fb3a2aa8667ebc11c696e348c7d7294a4f486ccdd7617959c0b5
|
| 3 |
+
size 7807159
|
checkpoint_1007000/target.decoder.layers_11.encoder_decoder_attention.value.kernel/0.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:569e5d696789228c98b20d6eadc4c084b39d92d16de38cd26847217f6f8f9aa4
|
| 3 |
+
size 7803093
|
checkpoint_1007000/target.decoder.layers_11.encoder_decoder_attention.value.kernel/0.2
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d19aae8e6a35d38ea596e8172a5c0a4f8f3f7f480dd7b006d498593d48e41d1a
|
| 3 |
+
size 7800620
|
checkpoint_1007000/target.decoder.layers_11.encoder_decoder_attention.value.kernel/0.3
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c376752ee217f9e951b7817b95616974b9671068f0661cddc7db8812775ea3fe
|
| 3 |
+
size 7800512
|
checkpoint_1007000/target.decoder.layers_11.encoder_decoder_attention.value.kernel/0.4
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c2197d856500ad390245050f46333b81f46bcfc1ae18f2bd33567254cb44810f
|
| 3 |
+
size 7802077
|
checkpoint_1007000/target.decoder.layers_11.encoder_decoder_attention.value.kernel/0.5
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d712262698bf9d323568301ee3309c5ce4da7b39e6fd23998de227b90012378f
|
| 3 |
+
size 7801706
|
checkpoint_1007000/target.decoder.layers_11.encoder_decoder_attention.value.kernel/0.6
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f8e206778aebad42372c5be8e83536ff04d60b1f0000f76f30c7dea8472aa883
|
| 3 |
+
size 7801882
|
checkpoint_1007000/target.decoder.layers_11.encoder_decoder_attention.value.kernel/0.7
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5b2eb1e8a794bab31e1efb00844560b8f03b47a3b7dd48a3ac371a2e2897c52a
|
| 3 |
+
size 7801473
|
checkpoint_1007000/target.decoder.layers_13.encoder_decoder_attention.out.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bdb22f13224efe375960573e53d76fba304b3060484ee22dd2155a76a3cfd0b6
|
| 3 |
+
size 7820889
|
checkpoint_1007000/target.decoder.layers_13.encoder_decoder_attention.out.kernel/1.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e56680b2d21f9d8572593eb66ab7570bc2892be102b49c6046415bcc17fc270c
|
| 3 |
+
size 7819170
|
checkpoint_1007000/target.decoder.layers_13.encoder_decoder_attention.out.kernel/3.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c35a63d62b381ece9da62fc3914d1123a58d2dc109aa0e4a93d7fa9be391d207
|
| 3 |
+
size 7820038
|
checkpoint_1007000/target.decoder.layers_13.encoder_decoder_attention.out.kernel/6.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3b7b0ac3a91278650e3b24d806f278487abcb420087fa54230895a5ca8f6c6f6
|
| 3 |
+
size 7820254
|
checkpoint_1007000/target.decoder.layers_13.encoder_decoder_attention.out.kernel/7.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5b09510f34d4be78e56384341a5c8806819a24e2f2e37bbb65a0c882eb171602
|
| 3 |
+
size 7819902
|
checkpoint_1007000/target.decoder.layers_22.pre_cross_attention_layer_norm.scale/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_22.pre_cross_attention_layer_norm.scale/0
ADDED
|
Binary file (14.4 kB). View file
|
|
|
checkpoint_1007000/target.decoder.layers_23.self_attention.out.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_23.self_attention.out.kernel/.zarray.__tmp12830070173218396735.~1663960300549727~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_23.self_attention.out.kernel/.zarray.__tmp13183448119106705620.~1663960300385289~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_23.self_attention.out.kernel/.zarray.__tmp15752704559821348252.~1663960300686341~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_23.self_attention.out.kernel/.zarray.__tmp464211840814670155.~1663960300776596~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_23.self_attention.out.kernel/.zarray.__tmp6750169135918407256.~1663960300872835~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_23.self_attention.out.kernel/.zarray.__tmp7187338248637227935.~1663960300886001~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_23.self_attention.out.kernel/.zarray.__tmp9319007599745864122.~1663960300351256~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_23.self_attention.out.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9fd961bf37fbec24764a16aff20a002216bf3f7c82f5c860c9f0328814e3a911
|
| 3 |
+
size 7799538
|
checkpoint_1007000/target.decoder.layers_23.self_attention.out.kernel/1.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:994beed721b0806bd963f744990ae598e74b053cd8d7f4e75401b2d155d93d00
|
| 3 |
+
size 7805374
|
checkpoint_1007000/target.decoder.layers_23.self_attention.out.kernel/2.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:403f162887853ea97a5ea44c2125300183656ae2e01874a801effa941b002509
|
| 3 |
+
size 7803732
|
checkpoint_1007000/target.decoder.layers_23.self_attention.out.kernel/3.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:55952d638b3750fb9d99b95da16da4c2a9687799018c95a6259d6ec895235565
|
| 3 |
+
size 7810296
|
checkpoint_1007000/target.decoder.layers_23.self_attention.out.kernel/4.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:60a564ef1e01718bd811b4880b32a4015f4469db6f02ea8e2964ceb6c9813fe8
|
| 3 |
+
size 7807573
|
checkpoint_1007000/target.decoder.layers_23.self_attention.out.kernel/5.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ded9f6261b5cc982f4e06136bc32bebc20f767d262b4b4333d855cbb90dee23d
|
| 3 |
+
size 7803713
|
checkpoint_1007000/target.decoder.layers_23.self_attention.out.kernel/6.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b8f0d9e5cc20927dea18009eaab2e46825e460ee6e48391e57738bd074943b2a
|
| 3 |
+
size 7801571
|
checkpoint_1007000/target.decoder.layers_23.self_attention.out.kernel/7.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e2416339f505940a7e7dbbd87b4a6dcfb7648dfa2650ec1aaed129cb72331336
|
| 3 |
+
size 7805580
|
checkpoint_1007000/target.decoder.layers_3.encoder_decoder_attention.value.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_3.encoder_decoder_attention.value.kernel/.zarray.__tmp11933270201289857914.~1663960300307662~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_3.encoder_decoder_attention.value.kernel/.zarray.__tmp1696731562003538842.~1663960300312759~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_3.encoder_decoder_attention.value.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:dfe31aad0748136710555d63a57daed3dcd52bfa3a7fcad3fc3ac7cbeb05231b
|
| 3 |
+
size 7817313
|
checkpoint_1007000/target.decoder.layers_3.encoder_decoder_attention.value.kernel/0.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0db9fe80e418090a1aa80abfb1769af91fb6eafe0b822c2cb343afaec0e503dc
|
| 3 |
+
size 7825741
|