Commit
·
e6333a8
1
Parent(s):
a19f67e
Upload part 68
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +45 -0
- checkpoint_1007000/state.param_states.decoder.layers_11.pre_mlp_layer_norm.scale.v/.zarray +1 -0
- checkpoint_1007000/state.param_states.decoder.layers_11.pre_mlp_layer_norm.scale.v/0 +0 -0
- checkpoint_1007000/state.param_states.decoder.layers_2.pre_mlp_layer_norm.scale.v/.zarray +1 -0
- checkpoint_1007000/state.param_states.decoder.layers_2.pre_mlp_layer_norm.scale.v/0 +0 -0
- checkpoint_1007000/state.param_states.decoder.layers_20.pre_mlp_layer_norm.scale.v/.zarray +1 -0
- checkpoint_1007000/state.param_states.decoder.layers_20.pre_mlp_layer_norm.scale.v/0 +0 -0
- checkpoint_1007000/state.param_states.encoder.layers_18.pre_attention_layer_norm.scale.v/.zarray +1 -0
- checkpoint_1007000/state.param_states.encoder.layers_18.pre_attention_layer_norm.scale.v/0 +0 -0
- checkpoint_1007000/target.decoder.layers_19.self_attention.query.kernel/.zarray.__tmp9965845325617335270.~1663960300776928~ +1 -0
- checkpoint_1007000/target.decoder.layers_19.self_attention.query.kernel/0.4 +3 -0
- checkpoint_1007000/target.decoder.layers_20.mlp.wi_0.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_20.mlp.wi_0.kernel/.zarray.__tmp10737010418154130528.~1663960300990168~ +1 -0
- checkpoint_1007000/target.decoder.layers_20.mlp.wi_0.kernel/.zarray.__tmp15085119283178330789.~1663960300553887~ +1 -0
- checkpoint_1007000/target.decoder.layers_20.mlp.wi_0.kernel/.zarray.__tmp17995146359337543296.~1663960300384585~ +1 -0
- checkpoint_1007000/target.decoder.layers_20.mlp.wi_0.kernel/.zarray.__tmp2502237801831035616.~1663960300546685~ +1 -0
- checkpoint_1007000/target.decoder.layers_20.mlp.wi_0.kernel/.zarray.__tmp2850853085514675605.~1663960300891189~ +1 -0
- checkpoint_1007000/target.decoder.layers_20.mlp.wi_0.kernel/.zarray.__tmp4195479506829954279.~1663960300421542~ +1 -0
- checkpoint_1007000/target.decoder.layers_20.mlp.wi_0.kernel/.zarray.__tmp5713260649823328635.~1663960300313238~ +1 -0
- checkpoint_1007000/target.decoder.layers_20.mlp.wi_0.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_20.mlp.wi_0.kernel/0.1 +3 -0
- checkpoint_1007000/target.decoder.layers_20.mlp.wi_0.kernel/0.2 +3 -0
- checkpoint_1007000/target.decoder.layers_20.mlp.wi_0.kernel/0.3 +3 -0
- checkpoint_1007000/target.decoder.layers_20.mlp.wi_0.kernel/0.4 +3 -0
- checkpoint_1007000/target.decoder.layers_20.mlp.wi_0.kernel/0.5 +3 -0
- checkpoint_1007000/target.decoder.layers_20.mlp.wi_0.kernel/0.6 +3 -0
- checkpoint_1007000/target.decoder.layers_20.mlp.wi_0.kernel/0.7 +3 -0
- checkpoint_1007000/target.decoder.layers_5.self_attention.out.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_5.self_attention.out.kernel/.zarray.__tmp12472498129906000649.~1663960300987181~ +1 -0
- checkpoint_1007000/target.decoder.layers_5.self_attention.out.kernel/.zarray.__tmp15997632327377674563.~1663960300385093~ +1 -0
- checkpoint_1007000/target.decoder.layers_5.self_attention.out.kernel/.zarray.__tmp17161090791735915174.~1663960300990295~ +1 -0
- checkpoint_1007000/target.decoder.layers_5.self_attention.out.kernel/.zarray.__tmp17678183565922492582.~1663960300887921~ +1 -0
- checkpoint_1007000/target.decoder.layers_5.self_attention.out.kernel/.zarray.__tmp2311522688625836680.~1663960300632690~ +1 -0
- checkpoint_1007000/target.decoder.layers_5.self_attention.out.kernel/.zarray.__tmp912729723844932576.~1663960300499988~ +1 -0
- checkpoint_1007000/target.decoder.layers_5.self_attention.out.kernel/.zarray.__tmp9597664565037842435.~1663960300550190~ +1 -0
- checkpoint_1007000/target.decoder.layers_5.self_attention.out.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_5.self_attention.out.kernel/1.0 +3 -0
- checkpoint_1007000/target.decoder.layers_5.self_attention.out.kernel/2.0 +3 -0
- checkpoint_1007000/target.decoder.layers_5.self_attention.out.kernel/3.0 +3 -0
- checkpoint_1007000/target.decoder.layers_5.self_attention.out.kernel/4.0 +3 -0
- checkpoint_1007000/target.decoder.layers_5.self_attention.out.kernel/5.0 +3 -0
- checkpoint_1007000/target.decoder.layers_5.self_attention.out.kernel/6.0 +3 -0
- checkpoint_1007000/target.decoder.layers_5.self_attention.out.kernel/7.0 +3 -0
- checkpoint_1007000/target.decoder.layers_5.self_attention.query.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_5.self_attention.query.kernel/.zarray.__tmp10784686010286414521.~1663960300622263~ +1 -0
- checkpoint_1007000/target.decoder.layers_5.self_attention.query.kernel/.zarray.__tmp1264248097414776324.~1663960300599753~ +1 -0
- checkpoint_1007000/target.decoder.layers_5.self_attention.query.kernel/.zarray.__tmp17781551333248209554.~1663960300504701~ +1 -0
- checkpoint_1007000/target.decoder.layers_5.self_attention.query.kernel/.zarray.__tmp187759084959598207.~1663960300730800~ +1 -0
- checkpoint_1007000/target.decoder.layers_5.self_attention.query.kernel/.zarray.__tmp2881458377027394845.~1663960300822313~ +1 -0
- checkpoint_1007000/target.decoder.layers_5.self_attention.query.kernel/.zarray.__tmp4363225482210754279.~1663960300504781~ +1 -0
.gitattributes
CHANGED
|
@@ -3370,3 +3370,48 @@ checkpoint_1007000/target.decoder.layers_19.self_attention.query.kernel/0.6 filt
|
|
| 3370 |
checkpoint_1007000/target.decoder.layers_19.self_attention.query.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 3371 |
checkpoint_1007000/target.decoder.layers_19.self_attention.query.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 3372 |
checkpoint_1007000/target.decoder.layers_19.self_attention.query.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 3370 |
checkpoint_1007000/target.decoder.layers_19.self_attention.query.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 3371 |
checkpoint_1007000/target.decoder.layers_19.self_attention.query.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 3372 |
checkpoint_1007000/target.decoder.layers_19.self_attention.query.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 3373 |
+
checkpoint_1007000/target.decoder.layers_19.self_attention.query.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 3374 |
+
checkpoint_1007000/target.encoder.layers_16.attention.out.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
|
| 3375 |
+
checkpoint_1007000/target.encoder.layers_16.attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 3376 |
+
checkpoint_1007000/target.encoder.layers_16.attention.out.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 3377 |
+
checkpoint_1007000/target.encoder.layers_16.attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 3378 |
+
checkpoint_1007000/target.encoder.layers_16.attention.out.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
|
| 3379 |
+
checkpoint_1007000/target.encoder.layers_16.attention.out.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
|
| 3380 |
+
checkpoint_1007000/target.encoder.layers_16.attention.out.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 3381 |
+
checkpoint_1007000/target.encoder.layers_16.attention.out.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
|
| 3382 |
+
checkpoint_1007000/target.decoder.layers_5.self_attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 3383 |
+
checkpoint_1007000/target.decoder.layers_5.self_attention.query.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 3384 |
+
checkpoint_1007000/target.decoder.layers_5.self_attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 3385 |
+
checkpoint_1007000/target.decoder.layers_5.self_attention.query.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 3386 |
+
checkpoint_1007000/target.decoder.layers_5.self_attention.query.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 3387 |
+
checkpoint_1007000/target.decoder.layers_5.self_attention.query.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 3388 |
+
checkpoint_1007000/target.decoder.layers_5.self_attention.query.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 3389 |
+
checkpoint_1007000/target.decoder.layers_5.self_attention.query.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 3390 |
+
checkpoint_1007000/target.encoder.layers_1.mlp.wo.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
|
| 3391 |
+
checkpoint_1007000/target.encoder.layers_1.mlp.wo.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 3392 |
+
checkpoint_1007000/target.encoder.layers_1.mlp.wo.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 3393 |
+
checkpoint_1007000/target.encoder.layers_1.mlp.wo.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 3394 |
+
checkpoint_1007000/target.encoder.layers_1.mlp.wo.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
|
| 3395 |
+
checkpoint_1007000/target.encoder.layers_1.mlp.wo.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
|
| 3396 |
+
checkpoint_1007000/target.encoder.layers_1.mlp.wo.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 3397 |
+
checkpoint_1007000/target.encoder.layers_1.mlp.wo.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
|
| 3398 |
+
checkpoint_1007000/target.decoder.layers_5.self_attention.out.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
|
| 3399 |
+
checkpoint_1007000/target.decoder.layers_5.self_attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 3400 |
+
checkpoint_1007000/target.decoder.layers_5.self_attention.out.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 3401 |
+
checkpoint_1007000/target.decoder.layers_5.self_attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 3402 |
+
checkpoint_1007000/target.decoder.layers_5.self_attention.out.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
|
| 3403 |
+
checkpoint_1007000/target.decoder.layers_5.self_attention.out.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
|
| 3404 |
+
checkpoint_1007000/target.decoder.layers_5.self_attention.out.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 3405 |
+
checkpoint_1007000/target.decoder.layers_5.self_attention.out.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
|
| 3406 |
+
checkpoint_1007000/target.decoder.layers_20.mlp.wi_0.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 3407 |
+
checkpoint_1007000/target.decoder.layers_20.mlp.wi_0.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 3408 |
+
checkpoint_1007000/target.decoder.layers_20.mlp.wi_0.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 3409 |
+
checkpoint_1007000/target.decoder.layers_20.mlp.wi_0.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 3410 |
+
checkpoint_1007000/target.decoder.layers_20.mlp.wi_0.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 3411 |
+
checkpoint_1007000/target.decoder.layers_20.mlp.wi_0.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 3412 |
+
checkpoint_1007000/target.decoder.layers_20.mlp.wi_0.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 3413 |
+
checkpoint_1007000/target.decoder.layers_20.mlp.wi_0.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 3414 |
+
checkpoint_1007000/target.encoder.layers_1.attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 3415 |
+
checkpoint_1007000/target.encoder.layers_1.attention.key.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 3416 |
+
checkpoint_1007000/target.encoder.layers_1.attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 3417 |
+
checkpoint_1007000/target.encoder.layers_1.attention.key.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
checkpoint_1007000/state.param_states.decoder.layers_11.pre_mlp_layer_norm.scale.v/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/state.param_states.decoder.layers_11.pre_mlp_layer_norm.scale.v/0
ADDED
|
Binary file (14.7 kB). View file
|
|
|
checkpoint_1007000/state.param_states.decoder.layers_2.pre_mlp_layer_norm.scale.v/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/state.param_states.decoder.layers_2.pre_mlp_layer_norm.scale.v/0
ADDED
|
Binary file (14.8 kB). View file
|
|
|
checkpoint_1007000/state.param_states.decoder.layers_20.pre_mlp_layer_norm.scale.v/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/state.param_states.decoder.layers_20.pre_mlp_layer_norm.scale.v/0
ADDED
|
Binary file (14.3 kB). View file
|
|
|
checkpoint_1007000/state.param_states.encoder.layers_18.pre_attention_layer_norm.scale.v/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/state.param_states.encoder.layers_18.pre_attention_layer_norm.scale.v/0
ADDED
|
Binary file (15 kB). View file
|
|
|
checkpoint_1007000/target.decoder.layers_19.self_attention.query.kernel/.zarray.__tmp9965845325617335270.~1663960300776928~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_19.self_attention.query.kernel/0.4
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4edd1f8351210a9443b9c86a37f074379c0a5a6745564c2c87116742898cbabf
|
| 3 |
+
size 7808021
|
checkpoint_1007000/target.decoder.layers_20.mlp.wi_0.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_20.mlp.wi_0.kernel/.zarray.__tmp10737010418154130528.~1663960300990168~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_20.mlp.wi_0.kernel/.zarray.__tmp15085119283178330789.~1663960300553887~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_20.mlp.wi_0.kernel/.zarray.__tmp17995146359337543296.~1663960300384585~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_20.mlp.wi_0.kernel/.zarray.__tmp2502237801831035616.~1663960300546685~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_20.mlp.wi_0.kernel/.zarray.__tmp2850853085514675605.~1663960300891189~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_20.mlp.wi_0.kernel/.zarray.__tmp4195479506829954279.~1663960300421542~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_20.mlp.wi_0.kernel/.zarray.__tmp5713260649823328635.~1663960300313238~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_20.mlp.wi_0.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7b2cd8a0d2f95af5d023fea4f99b25ab22efa91e7c0aebdbba91eaaaddb5f991
|
| 3 |
+
size 19532230
|
checkpoint_1007000/target.decoder.layers_20.mlp.wi_0.kernel/0.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:93504f188626573533e369d40cad516922cd9234ba2dc5318dc0cea8eefa8aa2
|
| 3 |
+
size 19531039
|
checkpoint_1007000/target.decoder.layers_20.mlp.wi_0.kernel/0.2
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b90fc52edb0a7356fdc33b2e3fc6fc8a7fbd47a8b8e6cff369445c33abec6dcc
|
| 3 |
+
size 19532040
|
checkpoint_1007000/target.decoder.layers_20.mlp.wi_0.kernel/0.3
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9e81a1b49f465fa1322333dde569da6fc01cbfc4b795c10dbe8cdede5645abb9
|
| 3 |
+
size 19532134
|
checkpoint_1007000/target.decoder.layers_20.mlp.wi_0.kernel/0.4
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:58d6ab7b8ff335160181a9ba8bff2bf74eac6bb92d0412118f7d6d999fb7ff63
|
| 3 |
+
size 19532775
|
checkpoint_1007000/target.decoder.layers_20.mlp.wi_0.kernel/0.5
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:eeef924c703454dd3280143158db3f634f6bb29ec25dbccaaef2d3bdf9d90743
|
| 3 |
+
size 19532154
|
checkpoint_1007000/target.decoder.layers_20.mlp.wi_0.kernel/0.6
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5e813e9dde4628abb33e6a9bd95f4d2e5dd99b1522291317ba9f4ff68eeaa565
|
| 3 |
+
size 19531998
|
checkpoint_1007000/target.decoder.layers_20.mlp.wi_0.kernel/0.7
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:224b936dcf0f88ae4acae7c4523123173d15acc4abf8d3ea3730ad62f911394c
|
| 3 |
+
size 19532219
|
checkpoint_1007000/target.decoder.layers_5.self_attention.out.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_5.self_attention.out.kernel/.zarray.__tmp12472498129906000649.~1663960300987181~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_5.self_attention.out.kernel/.zarray.__tmp15997632327377674563.~1663960300385093~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_5.self_attention.out.kernel/.zarray.__tmp17161090791735915174.~1663960300990295~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_5.self_attention.out.kernel/.zarray.__tmp17678183565922492582.~1663960300887921~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_5.self_attention.out.kernel/.zarray.__tmp2311522688625836680.~1663960300632690~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_5.self_attention.out.kernel/.zarray.__tmp912729723844932576.~1663960300499988~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_5.self_attention.out.kernel/.zarray.__tmp9597664565037842435.~1663960300550190~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_5.self_attention.out.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:27a3d6ca530d2fc6ea4b07bfea03b159c5119fd4b6e56efc5f134d734fcd832f
|
| 3 |
+
size 7818488
|
checkpoint_1007000/target.decoder.layers_5.self_attention.out.kernel/1.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4623f357c785d32265d8e24d979cd63cb8ea5d0adbbeebfaa8259e92c863baf0
|
| 3 |
+
size 7815514
|
checkpoint_1007000/target.decoder.layers_5.self_attention.out.kernel/2.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:78b5e5e22ac68c54a580d02e9a15698cd19fcf21e6f460c42ca0fcd60f6d9236
|
| 3 |
+
size 7817706
|
checkpoint_1007000/target.decoder.layers_5.self_attention.out.kernel/3.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:434038e3f5fb6258dac91346eecb0af3aed520884bd415b2cc01eb86bce414c8
|
| 3 |
+
size 7822001
|
checkpoint_1007000/target.decoder.layers_5.self_attention.out.kernel/4.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:03154082b286cfd0a05625d7b1bf0d1a1018a0b7119556d6628dd3915aba8ef5
|
| 3 |
+
size 7822051
|
checkpoint_1007000/target.decoder.layers_5.self_attention.out.kernel/5.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:aa27423cf3f3f6f9fd188c1e542296767b7fd1184973bd3131baa910bf732d6b
|
| 3 |
+
size 7820709
|
checkpoint_1007000/target.decoder.layers_5.self_attention.out.kernel/6.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fb06ea6d12ff8410eafc1e1d003b283d80425958dd851b753c45ea3b90a8e46a
|
| 3 |
+
size 7820646
|
checkpoint_1007000/target.decoder.layers_5.self_attention.out.kernel/7.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:71c3c01930b194a7bd0988353a530281cd3b4cdd242700d84073f08127e69272
|
| 3 |
+
size 7817407
|
checkpoint_1007000/target.decoder.layers_5.self_attention.query.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_5.self_attention.query.kernel/.zarray.__tmp10784686010286414521.~1663960300622263~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_5.self_attention.query.kernel/.zarray.__tmp1264248097414776324.~1663960300599753~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_5.self_attention.query.kernel/.zarray.__tmp17781551333248209554.~1663960300504701~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_5.self_attention.query.kernel/.zarray.__tmp187759084959598207.~1663960300730800~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_5.self_attention.query.kernel/.zarray.__tmp2881458377027394845.~1663960300822313~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_5.self_attention.query.kernel/.zarray.__tmp4363225482210754279.~1663960300504781~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|