Commit
·
8c8fd09
1
Parent(s):
51afe23
Upload part 38
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +49 -0
- checkpoint_1007000/state.param_states.decoder.layers_10.pre_mlp_layer_norm.scale.v/.zarray +1 -0
- checkpoint_1007000/state.param_states.decoder.layers_10.pre_mlp_layer_norm.scale.v/0 +0 -0
- checkpoint_1007000/state.param_states.decoder.layers_11.pre_cross_attention_layer_norm.scale.v/.zarray +1 -0
- checkpoint_1007000/state.param_states.decoder.layers_11.pre_cross_attention_layer_norm.scale.v/0 +0 -0
- checkpoint_1007000/state.param_states.encoder.layers_22.pre_attention_layer_norm.scale.v/.zarray +1 -0
- checkpoint_1007000/state.param_states.encoder.layers_22.pre_attention_layer_norm.scale.v/0 +0 -0
- checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.key.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.key.kernel/.zarray.__tmp10666301048271400128.~1663960300601872~ +1 -0
- checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.key.kernel/.zarray.__tmp10824035044865767718.~1663960300467900~ +1 -0
- checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.key.kernel/.zarray.__tmp17491665953918277627.~1663960300775137~ +1 -0
- checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.key.kernel/.zarray.__tmp2698586933318194643.~1663960300493108~ +1 -0
- checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.key.kernel/.zarray.__tmp3063477194367769089.~1663960300728221~ +1 -0
- checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.key.kernel/.zarray.__tmp3629286470904913908.~1663960300685961~ +1 -0
- checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.key.kernel/.zarray.__tmp5154167650306256182.~1663960300499769~ +1 -0
- checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.key.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.key.kernel/0.1 +3 -0
- checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.key.kernel/0.2 +3 -0
- checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.key.kernel/0.3 +3 -0
- checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.key.kernel/0.4 +3 -0
- checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.key.kernel/0.5 +3 -0
- checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.key.kernel/0.6 +3 -0
- checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.key.kernel/0.7 +3 -0
- checkpoint_1007000/target.decoder.layers_20.self_attention.value.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_20.self_attention.value.kernel/.zarray.__tmp12292122855751842815.~1663960300886463~ +1 -0
- checkpoint_1007000/target.decoder.layers_20.self_attention.value.kernel/.zarray.__tmp12729170680231462171.~1663960300775671~ +1 -0
- checkpoint_1007000/target.decoder.layers_20.self_attention.value.kernel/.zarray.__tmp16288759272656539980.~1663960300622392~ +1 -0
- checkpoint_1007000/target.decoder.layers_20.self_attention.value.kernel/.zarray.__tmp2097918179125387591.~1663960300471042~ +1 -0
- checkpoint_1007000/target.decoder.layers_20.self_attention.value.kernel/.zarray.__tmp27539476875501871.~1663960300685425~ +1 -0
- checkpoint_1007000/target.decoder.layers_20.self_attention.value.kernel/.zarray.__tmp3982320326126219065.~1663960300498267~ +1 -0
- checkpoint_1007000/target.decoder.layers_20.self_attention.value.kernel/.zarray.__tmp4583192192703197948.~1663960300627170~ +1 -0
- checkpoint_1007000/target.decoder.layers_20.self_attention.value.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_20.self_attention.value.kernel/0.1 +3 -0
- checkpoint_1007000/target.decoder.layers_20.self_attention.value.kernel/0.2 +3 -0
- checkpoint_1007000/target.decoder.layers_20.self_attention.value.kernel/0.3 +3 -0
- checkpoint_1007000/target.decoder.layers_20.self_attention.value.kernel/0.4 +3 -0
- checkpoint_1007000/target.decoder.layers_20.self_attention.value.kernel/0.5 +3 -0
- checkpoint_1007000/target.decoder.layers_20.self_attention.value.kernel/0.6 +3 -0
- checkpoint_1007000/target.decoder.layers_20.self_attention.value.kernel/0.7 +3 -0
- checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.out.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.out.kernel/.zarray.__tmp10521466314548349909.~1663960300623733~ +1 -0
- checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.out.kernel/.zarray.__tmp1268806510747428351.~1663960300776988~ +1 -0
- checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.out.kernel/.zarray.__tmp5157424613732213906.~1663960301026243~ +1 -0
- checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.out.kernel/.zarray.__tmp6307815978816431402.~1663960300500621~ +1 -0
- checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.out.kernel/.zarray.__tmp7128591363366176481.~1663960300865877~ +1 -0
- checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.out.kernel/.zarray.__tmp7446400039440086678.~1663960300687825~ +1 -0
- checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.out.kernel/.zarray.__tmp7547867216114642093.~1663960300891116~ +1 -0
- checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.out.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.out.kernel/1.0 +3 -0
- checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.out.kernel/2.0 +3 -0
.gitattributes
CHANGED
|
@@ -1941,3 +1941,52 @@ checkpoint_1007000/target.decoder.layers_13.encoder_decoder_attention.key.kernel
|
|
| 1941 |
checkpoint_1007000/target.decoder.layers_13.encoder_decoder_attention.key.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 1942 |
checkpoint_1007000/target.decoder.layers_7.encoder_decoder_attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 1943 |
checkpoint_1007000/target.decoder.layers_7.encoder_decoder_attention.key.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1941 |
checkpoint_1007000/target.decoder.layers_13.encoder_decoder_attention.key.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 1942 |
checkpoint_1007000/target.decoder.layers_7.encoder_decoder_attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 1943 |
checkpoint_1007000/target.decoder.layers_7.encoder_decoder_attention.key.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 1944 |
+
checkpoint_1007000/target.decoder.layers_7.encoder_decoder_attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 1945 |
+
checkpoint_1007000/target.decoder.layers_7.encoder_decoder_attention.key.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 1946 |
+
checkpoint_1007000/target.decoder.layers_7.encoder_decoder_attention.key.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 1947 |
+
checkpoint_1007000/target.decoder.layers_7.encoder_decoder_attention.key.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 1948 |
+
checkpoint_1007000/target.decoder.layers_7.encoder_decoder_attention.key.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 1949 |
+
checkpoint_1007000/target.decoder.layers_7.encoder_decoder_attention.key.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 1950 |
+
checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 1951 |
+
checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.key.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 1952 |
+
checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 1953 |
+
checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.key.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 1954 |
+
checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.key.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 1955 |
+
checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.key.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 1956 |
+
checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.key.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 1957 |
+
checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.key.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 1958 |
+
checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.out.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
|
| 1959 |
+
checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 1960 |
+
checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.out.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 1961 |
+
checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 1962 |
+
checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.out.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
|
| 1963 |
+
checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.out.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
|
| 1964 |
+
checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.out.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 1965 |
+
checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.out.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
|
| 1966 |
+
checkpoint_1007000/target.encoder.layers_17.mlp.wo.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
|
| 1967 |
+
checkpoint_1007000/target.encoder.layers_17.mlp.wo.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 1968 |
+
checkpoint_1007000/target.encoder.layers_17.mlp.wo.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 1969 |
+
checkpoint_1007000/target.encoder.layers_17.mlp.wo.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 1970 |
+
checkpoint_1007000/target.encoder.layers_17.mlp.wo.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
|
| 1971 |
+
checkpoint_1007000/target.encoder.layers_17.mlp.wo.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
|
| 1972 |
+
checkpoint_1007000/target.encoder.layers_17.mlp.wo.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 1973 |
+
checkpoint_1007000/target.encoder.layers_17.mlp.wo.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
|
| 1974 |
+
checkpoint_1007000/target.decoder.layers_20.self_attention.value.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 1975 |
+
checkpoint_1007000/target.decoder.layers_20.self_attention.value.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 1976 |
+
checkpoint_1007000/target.decoder.layers_20.self_attention.value.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 1977 |
+
checkpoint_1007000/target.decoder.layers_20.self_attention.value.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 1978 |
+
checkpoint_1007000/target.decoder.layers_20.self_attention.value.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 1979 |
+
checkpoint_1007000/target.decoder.layers_20.self_attention.value.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 1980 |
+
checkpoint_1007000/target.decoder.layers_20.self_attention.value.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 1981 |
+
checkpoint_1007000/target.decoder.layers_20.self_attention.value.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 1982 |
+
checkpoint_1007000/target.decoder.layers_9.mlp.wo.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
|
| 1983 |
+
checkpoint_1007000/target.decoder.layers_9.mlp.wo.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 1984 |
+
checkpoint_1007000/target.decoder.layers_9.mlp.wo.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 1985 |
+
checkpoint_1007000/target.decoder.layers_9.mlp.wo.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 1986 |
+
checkpoint_1007000/target.decoder.layers_9.mlp.wo.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
|
| 1987 |
+
checkpoint_1007000/target.decoder.layers_9.mlp.wo.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
|
| 1988 |
+
checkpoint_1007000/target.decoder.layers_9.mlp.wo.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 1989 |
+
checkpoint_1007000/target.decoder.layers_9.mlp.wo.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
|
| 1990 |
+
checkpoint_1007000/target.encoder.layers_2.attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 1991 |
+
checkpoint_1007000/target.encoder.layers_2.attention.key.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 1992 |
+
checkpoint_1007000/target.encoder.layers_2.attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
checkpoint_1007000/state.param_states.decoder.layers_10.pre_mlp_layer_norm.scale.v/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/state.param_states.decoder.layers_10.pre_mlp_layer_norm.scale.v/0
ADDED
|
Binary file (14.7 kB). View file
|
|
|
checkpoint_1007000/state.param_states.decoder.layers_11.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/state.param_states.decoder.layers_11.pre_cross_attention_layer_norm.scale.v/0
ADDED
|
Binary file (14.8 kB). View file
|
|
|
checkpoint_1007000/state.param_states.encoder.layers_22.pre_attention_layer_norm.scale.v/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/state.param_states.encoder.layers_22.pre_attention_layer_norm.scale.v/0
ADDED
|
Binary file (14.7 kB). View file
|
|
|
checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.key.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.key.kernel/.zarray.__tmp10666301048271400128.~1663960300601872~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.key.kernel/.zarray.__tmp10824035044865767718.~1663960300467900~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.key.kernel/.zarray.__tmp17491665953918277627.~1663960300775137~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.key.kernel/.zarray.__tmp2698586933318194643.~1663960300493108~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.key.kernel/.zarray.__tmp3063477194367769089.~1663960300728221~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.key.kernel/.zarray.__tmp3629286470904913908.~1663960300685961~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.key.kernel/.zarray.__tmp5154167650306256182.~1663960300499769~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.key.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:032375b7f17b22d771bd0020429fa616e224566883048698b82fd3b42e509427
|
| 3 |
+
size 7812332
|
checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.key.kernel/0.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:68f0450f185321f03b135f8ff09246f3f7ec1816ce112761991cc48b8fda3e8c
|
| 3 |
+
size 7812660
|
checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.key.kernel/0.2
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:291c660532e38959ff70eb206b6d27fa4da2b2cf6fa8c4e436b81f5bddaf1617
|
| 3 |
+
size 7809139
|
checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.key.kernel/0.3
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cdba720983884ce8405ad6ce311c5d853b35e8a3b5a4a72027c818f66f669f02
|
| 3 |
+
size 7810129
|
checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.key.kernel/0.4
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:72ba2c6261edbb62277ba045a91c28b20fef9ffc4b50e84534cbb158419a64b2
|
| 3 |
+
size 7810466
|
checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.key.kernel/0.5
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6a74663521ab7b3ecc10255c186ae1d14ad14e96826a4db34e14fb86c47d57ad
|
| 3 |
+
size 7814949
|
checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.key.kernel/0.6
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:09e3d94c7ec301f6390077762054354c0fcfd0e64d226d2c89fcb74e4ed6677e
|
| 3 |
+
size 7808788
|
checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.key.kernel/0.7
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a7ae4715414d9737cc9fa3a13221d8a6dd9a41d1cc86ce0f7e11d198e2aa96c0
|
| 3 |
+
size 7815597
|
checkpoint_1007000/target.decoder.layers_20.self_attention.value.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_20.self_attention.value.kernel/.zarray.__tmp12292122855751842815.~1663960300886463~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_20.self_attention.value.kernel/.zarray.__tmp12729170680231462171.~1663960300775671~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_20.self_attention.value.kernel/.zarray.__tmp16288759272656539980.~1663960300622392~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_20.self_attention.value.kernel/.zarray.__tmp2097918179125387591.~1663960300471042~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_20.self_attention.value.kernel/.zarray.__tmp27539476875501871.~1663960300685425~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_20.self_attention.value.kernel/.zarray.__tmp3982320326126219065.~1663960300498267~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_20.self_attention.value.kernel/.zarray.__tmp4583192192703197948.~1663960300627170~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_20.self_attention.value.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:18e568963ea246fa4c96d9507370641c8b05c3f2b1ccae7c891f0ee063cc997c
|
| 3 |
+
size 7824823
|
checkpoint_1007000/target.decoder.layers_20.self_attention.value.kernel/0.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d3f1f3a96ad7c6a1331e850a7c197b91bb73b9af629e38437170681d61b0f828
|
| 3 |
+
size 7817700
|
checkpoint_1007000/target.decoder.layers_20.self_attention.value.kernel/0.2
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:67fabd789ec771df19421123c323a2f6e1cc2c61607759f43e5f66b2b53224ed
|
| 3 |
+
size 7819162
|
checkpoint_1007000/target.decoder.layers_20.self_attention.value.kernel/0.3
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:44375ccd546fbe9522b4ca02179b58ba2cf1e174954c3c74ea7b7f6ad87b3814
|
| 3 |
+
size 7806485
|
checkpoint_1007000/target.decoder.layers_20.self_attention.value.kernel/0.4
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c735eece22368768f537e6cbb51bfb6dcac3820ac98d552f11d3653d7ab8b4c3
|
| 3 |
+
size 7841992
|
checkpoint_1007000/target.decoder.layers_20.self_attention.value.kernel/0.5
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4a57bea9076d1b273248ede820670f20906fcc891448ad05e45ca66af2a97a3e
|
| 3 |
+
size 7806791
|
checkpoint_1007000/target.decoder.layers_20.self_attention.value.kernel/0.6
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:51870d868570ba8c0f9fe8925511883f27038c43b9e30d235a915750630b6814
|
| 3 |
+
size 7837160
|
checkpoint_1007000/target.decoder.layers_20.self_attention.value.kernel/0.7
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:05cb07201e1921a2ea5b8a2565defc464f8ff5b54e43fd3e4182b848f4026922
|
| 3 |
+
size 7807011
|
checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.out.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.out.kernel/.zarray.__tmp10521466314548349909.~1663960300623733~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.out.kernel/.zarray.__tmp1268806510747428351.~1663960300776988~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.out.kernel/.zarray.__tmp5157424613732213906.~1663960301026243~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.out.kernel/.zarray.__tmp6307815978816431402.~1663960300500621~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.out.kernel/.zarray.__tmp7128591363366176481.~1663960300865877~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.out.kernel/.zarray.__tmp7446400039440086678.~1663960300687825~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.out.kernel/.zarray.__tmp7547867216114642093.~1663960300891116~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.out.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:896ef7c9ecff55837ea9d4c8216749900b5cc1ed23413c6bac17e2ba3a6ba16e
|
| 3 |
+
size 7799623
|
checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.out.kernel/1.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:581c455bbebe40adcc8ece3e4fe2417feb72fa96535b23071f5584a891f544e7
|
| 3 |
+
size 7801952
|
checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.out.kernel/2.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7b93228b4bffddaee05d244ad6e987ddf7895ab8f7d77a16ab335afebc63aae3
|
| 3 |
+
size 7803410
|