TimeRobber committed on
Commit
eeee4a0
·
1 Parent(s): 0f3aef5

Upload part 40

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. .gitattributes +48 -0
  2. checkpoint_1007000/state.param_states.encoder.layers_12.pre_attention_layer_norm.scale.v/.zarray +1 -0
  3. checkpoint_1007000/state.param_states.encoder.layers_12.pre_attention_layer_norm.scale.v/0 +0 -0
  4. checkpoint_1007000/state.param_states.encoder.layers_19.pre_mlp_layer_norm.scale.v/.zarray +1 -0
  5. checkpoint_1007000/state.param_states.encoder.layers_19.pre_mlp_layer_norm.scale.v/0 +0 -0
  6. checkpoint_1007000/target.decoder.decoder_norm.scale/.zarray +1 -0
  7. checkpoint_1007000/target.decoder.decoder_norm.scale/0 +0 -0
  8. checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/.zarray +1 -0
  9. checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/.zarray.__tmp15590069018174250927.~1663960300308256~ +1 -0
  10. checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/.zarray.__tmp15744899109354973635.~1663960300421932~ +1 -0
  11. checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/.zarray.__tmp18375236708728796867.~1663960300688867~ +1 -0
  12. checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/.zarray.__tmp2103911721188231572.~1663960300822920~ +1 -0
  13. checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/.zarray.__tmp4333629875821823980.~1663960300551128~ +1 -0
  14. checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/.zarray.__tmp7696852913333449298.~1663960300272803~ +1 -0
  15. checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/.zarray.__tmp9885211211724445706.~1663960300632501~ +1 -0
  16. checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/0.0 +3 -0
  17. checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/0.1 +3 -0
  18. checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/0.2 +3 -0
  19. checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/0.3 +3 -0
  20. checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/0.4 +3 -0
  21. checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/0.5 +3 -0
  22. checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/0.6 +3 -0
  23. checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/0.7 +3 -0
  24. checkpoint_1007000/target.decoder.layers_16.encoder_decoder_attention.query.kernel/.zarray.__tmp14275400193037987122.~1663960300384017~ +1 -0
  25. checkpoint_1007000/target.decoder.layers_16.encoder_decoder_attention.query.kernel/.zarray.__tmp5453924144578779166.~1663960300467517~ +1 -0
  26. checkpoint_1007000/target.decoder.layers_16.encoder_decoder_attention.query.kernel/0.0 +3 -0
  27. checkpoint_1007000/target.decoder.layers_16.encoder_decoder_attention.query.kernel/0.1 +3 -0
  28. checkpoint_1007000/target.decoder.layers_16.encoder_decoder_attention.query.kernel/0.6 +3 -0
  29. checkpoint_1007000/target.decoder.layers_16.encoder_decoder_attention.query.kernel/0.7 +3 -0
  30. checkpoint_1007000/target.decoder.layers_2.self_attention.value.kernel/.zarray.__tmp14805654823044195203.~1663960300941182~ +1 -0
  31. checkpoint_1007000/target.decoder.layers_2.self_attention.value.kernel/.zarray.__tmp18402290304374832220.~1663960300610766~ +1 -0
  32. checkpoint_1007000/target.decoder.layers_2.self_attention.value.kernel/.zarray.__tmp6102370472552948078.~1663960300501139~ +1 -0
  33. checkpoint_1007000/target.decoder.layers_2.self_attention.value.kernel/.zarray.__tmp6369220955053798728.~1663960300890367~ +1 -0
  34. checkpoint_1007000/target.decoder.layers_2.self_attention.value.kernel/.zarray.__tmp7004825582130560441.~1663960300601053~ +1 -0
  35. checkpoint_1007000/target.decoder.layers_2.self_attention.value.kernel/0.2 +3 -0
  36. checkpoint_1007000/target.decoder.layers_2.self_attention.value.kernel/0.3 +3 -0
  37. checkpoint_1007000/target.decoder.layers_2.self_attention.value.kernel/0.4 +3 -0
  38. checkpoint_1007000/target.decoder.layers_2.self_attention.value.kernel/0.5 +3 -0
  39. checkpoint_1007000/target.decoder.layers_21.mlp.wi_1.kernel/.zarray +1 -0
  40. checkpoint_1007000/target.decoder.layers_21.mlp.wi_1.kernel/.zarray.__tmp13176058321298810016.~1663960300549058~ +1 -0
  41. checkpoint_1007000/target.decoder.layers_21.mlp.wi_1.kernel/.zarray.__tmp1715683602810787734.~1663960300986925~ +1 -0
  42. checkpoint_1007000/target.decoder.layers_21.mlp.wi_1.kernel/.zarray.__tmp1806355867141919373.~1663960300862420~ +1 -0
  43. checkpoint_1007000/target.decoder.layers_21.mlp.wi_1.kernel/.zarray.__tmp18355203970343633918.~1663960300466384~ +1 -0
  44. checkpoint_1007000/target.decoder.layers_21.mlp.wi_1.kernel/.zarray.__tmp18395826612412633390.~1663960300551073~ +1 -0
  45. checkpoint_1007000/target.decoder.layers_21.mlp.wi_1.kernel/.zarray.__tmp8508567864372588290.~1663960300472419~ +1 -0
  46. checkpoint_1007000/target.decoder.layers_21.mlp.wi_1.kernel/.zarray.__tmp9748784751914184662.~1663960300602153~ +1 -0
  47. checkpoint_1007000/target.decoder.layers_21.mlp.wi_1.kernel/0.0 +3 -0
  48. checkpoint_1007000/target.decoder.layers_21.mlp.wi_1.kernel/0.1 +3 -0
  49. checkpoint_1007000/target.decoder.layers_21.mlp.wi_1.kernel/0.2 +3 -0
  50. checkpoint_1007000/target.decoder.layers_21.mlp.wi_1.kernel/0.3 +3 -0
.gitattributes CHANGED
@@ -2039,3 +2039,51 @@ checkpoint_1007000/target.decoder.layers_2.self_attention.value.kernel/0.1 filte
2039
  checkpoint_1007000/target.decoder.layers_2.self_attention.value.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
2040
  checkpoint_1007000/target.decoder.layers_2.self_attention.value.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
2041
  checkpoint_1007000/target.decoder.layers_2.self_attention.value.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2039
  checkpoint_1007000/target.decoder.layers_2.self_attention.value.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
2040
  checkpoint_1007000/target.decoder.layers_2.self_attention.value.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
2041
  checkpoint_1007000/target.decoder.layers_2.self_attention.value.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
2042
+ checkpoint_1007000/target.decoder.layers_2.self_attention.value.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
2043
+ checkpoint_1007000/target.decoder.layers_2.self_attention.value.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
2044
+ checkpoint_1007000/target.decoder.layers_2.self_attention.value.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
2045
+ checkpoint_1007000/target.decoder.layers_2.self_attention.value.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
2046
+ checkpoint_1007000/target.encoder.layers_18.mlp.wi_0.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
2047
+ checkpoint_1007000/target.encoder.layers_18.mlp.wi_0.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
2048
+ checkpoint_1007000/target.encoder.layers_18.mlp.wi_0.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
2049
+ checkpoint_1007000/target.encoder.layers_18.mlp.wi_0.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
2050
+ checkpoint_1007000/target.encoder.layers_18.mlp.wi_0.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
2051
+ checkpoint_1007000/target.encoder.layers_18.mlp.wi_0.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
2052
+ checkpoint_1007000/target.encoder.layers_18.mlp.wi_0.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
2053
+ checkpoint_1007000/target.encoder.layers_18.mlp.wi_0.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
2054
+ checkpoint_1007000/target.decoder.layers_21.mlp.wi_1.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
2055
+ checkpoint_1007000/target.decoder.layers_21.mlp.wi_1.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
2056
+ checkpoint_1007000/target.decoder.layers_21.mlp.wi_1.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
2057
+ checkpoint_1007000/target.decoder.layers_21.mlp.wi_1.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
2058
+ checkpoint_1007000/target.decoder.layers_21.mlp.wi_1.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
2059
+ checkpoint_1007000/target.decoder.layers_21.mlp.wi_1.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
2060
+ checkpoint_1007000/target.decoder.layers_21.mlp.wi_1.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
2061
+ checkpoint_1007000/target.decoder.layers_21.mlp.wi_1.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
2062
+ checkpoint_1007000/target.encoder.layers_4.mlp.wo.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
2063
+ checkpoint_1007000/target.encoder.layers_4.mlp.wo.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
2064
+ checkpoint_1007000/target.encoder.layers_4.mlp.wo.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
2065
+ checkpoint_1007000/target.encoder.layers_4.mlp.wo.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
2066
+ checkpoint_1007000/target.encoder.layers_4.mlp.wo.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
2067
+ checkpoint_1007000/target.encoder.layers_4.mlp.wo.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
2068
+ checkpoint_1007000/target.encoder.layers_4.mlp.wo.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
2069
+ checkpoint_1007000/target.encoder.layers_4.mlp.wo.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
2070
+ checkpoint_1007000/target.decoder.layers_9.encoder_decoder_attention.value.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
2071
+ checkpoint_1007000/target.decoder.layers_9.encoder_decoder_attention.value.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
2072
+ checkpoint_1007000/target.decoder.layers_9.encoder_decoder_attention.value.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
2073
+ checkpoint_1007000/target.decoder.layers_9.encoder_decoder_attention.value.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
2074
+ checkpoint_1007000/target.decoder.layers_9.encoder_decoder_attention.value.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
2075
+ checkpoint_1007000/target.decoder.layers_9.encoder_decoder_attention.value.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
2076
+ checkpoint_1007000/target.decoder.layers_9.encoder_decoder_attention.value.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
2077
+ checkpoint_1007000/target.decoder.layers_9.encoder_decoder_attention.value.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
2078
+ checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
2079
+ checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
2080
+ checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
2081
+ checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
2082
+ checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
2083
+ checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
2084
+ checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
2085
+ checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
2086
+ checkpoint_1007000/target.decoder.layers_16.encoder_decoder_attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
2087
+ checkpoint_1007000/target.decoder.layers_16.encoder_decoder_attention.query.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
2088
+ checkpoint_1007000/target.decoder.layers_16.encoder_decoder_attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
2089
+ checkpoint_1007000/target.decoder.layers_16.encoder_decoder_attention.query.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
checkpoint_1007000/state.param_states.encoder.layers_12.pre_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
checkpoint_1007000/state.param_states.encoder.layers_12.pre_attention_layer_norm.scale.v/0 ADDED
Binary file (15.3 kB). View file
 
checkpoint_1007000/state.param_states.encoder.layers_19.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
checkpoint_1007000/state.param_states.encoder.layers_19.pre_mlp_layer_norm.scale.v/0 ADDED
Binary file (14.9 kB). View file
 
checkpoint_1007000/target.decoder.decoder_norm.scale/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
checkpoint_1007000/target.decoder.decoder_norm.scale/0 ADDED
Binary file (14.3 kB). View file
 
checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/.zarray.__tmp15590069018174250927.~1663960300308256~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/.zarray.__tmp15744899109354973635.~1663960300421932~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/.zarray.__tmp18375236708728796867.~1663960300688867~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/.zarray.__tmp2103911721188231572.~1663960300822920~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/.zarray.__tmp4333629875821823980.~1663960300551128~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/.zarray.__tmp7696852913333449298.~1663960300272803~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/.zarray.__tmp9885211211724445706.~1663960300632501~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/0.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:45ebfd0c4619eabdf9d89d4b4d4ca63be84cef787c197f35104910d2b96c1eb0
3
+ size 19499409
checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/0.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:86bb7fb122a44e6a1626d0a228a3b16a73fd8733d882b16d7ea13ae71f669335
3
+ size 19499699
checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/0.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:735386322dd1ca5a92f9ec8be01acd5f8bd440a63824c4d7e866cde0e7250f19
3
+ size 19499040
checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/0.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0aae8a586369c2f5662ddbd2070c629eebb94005dc0c61880be17eda15621d26
3
+ size 19499866
checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/0.4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f2856535b155eb66ef1bb6a9a80aee5e8d7a23cc0b1352de5324af33bcde7c01
3
+ size 19500203
checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/0.5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9346c213d864a83e8b7c893834c5489aaa770ade387930c9a9a26fa71a4a4e4a
3
+ size 19499283
checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/0.6 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b6c2de7332788264bc0cabe6465a6748c9b378a4eb961a7965d42059a58a0212
3
+ size 19499187
checkpoint_1007000/target.decoder.layers_15.mlp.wi_1.kernel/0.7 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b0923a051abb9de18aa5b6ecb18d9eb8278e79d17ec5ef71b12c8193c8594915
3
+ size 19499839
checkpoint_1007000/target.decoder.layers_16.encoder_decoder_attention.query.kernel/.zarray.__tmp14275400193037987122.~1663960300384017~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_16.encoder_decoder_attention.query.kernel/.zarray.__tmp5453924144578779166.~1663960300467517~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_16.encoder_decoder_attention.query.kernel/0.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2df3c7ee498018ada3395244f5cd966c96cfc36723a0170b446d5014ffc94a6e
3
+ size 7829506
checkpoint_1007000/target.decoder.layers_16.encoder_decoder_attention.query.kernel/0.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:846e55aa07403ec56feadbf63d504abb5486d9fa81b54a835aae87c970a90f0b
3
+ size 7817548
checkpoint_1007000/target.decoder.layers_16.encoder_decoder_attention.query.kernel/0.6 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:421ff9ef3aa7a31215303afde29fa305259111bfa93a74a9d8da996364a591ba
3
+ size 7817345
checkpoint_1007000/target.decoder.layers_16.encoder_decoder_attention.query.kernel/0.7 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8a24e3541ef54848bdd17cdf7301eb78109d3190dc5e5d938e28162f6021b72e
3
+ size 7818318
checkpoint_1007000/target.decoder.layers_2.self_attention.value.kernel/.zarray.__tmp14805654823044195203.~1663960300941182~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_2.self_attention.value.kernel/.zarray.__tmp18402290304374832220.~1663960300610766~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_2.self_attention.value.kernel/.zarray.__tmp6102370472552948078.~1663960300501139~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_2.self_attention.value.kernel/.zarray.__tmp6369220955053798728.~1663960300890367~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_2.self_attention.value.kernel/.zarray.__tmp7004825582130560441.~1663960300601053~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_2.self_attention.value.kernel/0.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2ab5a5157075ef0c92909267349a61d6aeaf4fd4d5dcb109c9410424b5075450
3
+ size 7815895
checkpoint_1007000/target.decoder.layers_2.self_attention.value.kernel/0.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1f2ccd22a40964baef1ed5a3ef1326f9a1a22436a2fc864a380269e328621512
3
+ size 7820427
checkpoint_1007000/target.decoder.layers_2.self_attention.value.kernel/0.4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:584cfb0f56c6ebf2e9c2052d064b3b30a4e6de3dac3a16e5d9d1548fcbfcaa6c
3
+ size 7820338
checkpoint_1007000/target.decoder.layers_2.self_attention.value.kernel/0.5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0f3959986e249abe9d5710ce77d2c294658b4c04951bfa49526e69a9d1f6495a
3
+ size 7820664
checkpoint_1007000/target.decoder.layers_21.mlp.wi_1.kernel/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_21.mlp.wi_1.kernel/.zarray.__tmp13176058321298810016.~1663960300549058~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_21.mlp.wi_1.kernel/.zarray.__tmp1715683602810787734.~1663960300986925~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_21.mlp.wi_1.kernel/.zarray.__tmp1806355867141919373.~1663960300862420~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_21.mlp.wi_1.kernel/.zarray.__tmp18355203970343633918.~1663960300466384~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_21.mlp.wi_1.kernel/.zarray.__tmp18395826612412633390.~1663960300551073~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_21.mlp.wi_1.kernel/.zarray.__tmp8508567864372588290.~1663960300472419~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_21.mlp.wi_1.kernel/.zarray.__tmp9748784751914184662.~1663960300602153~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_21.mlp.wi_1.kernel/0.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:81df7532ad11ecf0d825d107031c39b8bf566a2ef3564613c8f3f62d41ef1a7a
3
+ size 19498750
checkpoint_1007000/target.decoder.layers_21.mlp.wi_1.kernel/0.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5fd3fc124140dbd91842bd576c901cc6e858e15b06345bf2b28b4ae8c36185bf
3
+ size 19497807
checkpoint_1007000/target.decoder.layers_21.mlp.wi_1.kernel/0.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ef77f53082e13c6251d79725fe4283fe250ed0b42babd8461dd9baa7d0733a94
3
+ size 19498545
checkpoint_1007000/target.decoder.layers_21.mlp.wi_1.kernel/0.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:70f7ee4713350e57aa976c9faf964a9884e8334bd5f4253afc82a68a71aa3e34
3
+ size 19498564