TimeRobber commited on
Commit
80d4197
·
1 Parent(s): e4b46a6

Upload part 55

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. .gitattributes +54 -0
  2. checkpoint_1007000/state.param_states.encoder.layers_9.pre_mlp_layer_norm.scale.v/.zarray +1 -0
  3. checkpoint_1007000/state.param_states.encoder.layers_9.pre_mlp_layer_norm.scale.v/0 +0 -0
  4. checkpoint_1007000/target.decoder.layers_10.self_attention.out.kernel/.zarray +1 -0
  5. checkpoint_1007000/target.decoder.layers_10.self_attention.out.kernel/.zarray.__tmp1105937564183758640.~1663960300385287~ +1 -0
  6. checkpoint_1007000/target.decoder.layers_10.self_attention.out.kernel/.zarray.__tmp15260046325040061733.~1663960300015249~ +1 -0
  7. checkpoint_1007000/target.decoder.layers_10.self_attention.out.kernel/.zarray.__tmp16338011193803630159.~1663960299960414~ +1 -0
  8. checkpoint_1007000/target.decoder.layers_10.self_attention.out.kernel/.zarray.__tmp17973336360947397177.~1663960300229539~ +1 -0
  9. checkpoint_1007000/target.decoder.layers_10.self_attention.out.kernel/.zarray.__tmp4456958716237740877.~1663960300269062~ +1 -0
  10. checkpoint_1007000/target.decoder.layers_10.self_attention.out.kernel/.zarray.__tmp6550413818954659962.~1663960300089897~ +1 -0
  11. checkpoint_1007000/target.decoder.layers_10.self_attention.out.kernel/0.0 +3 -0
  12. checkpoint_1007000/target.decoder.layers_10.self_attention.out.kernel/1.0 +3 -0
  13. checkpoint_1007000/target.decoder.layers_10.self_attention.out.kernel/2.0 +3 -0
  14. checkpoint_1007000/target.decoder.layers_10.self_attention.out.kernel/3.0 +3 -0
  15. checkpoint_1007000/target.decoder.layers_10.self_attention.out.kernel/4.0 +3 -0
  16. checkpoint_1007000/target.decoder.layers_10.self_attention.out.kernel/5.0 +3 -0
  17. checkpoint_1007000/target.decoder.layers_10.self_attention.out.kernel/6.0 +3 -0
  18. checkpoint_1007000/target.decoder.layers_10.self_attention.out.kernel/7.0 +3 -0
  19. checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/.zarray +1 -0
  20. checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/.zarray.__tmp10566777187724039402.~1663960300502375~ +1 -0
  21. checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/.zarray.__tmp1347708317805751784.~1663960300822526~ +1 -0
  22. checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/.zarray.__tmp13560500597481309211.~1663960300548101~ +1 -0
  23. checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/.zarray.__tmp3254274290136234671.~1663960300826412~ +1 -0
  24. checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/.zarray.__tmp3740934665043393579.~1663960300938689~ +1 -0
  25. checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/.zarray.__tmp4268711832544831810.~1663960300729669~ +1 -0
  26. checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/.zarray.__tmp9074334274789578976.~1663960300622114~ +1 -0
  27. checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/0.0 +3 -0
  28. checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/1.0 +3 -0
  29. checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/2.0 +3 -0
  30. checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/3.0 +3 -0
  31. checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/4.0 +3 -0
  32. checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/5.0 +3 -0
  33. checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/6.0 +3 -0
  34. checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/7.0 +3 -0
  35. checkpoint_1007000/target.decoder.layers_19.self_attention.out.kernel/.zarray +1 -0
  36. checkpoint_1007000/target.decoder.layers_19.self_attention.out.kernel/.zarray.__tmp17012158359598794522.~1663960300132054~ +1 -0
  37. checkpoint_1007000/target.decoder.layers_19.self_attention.out.kernel/0.0 +3 -0
  38. checkpoint_1007000/target.decoder.layers_19.self_attention.out.kernel/2.0 +3 -0
  39. checkpoint_1007000/target.decoder.layers_19.self_attention.out.kernel/3.0 +3 -0
  40. checkpoint_1007000/target.decoder.layers_19.self_attention.out.kernel/4.0 +3 -0
  41. checkpoint_1007000/target.decoder.layers_19.self_attention.out.kernel/5.0 +3 -0
  42. checkpoint_1007000/target.decoder.layers_19.self_attention.out.kernel/7.0 +3 -0
  43. checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.out.kernel/.zarray +1 -0
  44. checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.out.kernel/.zarray.__tmp13528873057967423628.~1663960300500187~ +1 -0
  45. checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.out.kernel/.zarray.__tmp1499336269700896617.~1663960300729091~ +1 -0
  46. checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.out.kernel/.zarray.__tmp17842300620868211239.~1663960300424968~ +1 -0
  47. checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.out.kernel/0.0 +3 -0
  48. checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.out.kernel/1.0 +3 -0
  49. checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.out.kernel/2.0 +3 -0
  50. checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.out.kernel/3.0 +3 -0
.gitattributes CHANGED
@@ -2773,3 +2773,57 @@ checkpoint_1007000/target.encoder.layers_13.mlp.wi_0.kernel/0.2 filter=lfs diff=
2773
  checkpoint_1007000/target.encoder.layers_13.mlp.wi_0.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
2774
  checkpoint_1007000/target.decoder.layers_19.self_attention.out.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
2775
  checkpoint_1007000/target.decoder.layers_19.self_attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2773
  checkpoint_1007000/target.encoder.layers_13.mlp.wi_0.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
2774
  checkpoint_1007000/target.decoder.layers_19.self_attention.out.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
2775
  checkpoint_1007000/target.decoder.layers_19.self_attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
2776
+ checkpoint_1007000/target.decoder.layers_19.self_attention.out.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
2777
+ checkpoint_1007000/target.decoder.layers_19.self_attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
2778
+ checkpoint_1007000/target.decoder.layers_19.self_attention.out.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
2779
+ checkpoint_1007000/target.decoder.layers_19.self_attention.out.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
2780
+ checkpoint_1007000/target.decoder.layers_19.self_attention.out.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
2781
+ checkpoint_1007000/target.decoder.layers_19.self_attention.out.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
2782
+ checkpoint_1007000/target.encoder.layers_8.mlp.wo.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
2783
+ checkpoint_1007000/target.encoder.layers_8.mlp.wo.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
2784
+ checkpoint_1007000/target.encoder.layers_8.mlp.wo.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
2785
+ checkpoint_1007000/target.encoder.layers_8.mlp.wo.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
2786
+ checkpoint_1007000/target.encoder.layers_8.mlp.wo.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
2787
+ checkpoint_1007000/target.encoder.layers_8.mlp.wo.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
2788
+ checkpoint_1007000/target.encoder.layers_8.mlp.wo.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
2789
+ checkpoint_1007000/target.encoder.layers_8.mlp.wo.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
2790
+ checkpoint_1007000/target.decoder.layers_10.self_attention.out.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
2791
+ checkpoint_1007000/target.decoder.layers_10.self_attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
2792
+ checkpoint_1007000/target.decoder.layers_10.self_attention.out.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
2793
+ checkpoint_1007000/target.decoder.layers_10.self_attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
2794
+ checkpoint_1007000/target.decoder.layers_10.self_attention.out.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
2795
+ checkpoint_1007000/target.decoder.layers_10.self_attention.out.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
2796
+ checkpoint_1007000/target.decoder.layers_10.self_attention.out.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
2797
+ checkpoint_1007000/target.decoder.layers_10.self_attention.out.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
2798
+ checkpoint_1007000/target.encoder.layers_6.attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
2799
+ checkpoint_1007000/target.encoder.layers_6.attention.query.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
2800
+ checkpoint_1007000/target.encoder.layers_6.attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
2801
+ checkpoint_1007000/target.encoder.layers_6.attention.query.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
2802
+ checkpoint_1007000/target.encoder.layers_6.attention.query.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
2803
+ checkpoint_1007000/target.encoder.layers_6.attention.query.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
2804
+ checkpoint_1007000/target.encoder.layers_6.attention.query.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
2805
+ checkpoint_1007000/target.encoder.layers_6.attention.query.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
2806
+ checkpoint_1007000/target.decoder.layers_4.encoder_decoder_attention.out.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
2807
+ checkpoint_1007000/target.decoder.layers_4.encoder_decoder_attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
2808
+ checkpoint_1007000/target.decoder.layers_4.encoder_decoder_attention.out.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
2809
+ checkpoint_1007000/target.decoder.layers_4.encoder_decoder_attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
2810
+ checkpoint_1007000/target.decoder.layers_4.encoder_decoder_attention.out.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
2811
+ checkpoint_1007000/target.decoder.layers_4.encoder_decoder_attention.out.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
2812
+ checkpoint_1007000/target.decoder.layers_4.encoder_decoder_attention.out.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
2813
+ checkpoint_1007000/target.decoder.layers_4.encoder_decoder_attention.out.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
2814
+ checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
2815
+ checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
2816
+ checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
2817
+ checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
2818
+ checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
2819
+ checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
2820
+ checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
2821
+ checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
2822
+ checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.out.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
2823
+ checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
2824
+ checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.out.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
2825
+ checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
2826
+ checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.out.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
2827
+ checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.out.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
2828
+ checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.out.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
2829
+ checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.out.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
checkpoint_1007000/state.param_states.encoder.layers_9.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
checkpoint_1007000/state.param_states.encoder.layers_9.pre_mlp_layer_norm.scale.v/0 ADDED
Binary file (15.3 kB). View file
 
checkpoint_1007000/target.decoder.layers_10.self_attention.out.kernel/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_10.self_attention.out.kernel/.zarray.__tmp1105937564183758640.~1663960300385287~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_10.self_attention.out.kernel/.zarray.__tmp15260046325040061733.~1663960300015249~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_10.self_attention.out.kernel/.zarray.__tmp16338011193803630159.~1663960299960414~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_10.self_attention.out.kernel/.zarray.__tmp17973336360947397177.~1663960300229539~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_10.self_attention.out.kernel/.zarray.__tmp4456958716237740877.~1663960300269062~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_10.self_attention.out.kernel/.zarray.__tmp6550413818954659962.~1663960300089897~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_10.self_attention.out.kernel/0.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:14d66b8a9a7fd4f9fca0e71aa936ed0d599101321b99c1015b85ea5eb9fcad98
3
+ size 7815329
checkpoint_1007000/target.decoder.layers_10.self_attention.out.kernel/1.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:859f60411b6d2a62bba21fc946b24481b11a49538f563ea9ebd6e9bbef8e3c4b
3
+ size 7814419
checkpoint_1007000/target.decoder.layers_10.self_attention.out.kernel/2.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:39d87eaf5730070828b8810551ac99870d193d974bb0c1f63eafea82417b5e75
3
+ size 7814004
checkpoint_1007000/target.decoder.layers_10.self_attention.out.kernel/3.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6c5ecf8051338723fd2e506791022c8ce49d75051daaaf5575601aedaf18e59a
3
+ size 7814979
checkpoint_1007000/target.decoder.layers_10.self_attention.out.kernel/4.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aaeb62ffe69e8e3dc6d8004d75418abb2d1f9bb635b89c66daace3fff4564f46
3
+ size 7815022
checkpoint_1007000/target.decoder.layers_10.self_attention.out.kernel/5.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:358210a1c8fbafbea4046fee6a4cb63707c0d2c97ff24708bbf5562fd734c855
3
+ size 7812398
checkpoint_1007000/target.decoder.layers_10.self_attention.out.kernel/6.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0038f285a990bf58bcf449aa175e5f3dc0d02824ad8582236077f560c6c55f40
3
+ size 7813357
checkpoint_1007000/target.decoder.layers_10.self_attention.out.kernel/7.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0031c644d7704833825c511a130eace4092be56785872cb86bf13175a714b938
3
+ size 7811733
checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/.zarray.__tmp10566777187724039402.~1663960300502375~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/.zarray.__tmp1347708317805751784.~1663960300822526~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/.zarray.__tmp13560500597481309211.~1663960300548101~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/.zarray.__tmp3254274290136234671.~1663960300826412~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/.zarray.__tmp3740934665043393579.~1663960300938689~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/.zarray.__tmp4268711832544831810.~1663960300729669~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/.zarray.__tmp9074334274789578976.~1663960300622114~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/0.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dad001c678352e4c543805f0c7c89996fc9335d8049ca42144477988bb944301
3
+ size 19547411
checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/1.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:af2c9811711cc482bbfaa4bea1b79aee6ecce6a9aac00d97229547c421102c86
3
+ size 19547290
checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/2.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:56df1744db0f6b3be75e5c70d388e0f37b43c9afde58038b29ff04e5a627f5a6
3
+ size 19547356
checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/3.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:37abfe7f832307d1cd3b4e9ed215928b25621fbee2fb31ccfde54e1174ac2a12
3
+ size 19546715
checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/4.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:976d917a3b4857c36e3686b8b38bcfda604a7d1ae0a074ec0159487f80140450
3
+ size 19547102
checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/5.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4ca0a34a83edb4b4b0bcc4f63ee9177fc09b7b09ddc74c690a494bb9ee412745
3
+ size 19547223
checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/6.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4569daf609e906701708f00b4325ed5f0438a367beffbcc748f585dd5048d204
3
+ size 19546611
checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/7.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5f017dfaf0f98ed36896c81ace50bb55de7164a6e2545bd6558360cc20930c19
3
+ size 19547073
checkpoint_1007000/target.decoder.layers_19.self_attention.out.kernel/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_19.self_attention.out.kernel/.zarray.__tmp17012158359598794522.~1663960300132054~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_19.self_attention.out.kernel/0.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:79d5b97e5dffddf344aa1a4c4aba71b5b45462f682d8b9a3ad25bcb55e9ad0fd
3
+ size 7804234
checkpoint_1007000/target.decoder.layers_19.self_attention.out.kernel/2.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e2a2690dec9b402469073c23bb92f0afe2cabf45bed4e5121a2c2329767736fd
3
+ size 7805172
checkpoint_1007000/target.decoder.layers_19.self_attention.out.kernel/3.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d05188293e8d66ccd355ac0cebce9dd73c2a1c781cd5f8ebad98d7f0d21143ab
3
+ size 7804864
checkpoint_1007000/target.decoder.layers_19.self_attention.out.kernel/4.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2fbaa2868fd28a1fbb535827a4e53826da1f3a7db432389e4d6b9dc54513f676
3
+ size 7803327
checkpoint_1007000/target.decoder.layers_19.self_attention.out.kernel/5.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8a3c69875e40a669ab8daae0f4af5af1720619f6612496ebec9617f4ce480b2f
3
+ size 7805047
checkpoint_1007000/target.decoder.layers_19.self_attention.out.kernel/7.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6e29169c980821ecdf9fc25ce4f1d04ea34a3173c5dbbb88878ba34e63422295
3
+ size 7803180
checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.out.kernel/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.out.kernel/.zarray.__tmp13528873057967423628.~1663960300500187~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.out.kernel/.zarray.__tmp1499336269700896617.~1663960300729091~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.out.kernel/.zarray.__tmp17842300620868211239.~1663960300424968~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.out.kernel/0.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9eb87bf15d477db621dc2176ce414fa22fc1f00ba7de640d8d4e50b2adf65141
3
+ size 7810379
checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.out.kernel/1.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e9b0ed2565a589d24d3bedd1ad7a740c4cfed5cefa758e5ac8d2a0d81e90e970
3
+ size 7808995
checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.out.kernel/2.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2c4d56de663b52dff8cf1fb27b9e1bf7aed9661e52a1435ebde4f7cf373f78f0
3
+ size 7809281
checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.out.kernel/3.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:23ca5c0402acd6ab7c1efb59f6df9ff276b39e00803aa6778c0bba30ec514b42
3
+ size 7808493