TimeRobber committed on
Commit
f2038ac
·
1 Parent(s): 778d6b7

Upload part 13

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. .gitattributes +53 -0
  2. checkpoint_1007000/target.decoder.layers_1.self_attention.value.kernel/.zarray +1 -0
  3. checkpoint_1007000/target.decoder.layers_1.self_attention.value.kernel/.zarray.__tmp14658094100065076136.~1663960300090561~ +1 -0
  4. checkpoint_1007000/target.decoder.layers_1.self_attention.value.kernel/.zarray.__tmp16230492432462742032.~1663960300387076~ +1 -0
  5. checkpoint_1007000/target.decoder.layers_1.self_attention.value.kernel/.zarray.__tmp16379259808268770224.~1663960300175113~ +1 -0
  6. checkpoint_1007000/target.decoder.layers_1.self_attention.value.kernel/.zarray.__tmp8894115837369550982.~1663960299882008~ +1 -0
  7. checkpoint_1007000/target.decoder.layers_1.self_attention.value.kernel/.zarray.__tmp8990031795982035122.~1663960299958555~ +1 -0
  8. checkpoint_1007000/target.decoder.layers_1.self_attention.value.kernel/0.0 +3 -0
  9. checkpoint_1007000/target.decoder.layers_1.self_attention.value.kernel/0.1 +3 -0
  10. checkpoint_1007000/target.decoder.layers_1.self_attention.value.kernel/0.2 +3 -0
  11. checkpoint_1007000/target.decoder.layers_1.self_attention.value.kernel/0.3 +3 -0
  12. checkpoint_1007000/target.decoder.layers_1.self_attention.value.kernel/0.4 +3 -0
  13. checkpoint_1007000/target.decoder.layers_1.self_attention.value.kernel/0.5 +3 -0
  14. checkpoint_1007000/target.decoder.layers_1.self_attention.value.kernel/0.6 +3 -0
  15. checkpoint_1007000/target.decoder.layers_1.self_attention.value.kernel/0.7 +3 -0
  16. checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.key.kernel/.zarray.__tmp11577145964185916981.~1663960300086131~ +1 -0
  17. checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.key.kernel/.zarray.__tmp9374932084099255530.~1663960300271661~ +1 -0
  18. checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.key.kernel/0.4 +3 -0
  19. checkpoint_1007000/target.decoder.layers_3.pre_mlp_layer_norm.scale/.zarray +1 -0
  20. checkpoint_1007000/target.decoder.layers_3.pre_mlp_layer_norm.scale/0 +0 -0
  21. checkpoint_1007000/target.decoder.layers_9.self_attention.key.kernel/.zarray +1 -0
  22. checkpoint_1007000/target.decoder.layers_9.self_attention.key.kernel/.zarray.__tmp11094273487534505663.~1663960300308880~ +1 -0
  23. checkpoint_1007000/target.decoder.layers_9.self_attention.key.kernel/.zarray.__tmp11832826128042483391.~1663960300601290~ +1 -0
  24. checkpoint_1007000/target.decoder.layers_9.self_attention.key.kernel/0.0 +3 -0
  25. checkpoint_1007000/target.decoder.layers_9.self_attention.key.kernel/0.1 +3 -0
  26. checkpoint_1007000/target.decoder.layers_9.self_attention.key.kernel/0.2 +3 -0
  27. checkpoint_1007000/target.decoder.layers_9.self_attention.key.kernel/0.3 +3 -0
  28. checkpoint_1007000/target.decoder.layers_9.self_attention.key.kernel/0.4 +3 -0
  29. checkpoint_1007000/target.decoder.layers_9.self_attention.key.kernel/0.5 +3 -0
  30. checkpoint_1007000/target.decoder.layers_9.self_attention.key.kernel/0.6 +3 -0
  31. checkpoint_1007000/target.decoder.layers_9.self_attention.key.kernel/0.7 +3 -0
  32. checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/.zarray +1 -0
  33. checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/.zarray.__tmp11545495112761785230.~1663960300421208~ +1 -0
  34. checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/.zarray.__tmp13140827661821471681.~1663960300546318~ +1 -0
  35. checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/.zarray.__tmp15222983945689583177.~1663960300941715~ +1 -0
  36. checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/.zarray.__tmp162813558043179627.~1663960300688213~ +1 -0
  37. checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/.zarray.__tmp2276807198409161350.~1663960300385594~ +1 -0
  38. checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/.zarray.__tmp4389650834453463471.~1663960300423047~ +1 -0
  39. checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/.zarray.__tmp8798756328389882663.~1663960300552107~ +1 -0
  40. checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/0.0 +3 -0
  41. checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/0.1 +3 -0
  42. checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/0.2 +3 -0
  43. checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/0.3 +3 -0
  44. checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/0.4 +3 -0
  45. checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/0.5 +3 -0
  46. checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/0.6 +3 -0
  47. checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/0.7 +3 -0
  48. checkpoint_1007000/target.encoder.layers_17.mlp.wi_1.kernel/.zarray +1 -0
  49. checkpoint_1007000/target.encoder.layers_17.mlp.wi_1.kernel/.zarray.__tmp13440713807143523604.~1663960300863191~ +1 -0
  50. checkpoint_1007000/target.encoder.layers_17.mlp.wi_1.kernel/.zarray.__tmp14332112127674379251.~1663960300421660~ +1 -0
.gitattributes CHANGED
@@ -650,3 +650,56 @@ checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.key.kernel
650
  checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.key.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
651
  checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.key.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
652
  checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.key.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
650
  checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.key.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
651
  checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.key.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
652
  checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.key.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
653
+ checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.key.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
654
+ checkpoint_1007000/target.encoder.layers_4.attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
655
+ checkpoint_1007000/target.encoder.layers_4.attention.query.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
656
+ checkpoint_1007000/target.encoder.layers_4.attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
657
+ checkpoint_1007000/target.encoder.layers_4.attention.query.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
658
+ checkpoint_1007000/target.encoder.layers_4.attention.query.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
659
+ checkpoint_1007000/target.encoder.layers_4.attention.query.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
660
+ checkpoint_1007000/target.encoder.layers_4.attention.query.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
661
+ checkpoint_1007000/target.encoder.layers_4.attention.query.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
662
+ checkpoint_1007000/target.encoder.layers_22.attention.value.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
663
+ checkpoint_1007000/target.encoder.layers_22.attention.value.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
664
+ checkpoint_1007000/target.encoder.layers_22.attention.value.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
665
+ checkpoint_1007000/target.encoder.layers_22.attention.value.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
666
+ checkpoint_1007000/target.encoder.layers_22.attention.value.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
667
+ checkpoint_1007000/target.encoder.layers_22.attention.value.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
668
+ checkpoint_1007000/target.encoder.layers_22.attention.value.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
669
+ checkpoint_1007000/target.encoder.layers_22.attention.value.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
670
+ checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
671
+ checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
672
+ checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
673
+ checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
674
+ checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
675
+ checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
676
+ checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
677
+ checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
678
+ checkpoint_1007000/target.encoder.layers_17.mlp.wi_1.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
679
+ checkpoint_1007000/target.encoder.layers_17.mlp.wi_1.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
680
+ checkpoint_1007000/target.encoder.layers_17.mlp.wi_1.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
681
+ checkpoint_1007000/target.encoder.layers_17.mlp.wi_1.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
682
+ checkpoint_1007000/target.encoder.layers_17.mlp.wi_1.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
683
+ checkpoint_1007000/target.encoder.layers_17.mlp.wi_1.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
684
+ checkpoint_1007000/target.encoder.layers_17.mlp.wi_1.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
685
+ checkpoint_1007000/target.encoder.layers_17.mlp.wi_1.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
686
+ checkpoint_1007000/target.decoder.layers_1.self_attention.value.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
687
+ checkpoint_1007000/target.decoder.layers_1.self_attention.value.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
688
+ checkpoint_1007000/target.decoder.layers_1.self_attention.value.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
689
+ checkpoint_1007000/target.decoder.layers_1.self_attention.value.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
690
+ checkpoint_1007000/target.decoder.layers_1.self_attention.value.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
691
+ checkpoint_1007000/target.decoder.layers_1.self_attention.value.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
692
+ checkpoint_1007000/target.decoder.layers_1.self_attention.value.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
693
+ checkpoint_1007000/target.decoder.layers_1.self_attention.value.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
694
+ checkpoint_1007000/target.decoder.layers_9.self_attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
695
+ checkpoint_1007000/target.decoder.layers_9.self_attention.key.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
696
+ checkpoint_1007000/target.decoder.layers_9.self_attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
697
+ checkpoint_1007000/target.decoder.layers_9.self_attention.key.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
698
+ checkpoint_1007000/target.decoder.layers_9.self_attention.key.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
699
+ checkpoint_1007000/target.decoder.layers_9.self_attention.key.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
700
+ checkpoint_1007000/target.decoder.layers_9.self_attention.key.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
701
+ checkpoint_1007000/target.decoder.layers_9.self_attention.key.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
702
+ checkpoint_1007000/target.encoder.layers_23.mlp.wo.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
703
+ checkpoint_1007000/target.encoder.layers_23.mlp.wo.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
704
+ checkpoint_1007000/target.encoder.layers_23.mlp.wo.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
705
+ checkpoint_1007000/target.encoder.layers_23.mlp.wo.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
checkpoint_1007000/target.decoder.layers_1.self_attention.value.kernel/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_1.self_attention.value.kernel/.zarray.__tmp14658094100065076136.~1663960300090561~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_1.self_attention.value.kernel/.zarray.__tmp16230492432462742032.~1663960300387076~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_1.self_attention.value.kernel/.zarray.__tmp16379259808268770224.~1663960300175113~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_1.self_attention.value.kernel/.zarray.__tmp8894115837369550982.~1663960299882008~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_1.self_attention.value.kernel/.zarray.__tmp8990031795982035122.~1663960299958555~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_1.self_attention.value.kernel/0.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f6a30f11bdff8e1816aa8440b48708a7446da358fd95ba3d84b3b27bcf99276d
3
+ size 7814640
checkpoint_1007000/target.decoder.layers_1.self_attention.value.kernel/0.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8c1a110c98bb3427119464208aa12990acd3f8a2b434922707c48bd38d341566
3
+ size 7804931
checkpoint_1007000/target.decoder.layers_1.self_attention.value.kernel/0.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4ed545265752dcae41736ed90081534d7ad8de9f5fbba2296ef835877d18c480
3
+ size 7800278
checkpoint_1007000/target.decoder.layers_1.self_attention.value.kernel/0.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dbee059f811bc97efd1ccbbb5d4cffd2a0a4afccb117e6501d32b950b25544ae
3
+ size 7808749
checkpoint_1007000/target.decoder.layers_1.self_attention.value.kernel/0.4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f3a76999e096fddc05ef11a6524d091a644a407fa8e6e8bc87e6507c1c8f7e0b
3
+ size 7816034
checkpoint_1007000/target.decoder.layers_1.self_attention.value.kernel/0.5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:266f15d2c82e2b840700c6af2be4d7452d18af52e40a6191cda70316dc799af8
3
+ size 7807960
checkpoint_1007000/target.decoder.layers_1.self_attention.value.kernel/0.6 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c47ac0776e59f0c18898557365714e809deb2b35a0df08c2d1451326e37e9cde
3
+ size 7814802
checkpoint_1007000/target.decoder.layers_1.self_attention.value.kernel/0.7 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3ebc325295929c79465a68f4ea2b2fcab693b7ecc8b8b2677e445ace89a42300
3
+ size 7805270
checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.key.kernel/.zarray.__tmp11577145964185916981.~1663960300086131~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.key.kernel/.zarray.__tmp9374932084099255530.~1663960300271661~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.key.kernel/0.4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cfdc5b2eab1c9016cdd8fbc186a5a1bafac804b14ffe84aa7db25a2408b98a5c
3
+ size 7804594
checkpoint_1007000/target.decoder.layers_3.pre_mlp_layer_norm.scale/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_3.pre_mlp_layer_norm.scale/0 ADDED
Binary file (15 kB). View file
 
checkpoint_1007000/target.decoder.layers_9.self_attention.key.kernel/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_9.self_attention.key.kernel/.zarray.__tmp11094273487534505663.~1663960300308880~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_9.self_attention.key.kernel/.zarray.__tmp11832826128042483391.~1663960300601290~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_9.self_attention.key.kernel/0.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9ee6fe1523955408a6d544abb90f458a5c3fa3a42c181cf2e1bf65989eb4f18f
3
+ size 7812419
checkpoint_1007000/target.decoder.layers_9.self_attention.key.kernel/0.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:498b593babc6ec7160c59ee2a853be0f2289627025a534a120689602c08f027b
3
+ size 7821411
checkpoint_1007000/target.decoder.layers_9.self_attention.key.kernel/0.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2129698ef8523b5a379085029aeb0a4a7193eb7b24f6fb2afd3f55af5b133dd6
3
+ size 7825787
checkpoint_1007000/target.decoder.layers_9.self_attention.key.kernel/0.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a647768208da0a3a89ad492f46b29000b1d3fd62c2a73275e64576eec1c9bdb9
3
+ size 7810434
checkpoint_1007000/target.decoder.layers_9.self_attention.key.kernel/0.4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:480ec40a32fa68b8423fc3f033a5b56456eb04805b29b0601cc9dafa143680e0
3
+ size 7822797
checkpoint_1007000/target.decoder.layers_9.self_attention.key.kernel/0.5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e19c2b1cdc06085ba40ea79f0e2b64dd32f6c49707eeb717b88a39123e814b5e
3
+ size 7826665
checkpoint_1007000/target.decoder.layers_9.self_attention.key.kernel/0.6 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bb3e300be6926f62c00a7dd5081aedebdaf6d32fa58c3d32d1ed6d4d35fbf19c
3
+ size 7817810
checkpoint_1007000/target.decoder.layers_9.self_attention.key.kernel/0.7 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dc4ba268ceab1c440fc7f1647fa7743326acdc8c56fff6b30af6ed914e15525b
3
+ size 7816754
checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/.zarray.__tmp11545495112761785230.~1663960300421208~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/.zarray.__tmp13140827661821471681.~1663960300546318~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/.zarray.__tmp15222983945689583177.~1663960300941715~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/.zarray.__tmp162813558043179627.~1663960300688213~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/.zarray.__tmp2276807198409161350.~1663960300385594~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/.zarray.__tmp4389650834453463471.~1663960300423047~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/.zarray.__tmp8798756328389882663.~1663960300552107~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/0.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ef0e14ac18af3fd3cea52c137befcb494d7b81d0252a5116d301ec76fe503e9c
3
+ size 7813809
checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/0.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:93505479e928d6d35502b9a871a1982265b51dba82b87a685f1c77f4ba78c364
3
+ size 7815254
checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/0.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:252ca20d245d9180aed6c2a770be65f560be53252cb5e5d3ae2c3cb40bc677be
3
+ size 7813169
checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/0.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bf249000e51b7ef82c68e838dfc86f613445605b2e46bb258b75cbc1d472b103
3
+ size 7815115
checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/0.4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:61f47f93552ec62e8aa7ab2b6f6c827f7e90f311f789d309aa8527b6029ea6bf
3
+ size 7814756
checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/0.5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1b71bdecd28cacca5c1221e3aa215e70f273947dd4ed7296a10faa8909049ef5
3
+ size 7818533
checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/0.6 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3e553124a9d99ffc589ccb1358a6eac944930c4d98e5a7d97b4524c1caf4fcf7
3
+ size 7814298
checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/0.7 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d21afbd5babd00fdd95cbf7fc03e030bb962e1bd4b96cd082e3b132f340b97c5
3
+ size 7813354
checkpoint_1007000/target.encoder.layers_17.mlp.wi_1.kernel/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
checkpoint_1007000/target.encoder.layers_17.mlp.wi_1.kernel/.zarray.__tmp13440713807143523604.~1663960300863191~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
checkpoint_1007000/target.encoder.layers_17.mlp.wi_1.kernel/.zarray.__tmp14332112127674379251.~1663960300421660~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}