TimeRobber commited on
Commit
97cbfe7
·
1 Parent(s): 60f6115

Upload part 50

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. .gitattributes +48 -0
  2. checkpoint_1007000/state.param_states.decoder.layers_4.pre_cross_attention_layer_norm.scale.v/.zarray +1 -0
  3. checkpoint_1007000/state.param_states.decoder.layers_4.pre_cross_attention_layer_norm.scale.v/0 +0 -0
  4. checkpoint_1007000/state.param_states.encoder.layers_10.pre_attention_layer_norm.scale.v/.zarray +1 -0
  5. checkpoint_1007000/state.param_states.encoder.layers_10.pre_attention_layer_norm.scale.v/0 +0 -0
  6. checkpoint_1007000/state.param_states.encoder.layers_13.pre_attention_layer_norm.scale.v/.zarray +1 -0
  7. checkpoint_1007000/state.param_states.encoder.layers_13.pre_attention_layer_norm.scale.v/0 +0 -0
  8. checkpoint_1007000/target.decoder.layers_13.mlp.wi_1.kernel/.zarray +1 -0
  9. checkpoint_1007000/target.decoder.layers_13.mlp.wi_1.kernel/.zarray.__tmp11765571810778950051.~1663960300383759~ +1 -0
  10. checkpoint_1007000/target.decoder.layers_13.mlp.wi_1.kernel/.zarray.__tmp12912070580570867986.~1663960300500833~ +1 -0
  11. checkpoint_1007000/target.decoder.layers_13.mlp.wi_1.kernel/.zarray.__tmp1514902467801034416.~1663960300780080~ +1 -0
  12. checkpoint_1007000/target.decoder.layers_13.mlp.wi_1.kernel/.zarray.__tmp8901551791242477798.~1663960300683632~ +1 -0
  13. checkpoint_1007000/target.decoder.layers_13.mlp.wi_1.kernel/0.0 +3 -0
  14. checkpoint_1007000/target.decoder.layers_13.mlp.wi_1.kernel/0.1 +3 -0
  15. checkpoint_1007000/target.decoder.layers_13.mlp.wi_1.kernel/0.6 +3 -0
  16. checkpoint_1007000/target.decoder.layers_13.mlp.wi_1.kernel/0.7 +3 -0
  17. checkpoint_1007000/target.decoder.layers_13.self_attention.key.kernel/.zarray +1 -0
  18. checkpoint_1007000/target.decoder.layers_13.self_attention.key.kernel/.zarray.__tmp10324667221790502572.~1663960300499537~ +1 -0
  19. checkpoint_1007000/target.decoder.layers_13.self_attention.key.kernel/.zarray.__tmp10538194903622094863.~1663960300728954~ +1 -0
  20. checkpoint_1007000/target.decoder.layers_13.self_attention.key.kernel/.zarray.__tmp11940870617194847787.~1663960300686060~ +1 -0
  21. checkpoint_1007000/target.decoder.layers_13.self_attention.key.kernel/.zarray.__tmp12433849344879772157.~1663960300271694~ +1 -0
  22. checkpoint_1007000/target.decoder.layers_13.self_attention.key.kernel/.zarray.__tmp13999437852346953159.~1663960300090637~ +1 -0
  23. checkpoint_1007000/target.decoder.layers_13.self_attention.key.kernel/.zarray.__tmp18183955016099952054.~1663960300502067~ +1 -0
  24. checkpoint_1007000/target.decoder.layers_13.self_attention.key.kernel/0.0 +3 -0
  25. checkpoint_1007000/target.decoder.layers_13.self_attention.key.kernel/0.1 +3 -0
  26. checkpoint_1007000/target.decoder.layers_13.self_attention.key.kernel/0.2 +3 -0
  27. checkpoint_1007000/target.decoder.layers_13.self_attention.key.kernel/0.3 +3 -0
  28. checkpoint_1007000/target.decoder.layers_13.self_attention.key.kernel/0.4 +3 -0
  29. checkpoint_1007000/target.decoder.layers_13.self_attention.key.kernel/0.5 +3 -0
  30. checkpoint_1007000/target.decoder.layers_13.self_attention.key.kernel/0.6 +3 -0
  31. checkpoint_1007000/target.decoder.layers_13.self_attention.key.kernel/0.7 +3 -0
  32. checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/.zarray +1 -0
  33. checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/.zarray.__tmp12802281532173975450.~1663960300548609~ +1 -0
  34. checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/.zarray.__tmp14103607313915582811.~1663960300685478~ +1 -0
  35. checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/.zarray.__tmp16104034802188478716.~1663960300551451~ +1 -0
  36. checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/.zarray.__tmp1667756116761455245.~1663960300823209~ +1 -0
  37. checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/.zarray.__tmp17875011171297452638.~1663960300466131~ +1 -0
  38. checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/.zarray.__tmp6087844182203796233.~1663960300731622~ +1 -0
  39. checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/.zarray.__tmp9039702464578184575.~1663960300468210~ +1 -0
  40. checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/0.0 +3 -0
  41. checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/0.1 +3 -0
  42. checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/0.2 +3 -0
  43. checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/0.3 +3 -0
  44. checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/0.4 +3 -0
  45. checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/0.5 +3 -0
  46. checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/0.6 +3 -0
  47. checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/0.7 +3 -0
  48. checkpoint_1007000/target.decoder.layers_21.encoder_decoder_attention.key.kernel/.zarray +1 -0
  49. checkpoint_1007000/target.decoder.layers_21.encoder_decoder_attention.key.kernel/.zarray.__tmp3372111309395329355.~1663960300601058~ +1 -0
  50. checkpoint_1007000/target.decoder.layers_21.encoder_decoder_attention.key.kernel/.zarray.__tmp8212117750309176957.~1663960300308686~ +1 -0
.gitattributes CHANGED
@@ -2527,3 +2527,51 @@ checkpoint_1007000/target.decoder.layers_3.mlp.wi_1.kernel/0.1 filter=lfs diff=l
2527
  checkpoint_1007000/target.decoder.layers_3.mlp.wi_1.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
2528
  checkpoint_1007000/target.decoder.layers_3.mlp.wi_1.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
2529
  checkpoint_1007000/target.decoder.layers_3.mlp.wi_1.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2527
  checkpoint_1007000/target.decoder.layers_3.mlp.wi_1.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
2528
  checkpoint_1007000/target.decoder.layers_3.mlp.wi_1.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
2529
  checkpoint_1007000/target.decoder.layers_3.mlp.wi_1.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
2530
+ checkpoint_1007000/target.decoder.layers_3.mlp.wi_1.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
2531
+ checkpoint_1007000/target.decoder.layers_3.mlp.wi_1.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
2532
+ checkpoint_1007000/target.decoder.layers_3.mlp.wi_1.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
2533
+ checkpoint_1007000/target.decoder.layers_3.mlp.wi_1.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
2534
+ checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
2535
+ checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
2536
+ checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
2537
+ checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
2538
+ checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
2539
+ checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
2540
+ checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
2541
+ checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
2542
+ checkpoint_1007000/target.encoder.layers_20.mlp.wo.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
2543
+ checkpoint_1007000/target.encoder.layers_20.mlp.wo.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
2544
+ checkpoint_1007000/target.encoder.layers_20.mlp.wo.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
2545
+ checkpoint_1007000/target.encoder.layers_20.mlp.wo.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
2546
+ checkpoint_1007000/target.encoder.layers_20.mlp.wo.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
2547
+ checkpoint_1007000/target.encoder.layers_20.mlp.wo.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
2548
+ checkpoint_1007000/target.encoder.layers_20.mlp.wo.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
2549
+ checkpoint_1007000/target.encoder.layers_20.mlp.wo.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
2550
+ checkpoint_1007000/target.decoder.layers_21.encoder_decoder_attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
2551
+ checkpoint_1007000/target.decoder.layers_21.encoder_decoder_attention.key.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
2552
+ checkpoint_1007000/target.decoder.layers_21.encoder_decoder_attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
2553
+ checkpoint_1007000/target.decoder.layers_21.encoder_decoder_attention.key.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
2554
+ checkpoint_1007000/target.decoder.layers_21.encoder_decoder_attention.key.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
2555
+ checkpoint_1007000/target.decoder.layers_21.encoder_decoder_attention.key.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
2556
+ checkpoint_1007000/target.decoder.layers_21.encoder_decoder_attention.key.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
2557
+ checkpoint_1007000/target.decoder.layers_21.encoder_decoder_attention.key.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
2558
+ checkpoint_1007000/target.decoder.layers_23.mlp.wo.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
2559
+ checkpoint_1007000/target.decoder.layers_23.mlp.wo.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
2560
+ checkpoint_1007000/target.decoder.layers_23.mlp.wo.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
2561
+ checkpoint_1007000/target.decoder.layers_23.mlp.wo.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
2562
+ checkpoint_1007000/target.decoder.layers_23.mlp.wo.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
2563
+ checkpoint_1007000/target.decoder.layers_23.mlp.wo.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
2564
+ checkpoint_1007000/target.decoder.layers_23.mlp.wo.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
2565
+ checkpoint_1007000/target.decoder.layers_23.mlp.wo.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
2566
+ checkpoint_1007000/target.decoder.layers_13.self_attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
2567
+ checkpoint_1007000/target.decoder.layers_13.self_attention.key.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
2568
+ checkpoint_1007000/target.decoder.layers_13.self_attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
2569
+ checkpoint_1007000/target.decoder.layers_13.self_attention.key.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
2570
+ checkpoint_1007000/target.decoder.layers_13.self_attention.key.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
2571
+ checkpoint_1007000/target.decoder.layers_13.self_attention.key.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
2572
+ checkpoint_1007000/target.decoder.layers_13.self_attention.key.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
2573
+ checkpoint_1007000/target.decoder.layers_13.self_attention.key.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
2574
+ checkpoint_1007000/target.decoder.layers_13.mlp.wi_1.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
2575
+ checkpoint_1007000/target.decoder.layers_13.mlp.wi_1.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
2576
+ checkpoint_1007000/target.decoder.layers_13.mlp.wi_1.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
2577
+ checkpoint_1007000/target.decoder.layers_13.mlp.wi_1.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
checkpoint_1007000/state.param_states.decoder.layers_4.pre_cross_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
checkpoint_1007000/state.param_states.decoder.layers_4.pre_cross_attention_layer_norm.scale.v/0 ADDED
Binary file (14.8 kB). View file
 
checkpoint_1007000/state.param_states.encoder.layers_10.pre_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
checkpoint_1007000/state.param_states.encoder.layers_10.pre_attention_layer_norm.scale.v/0 ADDED
Binary file (15.3 kB). View file
 
checkpoint_1007000/state.param_states.encoder.layers_13.pre_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
checkpoint_1007000/state.param_states.encoder.layers_13.pre_attention_layer_norm.scale.v/0 ADDED
Binary file (15.2 kB). View file
 
checkpoint_1007000/target.decoder.layers_13.mlp.wi_1.kernel/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_13.mlp.wi_1.kernel/.zarray.__tmp11765571810778950051.~1663960300383759~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_13.mlp.wi_1.kernel/.zarray.__tmp12912070580570867986.~1663960300500833~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_13.mlp.wi_1.kernel/.zarray.__tmp1514902467801034416.~1663960300780080~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_13.mlp.wi_1.kernel/.zarray.__tmp8901551791242477798.~1663960300683632~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_13.mlp.wi_1.kernel/0.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:797652dd19b6a7d15d232e8308c2b2c728c50055b92292dd99b66bfa3a180fa1
3
+ size 19515855
checkpoint_1007000/target.decoder.layers_13.mlp.wi_1.kernel/0.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dc64d1eb358ab1930c54c69cc757c1658ac355b449f42b923b50e195c7001a16
3
+ size 19517652
checkpoint_1007000/target.decoder.layers_13.mlp.wi_1.kernel/0.6 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2860ac818f2adb26c364ba03a9092c48033432ab678dfc4c546695b38046a210
3
+ size 19516865
checkpoint_1007000/target.decoder.layers_13.mlp.wi_1.kernel/0.7 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8062c3038efb769e01665d46ef76e493681012dbebc840d69d0e389dfcdafd5a
3
+ size 19517069
checkpoint_1007000/target.decoder.layers_13.self_attention.key.kernel/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_13.self_attention.key.kernel/.zarray.__tmp10324667221790502572.~1663960300499537~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_13.self_attention.key.kernel/.zarray.__tmp10538194903622094863.~1663960300728954~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_13.self_attention.key.kernel/.zarray.__tmp11940870617194847787.~1663960300686060~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_13.self_attention.key.kernel/.zarray.__tmp12433849344879772157.~1663960300271694~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_13.self_attention.key.kernel/.zarray.__tmp13999437852346953159.~1663960300090637~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_13.self_attention.key.kernel/.zarray.__tmp18183955016099952054.~1663960300502067~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_13.self_attention.key.kernel/0.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:76c57762aa9b527b2f57ebc464adef65af11e134ac7a08cd38db9fb5d28e64b5
3
+ size 7823817
checkpoint_1007000/target.decoder.layers_13.self_attention.key.kernel/0.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4ebf5e734977623ae92fb7d7097f7a53af720cc81ea1339af16d7082eba52343
3
+ size 7837991
checkpoint_1007000/target.decoder.layers_13.self_attention.key.kernel/0.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d9b6688ec136d0784a2ba199fb59c43eda4b6c511a7213826b6a0c53685faabf
3
+ size 7825347
checkpoint_1007000/target.decoder.layers_13.self_attention.key.kernel/0.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:94d8deb95897b6233f6dbc675420b8bef25306d558c22aa1e588130993583d74
3
+ size 7819281
checkpoint_1007000/target.decoder.layers_13.self_attention.key.kernel/0.4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1f490c7434d964f1102e06c0df9e029ed0650e2a7467deca384aa28441a6b97a
3
+ size 7824657
checkpoint_1007000/target.decoder.layers_13.self_attention.key.kernel/0.5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2253532a4110268abe70f7ee95e4e6dfb95ec76c27bb06a5f522422456fdee58
3
+ size 7828966
checkpoint_1007000/target.decoder.layers_13.self_attention.key.kernel/0.6 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8faecf863edf6ae66baa97e378df7e0a44ed0acc3ac512fa1b5422111ad8dc09
3
+ size 7827872
checkpoint_1007000/target.decoder.layers_13.self_attention.key.kernel/0.7 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:357fd023b070e3e6ef85f997f3f6a4ecaaec2c934545a979535662414a5c2a2d
3
+ size 7820282
checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/.zarray.__tmp12802281532173975450.~1663960300548609~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/.zarray.__tmp14103607313915582811.~1663960300685478~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/.zarray.__tmp16104034802188478716.~1663960300551451~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/.zarray.__tmp1667756116761455245.~1663960300823209~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/.zarray.__tmp17875011171297452638.~1663960300466131~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/.zarray.__tmp6087844182203796233.~1663960300731622~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/.zarray.__tmp9039702464578184575.~1663960300468210~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/0.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d4162852f71226fb6e7354171f8211586e69011528c437ecb30922e96b8dfdb1
3
+ size 7818932
checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/0.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fda52e13947e30ccb5e51a4db493cc43ec2ad0c07dd97bcb60f35b6f492ca5da
3
+ size 7812725
checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/0.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:95077a967d79730722a94abe247249d206a61684180e38380de8b8b6abd71ecb
3
+ size 7803585
checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/0.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bcc1a839c32af04f551f74bf959bf8eb7d8916ccef815e0f808d35e17055a470
3
+ size 7812503
checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/0.4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a0440b48df7d5da20a81dc188a83c1e6708e3a4f2eadb66f615fea284bf668f9
3
+ size 7816813
checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/0.5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7ed5cc904e6ab8c263bf30ad7169a485a48be167d03f347669f8e527f1f813ce
3
+ size 7801610
checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/0.6 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4cda6ccbafa682fa7ad71455efec4e68bb215038dbd57e95af254093866fe418
3
+ size 7821553
checkpoint_1007000/target.decoder.layers_2.self_attention.query.kernel/0.7 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4bff8760a1d5c453e4ceedaaee643cb422656a3f19b7d0f0650a9d22c7c75f9d
3
+ size 7814083
checkpoint_1007000/target.decoder.layers_21.encoder_decoder_attention.key.kernel/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_21.encoder_decoder_attention.key.kernel/.zarray.__tmp3372111309395329355.~1663960300601058~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_21.encoder_decoder_attention.key.kernel/.zarray.__tmp8212117750309176957.~1663960300308686~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}