xinhe committed on
Commit
f2df194
·
verified ·
1 Parent(s): 5a934a0

Upload folder using huggingface_hub (part 2)

Browse files
.gitattributes CHANGED
@@ -34,3 +34,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
  tokenizer.json filter=lfs diff=lfs merge=lfs -text
 
 
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
  tokenizer.json filter=lfs diff=lfs merge=lfs -text
37
+ model.safetensors.index.json filter=lfs diff=lfs merge=lfs -text
model-00245-of-00282.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:05396c8410b500de19a9bb610083e63c33f2a2d965b6418c9344c77774fb31a0
3
- size 1532386504
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:05fca80abaaadac06ea7fa8124375020c4119e2e70b3508e4c067519f6044270
3
+ size 1533148232
model-00259-of-00282.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dcca03b2b3d5318433845e61beb3e032fc59484bc3654693c8a35e8a3570e3fb
3
- size 1532386200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:888e2ddd55d2ba621940b46dd977c6ec003b36d4fbc8d1fe48dcd094f240b2c0
3
+ size 1533147928
model-00274-of-00282.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d2250e8e3413aae6650f6d31139d428e0c4eda6ba5b2b190e60e849529fd2ff4
3
- size 1532398568
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fb4051587784b630d14064a3b129ebd6323bbc78eaaea7581cb59b64dcf713de
3
+ size 1533160296
model.safetensors.index.json CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:deed66c5d5102260b99056b51d21396a7977dc9a500bc481ca4f9586ef46300c
3
- size 11530961
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4719c71763835e4e7ea4261fc671b9fbc21ed6597d9b02f46d998ffeed2e6922
3
+ size 11528919
quantization_config.json CHANGED
@@ -58451,107 +58451,129 @@
58451
  "model.layers.0.mlp.gate_proj",
58452
  "model.layers.0.mlp.up_proj",
58453
  "model.layers.0.self_attn.indexer.weights_proj",
 
58454
  "model.layers.1.mlp.down_proj",
58455
  "model.layers.1.mlp.gate_proj",
58456
  "model.layers.1.mlp.up_proj",
58457
  "model.layers.1.self_attn.indexer.weights_proj",
 
58458
  "model.layers.10.mlp.gate",
58459
  "model.layers.10.self_attn.indexer.weights_proj",
 
58460
  "model.layers.11.mlp.gate",
58461
  "model.layers.12.mlp.gate",
58462
  "model.layers.13.mlp.gate",
58463
  "model.layers.14.mlp.gate",
58464
  "model.layers.14.self_attn.indexer.weights_proj",
 
58465
  "model.layers.15.mlp.gate",
58466
  "model.layers.16.mlp.gate",
58467
  "model.layers.17.mlp.gate",
58468
  "model.layers.18.mlp.gate",
58469
  "model.layers.18.self_attn.indexer.weights_proj",
 
58470
  "model.layers.19.mlp.gate",
58471
  "model.layers.2.mlp.down_proj",
58472
  "model.layers.2.mlp.gate_proj",
58473
  "model.layers.2.mlp.up_proj",
58474
  "model.layers.2.self_attn.indexer.weights_proj",
 
58475
  "model.layers.20.mlp.gate",
58476
  "model.layers.21.mlp.gate",
58477
  "model.layers.22.mlp.gate",
58478
  "model.layers.22.self_attn.indexer.weights_proj",
 
58479
  "model.layers.23.mlp.gate",
58480
  "model.layers.24.mlp.gate",
58481
  "model.layers.25.mlp.gate",
58482
  "model.layers.26.mlp.gate",
58483
  "model.layers.26.self_attn.indexer.weights_proj",
 
58484
  "model.layers.27.mlp.gate",
58485
  "model.layers.28.mlp.gate",
58486
  "model.layers.29.mlp.gate",
58487
  "model.layers.3.mlp.gate",
58488
  "model.layers.30.mlp.gate",
58489
  "model.layers.30.self_attn.indexer.weights_proj",
 
58490
  "model.layers.31.mlp.gate",
58491
  "model.layers.32.mlp.gate",
58492
  "model.layers.33.mlp.gate",
58493
  "model.layers.34.mlp.gate",
58494
  "model.layers.34.self_attn.indexer.weights_proj",
 
58495
  "model.layers.35.mlp.gate",
58496
  "model.layers.36.mlp.gate",
58497
  "model.layers.37.mlp.gate",
58498
  "model.layers.38.mlp.gate",
58499
  "model.layers.38.self_attn.indexer.weights_proj",
 
58500
  "model.layers.39.mlp.gate",
58501
  "model.layers.4.mlp.gate",
58502
  "model.layers.40.mlp.gate",
58503
  "model.layers.41.mlp.gate",
58504
  "model.layers.42.mlp.gate",
58505
  "model.layers.42.self_attn.indexer.weights_proj",
 
58506
  "model.layers.43.mlp.gate",
58507
  "model.layers.44.mlp.gate",
58508
  "model.layers.45.mlp.gate",
58509
  "model.layers.46.mlp.gate",
58510
  "model.layers.46.self_attn.indexer.weights_proj",
 
58511
  "model.layers.47.mlp.gate",
58512
  "model.layers.48.mlp.gate",
58513
  "model.layers.49.mlp.gate",
58514
  "model.layers.5.mlp.gate",
58515
  "model.layers.50.mlp.gate",
58516
  "model.layers.50.self_attn.indexer.weights_proj",
 
58517
  "model.layers.51.mlp.gate",
58518
  "model.layers.52.mlp.gate",
58519
  "model.layers.53.mlp.gate",
58520
  "model.layers.54.mlp.gate",
58521
  "model.layers.54.self_attn.indexer.weights_proj",
 
58522
  "model.layers.55.mlp.gate",
58523
  "model.layers.56.mlp.gate",
58524
  "model.layers.57.mlp.gate",
58525
  "model.layers.58.mlp.gate",
58526
  "model.layers.58.self_attn.indexer.weights_proj",
 
58527
  "model.layers.59.mlp.gate",
58528
  "model.layers.6.mlp.gate",
58529
  "model.layers.6.self_attn.indexer.weights_proj",
 
58530
  "model.layers.60.mlp.gate",
58531
  "model.layers.61.mlp.gate",
58532
  "model.layers.62.mlp.gate",
58533
  "model.layers.62.self_attn.indexer.weights_proj",
 
58534
  "model.layers.63.mlp.gate",
58535
  "model.layers.64.mlp.gate",
58536
  "model.layers.65.mlp.gate",
58537
  "model.layers.66.mlp.gate",
58538
  "model.layers.66.self_attn.indexer.weights_proj",
 
58539
  "model.layers.67.mlp.gate",
58540
  "model.layers.68.mlp.gate",
58541
  "model.layers.69.mlp.gate",
58542
  "model.layers.7.mlp.gate",
58543
  "model.layers.70.mlp.gate",
58544
  "model.layers.70.self_attn.indexer.weights_proj",
 
58545
  "model.layers.71.mlp.gate",
58546
  "model.layers.72.mlp.gate",
58547
  "model.layers.73.mlp.gate",
58548
  "model.layers.74.mlp.gate",
58549
  "model.layers.74.self_attn.indexer.weights_proj",
 
58550
  "model.layers.75.mlp.gate",
58551
  "model.layers.76.mlp.gate",
58552
  "model.layers.77.mlp.gate",
58553
  "model.layers.78.mlp.gate",
58554
  "model.layers.78.self_attn.indexer.weights_proj",
 
58555
  "model.layers.8.mlp.gate",
58556
  "model.layers.9.mlp.gate"
58557
  ],
 
58451
  "model.layers.0.mlp.gate_proj",
58452
  "model.layers.0.mlp.up_proj",
58453
  "model.layers.0.self_attn.indexer.weights_proj",
58454
+ "model.layers.0.self_attn.indexer.wk",
58455
  "model.layers.1.mlp.down_proj",
58456
  "model.layers.1.mlp.gate_proj",
58457
  "model.layers.1.mlp.up_proj",
58458
  "model.layers.1.self_attn.indexer.weights_proj",
58459
+ "model.layers.1.self_attn.indexer.wk",
58460
  "model.layers.10.mlp.gate",
58461
  "model.layers.10.self_attn.indexer.weights_proj",
58462
+ "model.layers.10.self_attn.indexer.wk",
58463
  "model.layers.11.mlp.gate",
58464
  "model.layers.12.mlp.gate",
58465
  "model.layers.13.mlp.gate",
58466
  "model.layers.14.mlp.gate",
58467
  "model.layers.14.self_attn.indexer.weights_proj",
58468
+ "model.layers.14.self_attn.indexer.wk",
58469
  "model.layers.15.mlp.gate",
58470
  "model.layers.16.mlp.gate",
58471
  "model.layers.17.mlp.gate",
58472
  "model.layers.18.mlp.gate",
58473
  "model.layers.18.self_attn.indexer.weights_proj",
58474
+ "model.layers.18.self_attn.indexer.wk",
58475
  "model.layers.19.mlp.gate",
58476
  "model.layers.2.mlp.down_proj",
58477
  "model.layers.2.mlp.gate_proj",
58478
  "model.layers.2.mlp.up_proj",
58479
  "model.layers.2.self_attn.indexer.weights_proj",
58480
+ "model.layers.2.self_attn.indexer.wk",
58481
  "model.layers.20.mlp.gate",
58482
  "model.layers.21.mlp.gate",
58483
  "model.layers.22.mlp.gate",
58484
  "model.layers.22.self_attn.indexer.weights_proj",
58485
+ "model.layers.22.self_attn.indexer.wk",
58486
  "model.layers.23.mlp.gate",
58487
  "model.layers.24.mlp.gate",
58488
  "model.layers.25.mlp.gate",
58489
  "model.layers.26.mlp.gate",
58490
  "model.layers.26.self_attn.indexer.weights_proj",
58491
+ "model.layers.26.self_attn.indexer.wk",
58492
  "model.layers.27.mlp.gate",
58493
  "model.layers.28.mlp.gate",
58494
  "model.layers.29.mlp.gate",
58495
  "model.layers.3.mlp.gate",
58496
  "model.layers.30.mlp.gate",
58497
  "model.layers.30.self_attn.indexer.weights_proj",
58498
+ "model.layers.30.self_attn.indexer.wk",
58499
  "model.layers.31.mlp.gate",
58500
  "model.layers.32.mlp.gate",
58501
  "model.layers.33.mlp.gate",
58502
  "model.layers.34.mlp.gate",
58503
  "model.layers.34.self_attn.indexer.weights_proj",
58504
+ "model.layers.34.self_attn.indexer.wk",
58505
  "model.layers.35.mlp.gate",
58506
  "model.layers.36.mlp.gate",
58507
  "model.layers.37.mlp.gate",
58508
  "model.layers.38.mlp.gate",
58509
  "model.layers.38.self_attn.indexer.weights_proj",
58510
+ "model.layers.38.self_attn.indexer.wk",
58511
  "model.layers.39.mlp.gate",
58512
  "model.layers.4.mlp.gate",
58513
  "model.layers.40.mlp.gate",
58514
  "model.layers.41.mlp.gate",
58515
  "model.layers.42.mlp.gate",
58516
  "model.layers.42.self_attn.indexer.weights_proj",
58517
+ "model.layers.42.self_attn.indexer.wk",
58518
  "model.layers.43.mlp.gate",
58519
  "model.layers.44.mlp.gate",
58520
  "model.layers.45.mlp.gate",
58521
  "model.layers.46.mlp.gate",
58522
  "model.layers.46.self_attn.indexer.weights_proj",
58523
+ "model.layers.46.self_attn.indexer.wk",
58524
  "model.layers.47.mlp.gate",
58525
  "model.layers.48.mlp.gate",
58526
  "model.layers.49.mlp.gate",
58527
  "model.layers.5.mlp.gate",
58528
  "model.layers.50.mlp.gate",
58529
  "model.layers.50.self_attn.indexer.weights_proj",
58530
+ "model.layers.50.self_attn.indexer.wk",
58531
  "model.layers.51.mlp.gate",
58532
  "model.layers.52.mlp.gate",
58533
  "model.layers.53.mlp.gate",
58534
  "model.layers.54.mlp.gate",
58535
  "model.layers.54.self_attn.indexer.weights_proj",
58536
+ "model.layers.54.self_attn.indexer.wk",
58537
  "model.layers.55.mlp.gate",
58538
  "model.layers.56.mlp.gate",
58539
  "model.layers.57.mlp.gate",
58540
  "model.layers.58.mlp.gate",
58541
  "model.layers.58.self_attn.indexer.weights_proj",
58542
+ "model.layers.58.self_attn.indexer.wk",
58543
  "model.layers.59.mlp.gate",
58544
  "model.layers.6.mlp.gate",
58545
  "model.layers.6.self_attn.indexer.weights_proj",
58546
+ "model.layers.6.self_attn.indexer.wk",
58547
  "model.layers.60.mlp.gate",
58548
  "model.layers.61.mlp.gate",
58549
  "model.layers.62.mlp.gate",
58550
  "model.layers.62.self_attn.indexer.weights_proj",
58551
+ "model.layers.62.self_attn.indexer.wk",
58552
  "model.layers.63.mlp.gate",
58553
  "model.layers.64.mlp.gate",
58554
  "model.layers.65.mlp.gate",
58555
  "model.layers.66.mlp.gate",
58556
  "model.layers.66.self_attn.indexer.weights_proj",
58557
+ "model.layers.66.self_attn.indexer.wk",
58558
  "model.layers.67.mlp.gate",
58559
  "model.layers.68.mlp.gate",
58560
  "model.layers.69.mlp.gate",
58561
  "model.layers.7.mlp.gate",
58562
  "model.layers.70.mlp.gate",
58563
  "model.layers.70.self_attn.indexer.weights_proj",
58564
+ "model.layers.70.self_attn.indexer.wk",
58565
  "model.layers.71.mlp.gate",
58566
  "model.layers.72.mlp.gate",
58567
  "model.layers.73.mlp.gate",
58568
  "model.layers.74.mlp.gate",
58569
  "model.layers.74.self_attn.indexer.weights_proj",
58570
+ "model.layers.74.self_attn.indexer.wk",
58571
  "model.layers.75.mlp.gate",
58572
  "model.layers.76.mlp.gate",
58573
  "model.layers.77.mlp.gate",
58574
  "model.layers.78.mlp.gate",
58575
  "model.layers.78.self_attn.indexer.weights_proj",
58576
+ "model.layers.78.self_attn.indexer.wk",
58577
  "model.layers.8.mlp.gate",
58578
  "model.layers.9.mlp.gate"
58579
  ],