Training in progress, step 90
Browse files- adapter_config.json +5 -5
- adapter_model.safetensors +1 -1
- dynamic_sampling_log.txt +91 -0
- tokenizer.json +2 -2
- training_args.bin +1 -1
adapter_config.json
CHANGED
|
@@ -29,13 +29,13 @@
|
|
| 29 |
"rank_pattern": {},
|
| 30 |
"revision": null,
|
| 31 |
"target_modules": [
|
| 32 |
-
"
|
| 33 |
-
"gate_proj",
|
| 34 |
-
"v_proj",
|
| 35 |
-
"up_proj",
|
| 36 |
"down_proj",
|
|
|
|
| 37 |
"q_proj",
|
| 38 |
-
"
|
|
|
|
|
|
|
| 39 |
],
|
| 40 |
"target_parameters": null,
|
| 41 |
"task_type": "CAUSAL_LM",
|
|
|
|
| 29 |
"rank_pattern": {},
|
| 30 |
"revision": null,
|
| 31 |
"target_modules": [
|
| 32 |
+
"k_proj",
|
|
|
|
|
|
|
|
|
|
| 33 |
"down_proj",
|
| 34 |
+
"gate_proj",
|
| 35 |
"q_proj",
|
| 36 |
+
"up_proj",
|
| 37 |
+
"v_proj",
|
| 38 |
+
"o_proj"
|
| 39 |
],
|
| 40 |
"target_parameters": null,
|
| 41 |
"task_type": "CAUSAL_LM",
|
adapter_model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 335605144
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:737947296bde632b56480be0a79326ce128a1469fd0749c69e5a1470288f632a
|
| 3 |
size 335605144
|
dynamic_sampling_log.txt
CHANGED
|
@@ -643,3 +643,94 @@ Step Attempts Total Prompts Valid Prompts Efficiency
|
|
| 643 |
79 1 6 6 100.0 %
|
| 644 |
79 2 12 6 50.0 %
|
| 645 |
79 5 30 6 20.0 %
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 643 |
79 1 6 6 100.0 %
|
| 644 |
79 2 12 6 50.0 %
|
| 645 |
79 5 30 6 20.0 %
|
| 646 |
+
80 3 18 6 33.3 %
|
| 647 |
+
80 5 30 6 20.0 %
|
| 648 |
+
80 3 18 6 33.3 %
|
| 649 |
+
80 4 24 6 25.0 %
|
| 650 |
+
80 2 12 6 50.0 %
|
| 651 |
+
80 2 12 6 50.0 %
|
| 652 |
+
80 5 30 6 20.0 %
|
| 653 |
+
80 2 12 6 50.0 %
|
| 654 |
+
81 7 42 6 14.3 %
|
| 655 |
+
81 5 30 6 20.0 %
|
| 656 |
+
81 3 18 6 33.3 %
|
| 657 |
+
80 3 18 6 33.3 %
|
| 658 |
+
80 8 48 6 12.5 %
|
| 659 |
+
80 3 18 6 33.3 %
|
| 660 |
+
80 4 24 6 25.0 %
|
| 661 |
+
80 5 30 6 20.0 %
|
| 662 |
+
80 2 12 6 50.0 %
|
| 663 |
+
80 2 12 6 50.0 %
|
| 664 |
+
80 1 6 6 100.0 %
|
| 665 |
+
81 2 12 6 50.0 %
|
| 666 |
+
81 9 54 6 11.1 %
|
| 667 |
+
81 3 18 6 33.3 %
|
| 668 |
+
81 5 30 6 20.0 %
|
| 669 |
+
81 5 30 6 20.0 %
|
| 670 |
+
81 2 12 6 50.0 %
|
| 671 |
+
81 3 18 6 33.3 %
|
| 672 |
+
81 1 6 6 100.0 %
|
| 673 |
+
82 3 18 6 33.3 %
|
| 674 |
+
82 2 12 6 50.0 %
|
| 675 |
+
82 2 12 6 50.0 %
|
| 676 |
+
82 1 6 6 100.0 %
|
| 677 |
+
82 1 6 6 100.0 %
|
| 678 |
+
82 10 60 6 10.0 %
|
| 679 |
+
82 6 36 6 16.7 %
|
| 680 |
+
82 3 18 6 33.3 %
|
| 681 |
+
83 1 6 6 100.0 %
|
| 682 |
+
83 6 36 6 16.7 %
|
| 683 |
+
83 15 90 6 6.7 %
|
| 684 |
+
83 3 18 6 33.3 %
|
| 685 |
+
83 5 30 6 20.0 %
|
| 686 |
+
83 6 36 6 16.7 %
|
| 687 |
+
83 2 12 6 50.0 %
|
| 688 |
+
83 4 24 6 25.0 %
|
| 689 |
+
84 3 18 6 33.3 %
|
| 690 |
+
84 1 6 6 100.0 %
|
| 691 |
+
84 8 48 6 12.5 %
|
| 692 |
+
84 4 24 6 25.0 %
|
| 693 |
+
84 5 30 6 20.0 %
|
| 694 |
+
84 4 24 6 25.0 %
|
| 695 |
+
84 4 24 6 25.0 %
|
| 696 |
+
84 2 12 6 50.0 %
|
| 697 |
+
85 6 36 6 16.7 %
|
| 698 |
+
85 1 6 6 100.0 %
|
| 699 |
+
85 6 36 6 16.7 %
|
| 700 |
+
85 2 12 6 50.0 %
|
| 701 |
+
85 8 48 6 12.5 %
|
| 702 |
+
85 2 12 6 50.0 %
|
| 703 |
+
85 5 30 6 20.0 %
|
| 704 |
+
85 6 36 6 16.7 %
|
| 705 |
+
86 1 6 6 100.0 %
|
| 706 |
+
86 1 6 6 100.0 %
|
| 707 |
+
86 4 24 6 25.0 %
|
| 708 |
+
86 4 24 6 25.0 %
|
| 709 |
+
86 3 18 6 33.3 %
|
| 710 |
+
86 3 18 6 33.3 %
|
| 711 |
+
86 12 72 6 8.3 %
|
| 712 |
+
86 2 12 6 50.0 %
|
| 713 |
+
87 8 48 6 12.5 %
|
| 714 |
+
87 3 18 6 33.3 %
|
| 715 |
+
87 4 24 6 25.0 %
|
| 716 |
+
87 1 6 6 100.0 %
|
| 717 |
+
87 9 54 6 11.1 %
|
| 718 |
+
87 5 30 6 20.0 %
|
| 719 |
+
87 2 12 6 50.0 %
|
| 720 |
+
87 3 18 6 33.3 %
|
| 721 |
+
88 7 42 6 14.3 %
|
| 722 |
+
88 4 24 6 25.0 %
|
| 723 |
+
88 8 48 6 12.5 %
|
| 724 |
+
88 1 6 6 100.0 %
|
| 725 |
+
88 2 12 6 50.0 %
|
| 726 |
+
88 12 72 6 8.3 %
|
| 727 |
+
88 5 30 6 20.0 %
|
| 728 |
+
88 2 12 6 50.0 %
|
| 729 |
+
89 3 18 6 33.3 %
|
| 730 |
+
89 7 42 6 14.3 %
|
| 731 |
+
89 4 24 6 25.0 %
|
| 732 |
+
89 1 6 6 100.0 %
|
| 733 |
+
89 3 18 6 33.3 %
|
| 734 |
+
89 4 24 6 25.0 %
|
| 735 |
+
89 5 30 6 20.0 %
|
| 736 |
+
89 2 12 6 50.0 %
|
tokenizer.json
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:26c881aaf4ef935b1516ec79ad6405dd2a459f2b5d431a8a4a1399c92f3ba022
|
| 3 |
+
size 17209711
|
training_args.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 8760
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7d4abf5569a8ae3268c6481567587fda25fb103630a3e2caf29b2a09eb6e76e2
|
| 3 |
size 8760
|