Frinkles committed on
Commit
5f4e888
·
1 Parent(s): 4947329

initial_commit

Browse files
adapter_config.json CHANGED
@@ -21,9 +21,9 @@
21
  "revision": null,
22
  "target_modules": [
23
  "o_proj",
 
24
  "down_proj",
25
- "gate_up_proj",
26
- "qkv_proj"
27
  ],
28
  "task_type": "CAUSAL_LM",
29
  "use_dora": false,
 
21
  "revision": null,
22
  "target_modules": [
23
  "o_proj",
24
+ "qkv_proj",
25
  "down_proj",
26
+ "gate_up_proj"
 
27
  ],
28
  "task_type": "CAUSAL_LM",
29
  "use_dora": false,
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:509e03e583766096cb2af316df026b5160028032ac428d01fc9ab3221c1165e7
3
- size 50366024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:904ea480c61175d5fbe5c84367c1e51a5010c8f504e277f776237204a2b683c7
3
+ size 50366280
all_results.json DELETED
@@ -1,8 +0,0 @@
1
- {
2
- "epoch": 1.0,
3
- "total_flos": 3.1269503354535936e+16,
4
- "train_loss": 0.19359449498793657,
5
- "train_runtime": 1514.0603,
6
- "train_samples_per_second": 0.448,
7
- "train_steps_per_second": 0.112
8
- }
 
 
 
 
 
 
 
 
 
train_results.json DELETED
@@ -1,8 +0,0 @@
1
- {
2
- "epoch": 1.0,
3
- "total_flos": 3.1269503354535936e+16,
4
- "train_loss": 0.19359449498793657,
5
- "train_runtime": 1514.0603,
6
- "train_samples_per_second": 0.448,
7
- "train_steps_per_second": 0.112
8
- }
 
 
 
 
 
 
 
 
 
trainer_state.json DELETED
@@ -1,63 +0,0 @@
1
- {
2
- "best_metric": null,
3
- "best_model_checkpoint": null,
4
- "epoch": 1.0,
5
- "eval_steps": 500,
6
- "global_step": 170,
7
- "is_hyper_param_search": false,
8
- "is_local_process_zero": true,
9
- "is_world_process_zero": true,
10
- "log_history": [
11
- {
12
- "epoch": 0.29411764705882354,
13
- "grad_norm": NaN,
14
- "learning_rate": 4.83118057351089e-06,
15
- "loss": 0.6582,
16
- "step": 50
17
- },
18
- {
19
- "epoch": 0.5882352941176471,
20
- "grad_norm": NaN,
21
- "learning_rate": 2.6154586466143495e-06,
22
- "loss": 0.0,
23
- "step": 100
24
- },
25
- {
26
- "epoch": 0.8823529411764706,
27
- "grad_norm": NaN,
28
- "learning_rate": 2.620917716123444e-07,
29
- "loss": 0.0,
30
- "step": 150
31
- },
32
- {
33
- "epoch": 1.0,
34
- "step": 170,
35
- "total_flos": 3.1269503354535936e+16,
36
- "train_loss": 0.19359449498793657,
37
- "train_runtime": 1514.0603,
38
- "train_samples_per_second": 0.448,
39
- "train_steps_per_second": 0.112
40
- }
41
- ],
42
- "logging_steps": 50,
43
- "max_steps": 170,
44
- "num_input_tokens_seen": 0,
45
- "num_train_epochs": 1,
46
- "save_steps": 500,
47
- "stateful_callbacks": {
48
- "TrainerControl": {
49
- "args": {
50
- "should_epoch_stop": false,
51
- "should_evaluate": false,
52
- "should_log": false,
53
- "should_save": false,
54
- "should_training_stop": false
55
- },
56
- "attributes": {}
57
- }
58
- },
59
- "total_flos": 3.1269503354535936e+16,
60
- "train_batch_size": 4,
61
- "trial_name": null,
62
- "trial_params": null
63
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4844ff749272ef526f5f855db84ae0970596b037c1465ab89ba72153131c3b54
3
  size 5112
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bc2992b67251b74348a9756b8ed81c43339f905493587d245a0a389be273b198
3
  size 5112