emdemor committed on
Commit
0c905a5
·
verified ·
1 Parent(s): bb35aaf

Training in progress, step 10

Browse files
Files changed (3) hide show
  1. adapter_model.safetensors +1 -1
  2. state.json +7 -98
  3. training_args.bin +1 -1
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:79a7f9067104ba188f808a51c9fa02a0efe307c1fa192f76821eb446bfdce94c
3
  size 35668592
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1a4ee09134693faa7983f5fe727d61f4d6dca23f0ebcf928a221772b3ae314f8
3
  size 35668592
state.json CHANGED
@@ -1,108 +1,17 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 1.0,
5
  "eval_steps": 20,
6
- "global_step": 125,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
- "log_history": [
11
- {
12
- "epoch": 0.16,
13
- "grad_norm": 0.02559720166027546,
14
- "learning_rate": 9.375e-05,
15
- "loss": 1.9237,
16
- "step": 20
17
- },
18
- {
19
- "epoch": 0.16,
20
- "eval_loss": 1.8701050281524658,
21
- "eval_runtime": 294.1893,
22
- "eval_samples_per_second": 3.399,
23
- "eval_steps_per_second": 0.425,
24
- "step": 20
25
- },
26
- {
27
- "epoch": 0.32,
28
- "grad_norm": 0.07340741157531738,
29
- "learning_rate": 7.589285714285714e-05,
30
- "loss": 1.8479,
31
- "step": 40
32
- },
33
- {
34
- "epoch": 0.32,
35
- "eval_loss": 1.7706382274627686,
36
- "eval_runtime": 296.242,
37
- "eval_samples_per_second": 3.376,
38
- "eval_steps_per_second": 0.422,
39
- "step": 40
40
- },
41
- {
42
- "epoch": 0.48,
43
- "grad_norm": 0.08102620393037796,
44
- "learning_rate": 5.803571428571429e-05,
45
- "loss": 1.7419,
46
- "step": 60
47
- },
48
- {
49
- "epoch": 0.48,
50
- "eval_loss": 1.6613901853561401,
51
- "eval_runtime": 295.5311,
52
- "eval_samples_per_second": 3.384,
53
- "eval_steps_per_second": 0.423,
54
- "step": 60
55
- },
56
- {
57
- "epoch": 0.64,
58
- "grad_norm": 0.07056039571762085,
59
- "learning_rate": 4.107142857142857e-05,
60
- "loss": 1.674,
61
- "step": 80
62
- },
63
- {
64
- "epoch": 0.64,
65
- "eval_loss": 1.6176079511642456,
66
- "eval_runtime": 295.123,
67
- "eval_samples_per_second": 3.388,
68
- "eval_steps_per_second": 0.424,
69
- "step": 80
70
- },
71
- {
72
- "epoch": 0.8,
73
- "grad_norm": 0.06708831340074539,
74
- "learning_rate": 2.3214285714285715e-05,
75
- "loss": 1.6024,
76
- "step": 100
77
- },
78
- {
79
- "epoch": 0.8,
80
- "eval_loss": 1.5983840227127075,
81
- "eval_runtime": 296.3017,
82
- "eval_samples_per_second": 3.375,
83
- "eval_steps_per_second": 0.422,
84
- "step": 100
85
- },
86
- {
87
- "epoch": 0.96,
88
- "grad_norm": 0.07054605334997177,
89
- "learning_rate": 5.357142857142857e-06,
90
- "loss": 1.6203,
91
- "step": 120
92
- },
93
- {
94
- "epoch": 0.96,
95
- "eval_loss": 1.5859812498092651,
96
- "eval_runtime": 295.6456,
97
- "eval_samples_per_second": 3.382,
98
- "eval_steps_per_second": 0.423,
99
- "step": 120
100
- }
101
- ],
102
  "logging_steps": 20,
103
- "max_steps": 125,
104
  "num_input_tokens_seen": 0,
105
- "num_train_epochs": 1,
106
  "save_steps": 10,
107
  "stateful_callbacks": {
108
  "TrainerControl": {
@@ -110,13 +19,13 @@
110
  "should_epoch_stop": false,
111
  "should_evaluate": false,
112
  "should_log": false,
113
- "should_save": true,
114
  "should_training_stop": false
115
  },
116
  "attributes": {}
117
  }
118
  },
119
- "total_flos": 9518169977733120.0,
120
  "train_batch_size": 8,
121
  "trial_name": null,
122
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.08,
5
  "eval_steps": 20,
6
+ "global_step": 10,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
+ "log_history": [],
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
11
  "logging_steps": 20,
12
+ "max_steps": 375,
13
  "num_input_tokens_seen": 0,
14
+ "num_train_epochs": 3,
15
  "save_steps": 10,
16
  "stateful_callbacks": {
17
  "TrainerControl": {
 
19
  "should_epoch_stop": false,
20
  "should_evaluate": false,
21
  "should_log": false,
22
+ "should_save": false,
23
  "should_training_stop": false
24
  },
25
  "attributes": {}
26
  }
27
  },
28
+ "total_flos": 0,
29
  "train_batch_size": 8,
30
  "trial_name": null,
31
  "trial_params": null
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:225e3f04ba656cad0bf2fa42949f5c5d1fb5107f8809a23333b8bb9683442f0f
3
  size 5432
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d5d622493f1ded4a4395a8a495be5ddb356e13976d1325eca2493ea80f1c746a
3
  size 5432