Leonardo6 commited on
Commit
fee7921
·
verified ·
1 Parent(s): 6e0c121

Training in progress, epoch 1, checkpoint

Browse files
checkpoint-10/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0eeecf463da622ccf14842969df7287560061d79e2a45259d31e7ff666b2bb02
3
+ size 1214121120
checkpoint-10/trainer_state.json ADDED
@@ -0,0 +1,113 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_global_step": null,
3
+ "best_metric": null,
4
+ "best_model_checkpoint": null,
5
+ "epoch": 1.0,
6
+ "eval_steps": 500,
7
+ "global_step": 10,
8
+ "is_hyper_param_search": false,
9
+ "is_local_process_zero": true,
10
+ "is_world_process_zero": true,
11
+ "log_history": [
12
+ {
13
+ "epoch": 0.1,
14
+ "grad_norm": 4.817715644836426,
15
+ "learning_rate": 0.0,
16
+ "loss": 2.4596,
17
+ "step": 1
18
+ },
19
+ {
20
+ "epoch": 0.2,
21
+ "grad_norm": 4.894565105438232,
22
+ "learning_rate": 3.3333333333333335e-05,
23
+ "loss": 2.468,
24
+ "step": 2
25
+ },
26
+ {
27
+ "epoch": 0.3,
28
+ "grad_norm": 4.599151134490967,
29
+ "learning_rate": 6.666666666666667e-05,
30
+ "loss": 2.4369,
31
+ "step": 3
32
+ },
33
+ {
34
+ "epoch": 0.4,
35
+ "grad_norm": 4.634383678436279,
36
+ "learning_rate": 0.0001,
37
+ "loss": 2.4219,
38
+ "step": 4
39
+ },
40
+ {
41
+ "epoch": 0.5,
42
+ "grad_norm": 4.405484676361084,
43
+ "learning_rate": 9.997377845227576e-05,
44
+ "loss": 2.3884,
45
+ "step": 5
46
+ },
47
+ {
48
+ "epoch": 0.6,
49
+ "grad_norm": 4.227508068084717,
50
+ "learning_rate": 9.989514131188559e-05,
51
+ "loss": 2.3539,
52
+ "step": 6
53
+ },
54
+ {
55
+ "epoch": 0.7,
56
+ "grad_norm": 3.989192247390747,
57
+ "learning_rate": 9.97641710583307e-05,
58
+ "loss": 2.3132,
59
+ "step": 7
60
+ },
61
+ {
62
+ "epoch": 0.8,
63
+ "grad_norm": 3.904679775238037,
64
+ "learning_rate": 9.958100506132127e-05,
65
+ "loss": 2.2919,
66
+ "step": 8
67
+ },
68
+ {
69
+ "epoch": 0.9,
70
+ "grad_norm": 3.8267431259155273,
71
+ "learning_rate": 9.934583543669453e-05,
72
+ "loss": 2.2709,
73
+ "step": 9
74
+ },
75
+ {
76
+ "epoch": 1.0,
77
+ "grad_norm": 3.6127519607543945,
78
+ "learning_rate": 9.905890884491195e-05,
79
+ "loss": 2.2313,
80
+ "step": 10
81
+ },
82
+ {
83
+ "epoch": 1.0,
84
+ "eval_accuracy": 0.1856,
85
+ "eval_loss": 2.2107839584350586,
86
+ "eval_runtime": 18.3869,
87
+ "eval_samples_per_second": 543.864,
88
+ "eval_steps_per_second": 0.109,
89
+ "step": 10
90
+ }
91
+ ],
92
+ "logging_steps": 1,
93
+ "max_steps": 100,
94
+ "num_input_tokens_seen": 0,
95
+ "num_train_epochs": 10,
96
+ "save_steps": 1,
97
+ "stateful_callbacks": {
98
+ "TrainerControl": {
99
+ "args": {
100
+ "should_epoch_stop": false,
101
+ "should_evaluate": false,
102
+ "should_log": false,
103
+ "should_save": true,
104
+ "should_training_stop": false
105
+ },
106
+ "attributes": {}
107
+ }
108
+ },
109
+ "total_flos": 0.0,
110
+ "train_batch_size": 512,
111
+ "trial_name": null,
112
+ "trial_params": null
113
+ }
checkpoint-10/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8791579e23520b4bd71b23dd7de782fc70967c05dcdd1d44ffc944f00ab7f116
3
+ size 5777