File size: 1,838 Bytes
a71298e
 
 
29a82e4
 
a71298e
 
 
 
 
 
 
29a82e4
 
a71298e
 
 
29a82e4
 
 
a71298e
 
 
29a82e4
 
 
a71298e
 
 
29a82e4
 
 
a71298e
 
 
29a82e4
 
 
a71298e
 
 
29a82e4
 
 
a71298e
 
 
29a82e4
 
 
a71298e
 
 
29a82e4
 
 
a71298e
 
 
29a82e4
 
 
a71298e
 
 
29a82e4
 
 
a71298e
 
 
29a82e4
15616f9
29a82e4
 
 
 
a71298e
 
 
29a82e4
 
 
 
a71298e
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
{
  "best_metric": null,
  "best_model_checkpoint": null,
  "epoch": 0.2455795677799607,
  "eval_steps": 500,
  "global_step": 500,
  "is_hyper_param_search": false,
  "is_local_process_zero": true,
  "is_world_process_zero": true,
  "log_history": [
    {
      "epoch": 0.02,
      "learning_rate": 8.999464304375242e-06,
      "loss": 0.7019,
      "step": 50
    },
    {
      "epoch": 0.05,
      "learning_rate": 8.997857345043108e-06,
      "loss": 0.6739,
      "step": 100
    },
    {
      "epoch": 0.07,
      "learning_rate": 8.99517950459963e-06,
      "loss": 0.6677,
      "step": 150
    },
    {
      "epoch": 0.1,
      "learning_rate": 8.99143142060366e-06,
      "loss": 0.6625,
      "step": 200
    },
    {
      "epoch": 0.12,
      "learning_rate": 8.98661398542506e-06,
      "loss": 0.6649,
      "step": 250
    },
    {
      "epoch": 0.15,
      "learning_rate": 8.980728346032255e-06,
      "loss": 0.6528,
      "step": 300
    },
    {
      "epoch": 0.17,
      "learning_rate": 8.973775903719142e-06,
      "loss": 0.6442,
      "step": 350
    },
    {
      "epoch": 0.2,
      "learning_rate": 8.965758313771466e-06,
      "loss": 0.6375,
      "step": 400
    },
    {
      "epoch": 0.22,
      "learning_rate": 8.956677485072722e-06,
      "loss": 0.6303,
      "step": 450
    },
    {
      "epoch": 0.25,
      "learning_rate": 8.946535579649664e-06,
      "loss": 0.634,
      "step": 500
    },
    {
      "epoch": 0.25,
      "eval_accuracy": 0.0,
      "eval_loss": 0.6457224488258362,
      "eval_runtime": 154.2695,
      "eval_samples_per_second": 87.989,
      "eval_steps_per_second": 14.669,
      "step": 500
    }
  ],
  "logging_steps": 50,
  "max_steps": 10180,
  "num_train_epochs": 5,
  "save_steps": 500,
  "total_flos": 0.0,
  "trial_name": null,
  "trial_params": null
}