File size: 2,201 Bytes
76e7554
 
 
 
 
 
 
 
 
 
 
 
1f64eba
76e7554
1f64eba
76e7554
 
 
 
1f64eba
76e7554
1f64eba
76e7554
 
 
 
1f64eba
76e7554
1f64eba
76e7554
 
 
 
1f64eba
 
 
 
76e7554
 
 
 
1f64eba
76e7554
1f64eba
76e7554
 
 
 
1f64eba
76e7554
1f64eba
76e7554
 
 
 
1f64eba
76e7554
1f64eba
76e7554
 
 
 
1f64eba
 
 
 
76e7554
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1f64eba
76e7554
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
{
  "best_metric": null,
  "best_model_checkpoint": null,
  "epoch": 0.0037203534335761897,
  "eval_steps": 3,
  "global_step": 6,
  "is_hyper_param_search": false,
  "is_local_process_zero": true,
  "is_world_process_zero": true,
  "log_history": [
    {
      "epoch": 0.0006200589055960316,
      "grad_norm": 0.16878783702850342,
      "learning_rate": 4.000000000000001e-06,
      "loss": 0.9729,
      "step": 1
    },
    {
      "epoch": 0.0012401178111920632,
      "grad_norm": 0.0865061804652214,
      "learning_rate": 8.000000000000001e-06,
      "loss": 0.6661,
      "step": 2
    },
    {
      "epoch": 0.0018601767167880949,
      "grad_norm": 0.0920981764793396,
      "learning_rate": 1.2e-05,
      "loss": 0.5954,
      "step": 3
    },
    {
      "epoch": 0.0018601767167880949,
      "eval_loss": 0.762992262840271,
      "eval_runtime": 33.3972,
      "eval_samples_per_second": 2.994,
      "eval_steps_per_second": 2.994,
      "step": 3
    },
    {
      "epoch": 0.0024802356223841263,
      "grad_norm": 0.10451442003250122,
      "learning_rate": 1.6000000000000003e-05,
      "loss": 0.7227,
      "step": 4
    },
    {
      "epoch": 0.0031002945279801583,
      "grad_norm": 0.11351602524518967,
      "learning_rate": 2e-05,
      "loss": 0.5719,
      "step": 5
    },
    {
      "epoch": 0.0037203534335761897,
      "grad_norm": 0.12484906613826752,
      "learning_rate": 1.9200000000000003e-05,
      "loss": 0.6972,
      "step": 6
    },
    {
      "epoch": 0.0037203534335761897,
      "eval_loss": 0.7615777850151062,
      "eval_runtime": 33.3804,
      "eval_samples_per_second": 2.996,
      "eval_steps_per_second": 2.996,
      "step": 6
    }
  ],
  "logging_steps": 1,
  "max_steps": 30,
  "num_input_tokens_seen": 0,
  "num_train_epochs": 1,
  "save_steps": 3,
  "stateful_callbacks": {
    "TrainerControl": {
      "args": {
        "should_epoch_stop": false,
        "should_evaluate": false,
        "should_log": false,
        "should_save": true,
        "should_training_stop": false
      },
      "attributes": {}
    }
  },
  "total_flos": 8918117859115008.0,
  "train_batch_size": 2,
  "trial_name": null,
  "trial_params": null
}