File size: 2,202 Bytes
3d972cf
 
 
 
 
 
 
 
 
 
 
 
10c5ca9
3d972cf
10c5ca9
3d972cf
 
 
 
10c5ca9
3d972cf
10c5ca9
3d972cf
 
 
 
10c5ca9
3d972cf
10c5ca9
3d972cf
 
 
 
10c5ca9
 
 
 
3d972cf
 
 
 
10c5ca9
3d972cf
10c5ca9
3d972cf
 
 
 
10c5ca9
3d972cf
10c5ca9
3d972cf
 
 
 
10c5ca9
3d972cf
10c5ca9
3d972cf
 
 
 
10c5ca9
 
 
 
3d972cf
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
10c5ca9
3d972cf
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
{
  "best_metric": null,
  "best_model_checkpoint": null,
  "epoch": 0.0037203534335761897,
  "eval_steps": 3,
  "global_step": 6,
  "is_hyper_param_search": false,
  "is_local_process_zero": true,
  "is_world_process_zero": true,
  "log_history": [
    {
      "epoch": 0.0006200589055960316,
      "grad_norm": 0.5875879526138306,
      "learning_rate": 4.000000000000001e-06,
      "loss": 1.179,
      "step": 1
    },
    {
      "epoch": 0.0012401178111920632,
      "grad_norm": 0.2559925317764282,
      "learning_rate": 8.000000000000001e-06,
      "loss": 0.9296,
      "step": 2
    },
    {
      "epoch": 0.0018601767167880949,
      "grad_norm": 0.27975356578826904,
      "learning_rate": 1.2e-05,
      "loss": 0.8212,
      "step": 3
    },
    {
      "epoch": 0.0018601767167880949,
      "eval_loss": 1.0227885246276855,
      "eval_runtime": 47.9985,
      "eval_samples_per_second": 2.083,
      "eval_steps_per_second": 2.083,
      "step": 3
    },
    {
      "epoch": 0.0024802356223841263,
      "grad_norm": 0.4077853858470917,
      "learning_rate": 1.6000000000000003e-05,
      "loss": 0.9553,
      "step": 4
    },
    {
      "epoch": 0.0031002945279801583,
      "grad_norm": 0.3481099307537079,
      "learning_rate": 2e-05,
      "loss": 0.8071,
      "step": 5
    },
    {
      "epoch": 0.0037203534335761897,
      "grad_norm": 0.33538541197776794,
      "learning_rate": 1.9200000000000003e-05,
      "loss": 0.9046,
      "step": 6
    },
    {
      "epoch": 0.0037203534335761897,
      "eval_loss": 1.0122885704040527,
      "eval_runtime": 48.1202,
      "eval_samples_per_second": 2.078,
      "eval_steps_per_second": 2.078,
      "step": 6
    }
  ],
  "logging_steps": 1,
  "max_steps": 30,
  "num_input_tokens_seen": 0,
  "num_train_epochs": 1,
  "save_steps": 3,
  "stateful_callbacks": {
    "TrainerControl": {
      "args": {
        "should_epoch_stop": false,
        "should_evaluate": false,
        "should_log": false,
        "should_save": true,
        "should_training_stop": false
      },
      "attributes": {}
    }
  },
  "total_flos": 1.422690662363136e+16,
  "train_batch_size": 2,
  "trial_name": null,
  "trial_params": null
}