File size: 2,199 Bytes
069e657
 
 
 
 
 
 
 
 
 
 
 
70fd4ce
069e657
70fd4ce
069e657
 
 
 
70fd4ce
069e657
70fd4ce
069e657
 
 
 
70fd4ce
069e657
70fd4ce
069e657
 
 
 
70fd4ce
 
 
 
069e657
 
 
 
70fd4ce
069e657
70fd4ce
069e657
 
 
 
70fd4ce
069e657
70fd4ce
069e657
 
 
 
70fd4ce
069e657
70fd4ce
069e657
 
 
 
70fd4ce
 
 
 
069e657
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
70fd4ce
069e657
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
{
  "best_metric": null,
  "best_model_checkpoint": null,
  "epoch": 0.0037203534335761897,
  "eval_steps": 3,
  "global_step": 6,
  "is_hyper_param_search": false,
  "is_local_process_zero": true,
  "is_world_process_zero": true,
  "log_history": [
    {
      "epoch": 0.0006200589055960316,
      "grad_norm": 0.6006524562835693,
      "learning_rate": 4.000000000000001e-06,
      "loss": 1.4363,
      "step": 1
    },
    {
      "epoch": 0.0012401178111920632,
      "grad_norm": 0.4452102482318878,
      "learning_rate": 8.000000000000001e-06,
      "loss": 1.1641,
      "step": 2
    },
    {
      "epoch": 0.0018601767167880949,
      "grad_norm": 0.418393075466156,
      "learning_rate": 1.2e-05,
      "loss": 1.0005,
      "step": 3
    },
    {
      "epoch": 0.0018601767167880949,
      "eval_loss": 1.2559138536453247,
      "eval_runtime": 50.2632,
      "eval_samples_per_second": 1.99,
      "eval_steps_per_second": 1.99,
      "step": 3
    },
    {
      "epoch": 0.0024802356223841263,
      "grad_norm": 0.4599858820438385,
      "learning_rate": 1.6000000000000003e-05,
      "loss": 1.1938,
      "step": 4
    },
    {
      "epoch": 0.0031002945279801583,
      "grad_norm": 0.4313387870788574,
      "learning_rate": 2e-05,
      "loss": 0.9897,
      "step": 5
    },
    {
      "epoch": 0.0037203534335761897,
      "grad_norm": 0.4715091586112976,
      "learning_rate": 1.9200000000000003e-05,
      "loss": 1.1105,
      "step": 6
    },
    {
      "epoch": 0.0037203534335761897,
      "eval_loss": 1.2492942810058594,
      "eval_runtime": 49.6589,
      "eval_samples_per_second": 2.014,
      "eval_steps_per_second": 2.014,
      "step": 6
    }
  ],
  "logging_steps": 1,
  "max_steps": 30,
  "num_input_tokens_seen": 0,
  "num_train_epochs": 1,
  "save_steps": 3,
  "stateful_callbacks": {
    "TrainerControl": {
      "args": {
        "should_epoch_stop": false,
        "should_evaluate": false,
        "should_log": false,
        "should_save": true,
        "should_training_stop": false
      },
      "attributes": {}
    }
  },
  "total_flos": 1.4145485023690752e+16,
  "train_batch_size": 2,
  "trial_name": null,
  "trial_params": null
}