File size: 2,247 Bytes
ca3eb55
e2ed871
d971e79
 
ca3eb55
 
e2ed871
ca3eb55
 
 
 
e2ed871
 
d971e79
e2ed871
d971e79
e2ed871
 
 
 
d971e79
e2ed871
d971e79
e2ed871
 
 
 
d971e79
e2ed871
d971e79
e2ed871
 
 
 
d971e79
e2ed871
d971e79
e2ed871
 
 
 
d971e79
e2ed871
d971e79
e2ed871
 
 
 
d971e79
e2ed871
d971e79
e2ed871
 
ca3eb55
 
d971e79
13ecce3
d971e79
 
 
 
 
 
 
e2ed871
ca3eb55
 
 
e2ed871
ca3eb55
 
 
 
 
 
 
 
 
 
 
 
 
 
 
498ff8d
ca3eb55
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
{
  "best_global_step": 315,
  "best_metric": 0.3333333333333333,
  "best_model_checkpoint": "/home/kat/git-repos/icse/results/rsa/20-05-2025:14-47-09/checkpoint-315",
  "epoch": 1.0,
  "eval_steps": 500,
  "global_step": 315,
  "is_hyper_param_search": false,
  "is_local_process_zero": true,
  "is_world_process_zero": true,
  "log_history": [
    {
      "epoch": 0.15873015873015872,
      "grad_norm": 3.1602320671081543,
      "learning_rate": 1.688888888888889e-05,
      "loss": 0.7162,
      "step": 50
    },
    {
      "epoch": 0.31746031746031744,
      "grad_norm": 3.1608448028564453,
      "learning_rate": 1.3714285714285716e-05,
      "loss": 0.7011,
      "step": 100
    },
    {
      "epoch": 0.47619047619047616,
      "grad_norm": 3.158813238143921,
      "learning_rate": 1.053968253968254e-05,
      "loss": 0.7355,
      "step": 150
    },
    {
      "epoch": 0.6349206349206349,
      "grad_norm": 2.464698553085327,
      "learning_rate": 7.3650793650793666e-06,
      "loss": 0.6762,
      "step": 200
    },
    {
      "epoch": 0.7936507936507936,
      "grad_norm": 3.153306007385254,
      "learning_rate": 4.190476190476191e-06,
      "loss": 0.7057,
      "step": 250
    },
    {
      "epoch": 0.9523809523809523,
      "grad_norm": 3.15567684173584,
      "learning_rate": 1.015873015873016e-06,
      "loss": 0.6662,
      "step": 300
    },
    {
      "epoch": 1.0,
      "eval_accuracy": 0.5,
      "eval_balanced_accuracy": 0.0,
      "eval_f1_score": 0.3333333333333333,
      "eval_loss": 0.7008427381515503,
      "eval_precision": 0.25,
      "eval_recall": 0.5,
      "eval_runtime": 2.266,
      "eval_samples_per_second": 28.243,
      "eval_steps_per_second": 28.243,
      "step": 315
    }
  ],
  "logging_steps": 50,
  "max_steps": 315,
  "num_input_tokens_seen": 0,
  "num_train_epochs": 1,
  "save_steps": 500,
  "stateful_callbacks": {
    "TrainerControl": {
      "args": {
        "should_epoch_stop": false,
        "should_evaluate": false,
        "should_log": false,
        "should_save": true,
        "should_training_stop": true
      },
      "attributes": {}
    }
  },
  "total_flos": 120596908320.0,
  "train_batch_size": 1,
  "trial_name": null,
  "trial_params": null
}