karim155 commited on
Commit
0de430a
·
verified ·
1 Parent(s): ec02065

Training in progress, epoch 0

Browse files
all_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 2.4,
3
- "total_flos": 9545499876261888.0,
4
- "train_loss": 1.3307077884674072,
5
- "train_runtime": 26.0882,
6
- "train_samples_per_second": 18.399,
7
- "train_steps_per_second": 0.115
8
  }
 
1
  {
2
+ "epoch": 2.88,
3
+ "total_flos": 5.727299925757133e+16,
4
+ "train_loss": 1.1426812807718914,
5
+ "train_runtime": 417.2641,
6
+ "train_samples_per_second": 5.752,
7
+ "train_steps_per_second": 0.043
8
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6848aa2e2e2108126b7410ebeaf4967496a1eae7e865db546a85d7145c7acfbc
3
  size 110352060
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:18c3cb66951c057e21db0ced12483119238a8131cae523c129e0294c76353d67
3
  size 110352060
runs/Aug18_23-53-31_e8f7099b712a/events.out.tfevents.1724025679.e8f7099b712a.297.4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fc3f5402c97bd97e19525e86a5aff25eb522efd6878d1dda91fb7e8fae6a094e
3
+ size 404
runs/Aug19_00-04-27_e8f7099b712a/events.out.tfevents.1724025873.e8f7099b712a.297.5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4eda5c25b905500eca524d41a7034fe7ea2c82043e5d6065fc21252b3b4b1bfa
3
+ size 5878
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 2.4,
3
- "total_flos": 9545499876261888.0,
4
- "train_loss": 1.3307077884674072,
5
- "train_runtime": 26.0882,
6
- "train_samples_per_second": 18.399,
7
- "train_steps_per_second": 0.115
8
  }
 
1
  {
2
+ "epoch": 2.88,
3
+ "total_flos": 5.727299925757133e+16,
4
+ "train_loss": 1.1426812807718914,
5
+ "train_runtime": 417.2641,
6
+ "train_samples_per_second": 5.752,
7
+ "train_steps_per_second": 0.043
8
  }
trainer_state.json CHANGED
@@ -1,61 +1,68 @@
1
  {
2
- "best_metric": 1.3222624063491821,
3
- "best_model_checkpoint": "swin-tiny-patch4-window7-224-finetuned/checkpoint-3",
4
- "epoch": 2.4,
5
  "eval_steps": 500,
6
- "global_step": 3,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
- "epoch": 0.8,
13
  "eval_accuracy": {
14
- "accuracy": 0.425
15
  },
16
- "eval_logLoss": 1.452716588973999,
17
- "eval_loss": 1.452716588973999,
18
- "eval_runtime": 0.9167,
19
- "eval_samples_per_second": 43.635,
20
- "eval_steps_per_second": 2.182,
21
- "step": 1
22
  },
23
  {
24
  "epoch": 1.6,
 
 
 
 
 
 
 
25
  "eval_accuracy": {
26
- "accuracy": 0.4
27
  },
28
- "eval_logLoss": 1.3229997158050537,
29
- "eval_loss": 1.3229997158050537,
30
- "eval_runtime": 0.7445,
31
- "eval_samples_per_second": 53.725,
32
- "eval_steps_per_second": 2.686,
33
- "step": 2
34
  },
35
  {
36
- "epoch": 2.4,
37
  "eval_accuracy": {
38
- "accuracy": 0.425
39
  },
40
- "eval_logLoss": 1.3222624063491821,
41
- "eval_loss": 1.3222624063491821,
42
- "eval_runtime": 1.3083,
43
- "eval_samples_per_second": 30.575,
44
- "eval_steps_per_second": 1.529,
45
- "step": 3
46
  },
47
  {
48
- "epoch": 2.4,
49
- "step": 3,
50
- "total_flos": 9545499876261888.0,
51
- "train_loss": 1.3307077884674072,
52
- "train_runtime": 26.0882,
53
- "train_samples_per_second": 18.399,
54
- "train_steps_per_second": 0.115
55
  }
56
  ],
57
  "logging_steps": 10,
58
- "max_steps": 3,
59
  "num_input_tokens_seen": 0,
60
  "num_train_epochs": 3,
61
  "save_steps": 500,
@@ -71,7 +78,7 @@
71
  "attributes": {}
72
  }
73
  },
74
- "total_flos": 9545499876261888.0,
75
  "train_batch_size": 32,
76
  "trial_name": null,
77
  "trial_params": null
 
1
  {
2
+ "best_metric": 1.0755484104156494,
3
+ "best_model_checkpoint": "swin-tiny-patch4-window7-224-finetuned/checkpoint-18",
4
+ "epoch": 2.88,
5
  "eval_steps": 500,
6
+ "global_step": 18,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
+ "epoch": 0.96,
13
  "eval_accuracy": {
14
+ "accuracy": 0.415
15
  },
16
+ "eval_logLoss": 1.196082353591919,
17
+ "eval_loss": 1.196082592010498,
18
+ "eval_runtime": 68.3725,
19
+ "eval_samples_per_second": 2.925,
20
+ "eval_steps_per_second": 0.102,
21
+ "step": 6
22
  },
23
  {
24
  "epoch": 1.6,
25
+ "grad_norm": 3.4481194019317627,
26
+ "learning_rate": 2.5e-05,
27
+ "loss": 1.2502,
28
+ "step": 10
29
+ },
30
+ {
31
+ "epoch": 1.92,
32
  "eval_accuracy": {
33
+ "accuracy": 0.49
34
  },
35
+ "eval_logLoss": 1.0786902904510498,
36
+ "eval_loss": 1.0786901712417603,
37
+ "eval_runtime": 4.6591,
38
+ "eval_samples_per_second": 42.927,
39
+ "eval_steps_per_second": 1.502,
40
+ "step": 12
41
  },
42
  {
43
+ "epoch": 2.88,
44
  "eval_accuracy": {
45
+ "accuracy": 0.48
46
  },
47
+ "eval_logLoss": 1.0755484104156494,
48
+ "eval_loss": 1.0755484104156494,
49
+ "eval_runtime": 4.8873,
50
+ "eval_samples_per_second": 40.922,
51
+ "eval_steps_per_second": 1.432,
52
+ "step": 18
53
  },
54
  {
55
+ "epoch": 2.88,
56
+ "step": 18,
57
+ "total_flos": 5.727299925757133e+16,
58
+ "train_loss": 1.1426812807718914,
59
+ "train_runtime": 417.2641,
60
+ "train_samples_per_second": 5.752,
61
+ "train_steps_per_second": 0.043
62
  }
63
  ],
64
  "logging_steps": 10,
65
+ "max_steps": 18,
66
  "num_input_tokens_seen": 0,
67
  "num_train_epochs": 3,
68
  "save_steps": 500,
 
78
  "attributes": {}
79
  }
80
  },
81
+ "total_flos": 5.727299925757133e+16,
82
  "train_batch_size": 32,
83
  "trial_name": null,
84
  "trial_params": null
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b8795c87ce3fac9f300c8d1c5eca4ea67de143dd1e0c834e5d2939f25395beb7
3
  size 5240
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:776601c03cf5d73011085c6726d5efd93d6819be3f8baa0b4540e1fb6b0763b7
3
  size 5240