karim155 committed on
Commit
e2e7dd5
·
verified ·
1 Parent(s): 80e1c4c

Training in progress, epoch 0

Browse files
all_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 2.88,
3
- "total_flos": 5.727299925757133e+16,
4
- "train_loss": 1.1426812807718914,
5
- "train_runtime": 417.2641,
6
- "train_samples_per_second": 5.752,
7
- "train_steps_per_second": 0.043
8
  }
 
1
  {
2
  "epoch": 2.88,
3
+ "total_flos": 1.1454599851514266e+17,
4
+ "train_loss": 1.034223583009508,
5
+ "train_runtime": 597.4423,
6
+ "train_samples_per_second": 8.034,
7
+ "train_steps_per_second": 0.06
8
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2754a8794b28d4f477531124bf80b3acd335749104df0ab90e4530c0be87d992
3
  size 110352060
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:873780e294ef91fadba6ed031eaa71831cac484c699d9fc97b30c7e7a1644225
3
  size 110352060
runs/Aug19_00-04-27_e8f7099b712a/events.out.tfevents.1724026490.e8f7099b712a.297.6 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:db92d3350eeb0bfbc07ae235a95a047573e5fd3788e7e20d8b3bea3beb3e7037
3
+ size 404
runs/Aug19_00-20-42_e8f7099b712a/events.out.tfevents.1724026848.e8f7099b712a.297.7 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3e83c9f698580c30e14d8710a7b3546e16687d9d064198ca4258142c4a8e658e
3
+ size 6292
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 2.88,
3
- "total_flos": 5.727299925757133e+16,
4
- "train_loss": 1.1426812807718914,
5
- "train_runtime": 417.2641,
6
- "train_samples_per_second": 5.752,
7
- "train_steps_per_second": 0.043
8
  }
 
1
  {
2
  "epoch": 2.88,
3
+ "total_flos": 1.1454599851514266e+17,
4
+ "train_loss": 1.034223583009508,
5
+ "train_runtime": 597.4423,
6
+ "train_samples_per_second": 8.034,
7
+ "train_steps_per_second": 0.06
8
  }
trainer_state.json CHANGED
@@ -1,68 +1,82 @@
1
  {
2
- "best_metric": 1.0755484104156494,
3
- "best_model_checkpoint": "swin-tiny-patch4-window7-224-finetuned/checkpoint-18",
4
  "epoch": 2.88,
5
  "eval_steps": 500,
6
- "global_step": 18,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
 
 
 
 
 
 
 
11
  {
12
  "epoch": 0.96,
13
  "eval_accuracy": {
14
- "accuracy": 0.415
15
  },
16
- "eval_logLoss": 1.196082353591919,
17
- "eval_loss": 1.196082592010498,
18
- "eval_runtime": 68.3725,
19
- "eval_samples_per_second": 2.925,
20
- "eval_steps_per_second": 0.102,
21
- "step": 6
22
  },
23
  {
24
  "epoch": 1.6,
25
- "grad_norm": 3.4481194019317627,
26
  "learning_rate": 2.5e-05,
27
- "loss": 1.2502,
28
- "step": 10
29
  },
30
  {
31
- "epoch": 1.92,
32
  "eval_accuracy": {
33
- "accuracy": 0.49
34
  },
35
- "eval_logLoss": 1.0786902904510498,
36
- "eval_loss": 1.0786901712417603,
37
- "eval_runtime": 4.6591,
38
- "eval_samples_per_second": 42.927,
39
- "eval_steps_per_second": 1.502,
40
- "step": 12
 
 
 
 
 
 
 
41
  },
42
  {
43
  "epoch": 2.88,
44
  "eval_accuracy": {
45
- "accuracy": 0.48
46
  },
47
- "eval_logLoss": 1.0755484104156494,
48
- "eval_loss": 1.0755484104156494,
49
- "eval_runtime": 4.8873,
50
- "eval_samples_per_second": 40.922,
51
- "eval_steps_per_second": 1.432,
52
- "step": 18
53
  },
54
  {
55
  "epoch": 2.88,
56
- "step": 18,
57
- "total_flos": 5.727299925757133e+16,
58
- "train_loss": 1.1426812807718914,
59
- "train_runtime": 417.2641,
60
- "train_samples_per_second": 5.752,
61
- "train_steps_per_second": 0.043
62
  }
63
  ],
64
  "logging_steps": 10,
65
- "max_steps": 18,
66
  "num_input_tokens_seen": 0,
67
  "num_train_epochs": 3,
68
  "save_steps": 500,
@@ -78,7 +92,7 @@
78
  "attributes": {}
79
  }
80
  },
81
- "total_flos": 5.727299925757133e+16,
82
  "train_batch_size": 32,
83
  "trial_name": null,
84
  "trial_params": null
 
1
  {
2
+ "best_metric": 0.871762752532959,
3
+ "best_model_checkpoint": "swin-tiny-patch4-window7-224-finetuned/checkpoint-25",
4
  "epoch": 2.88,
5
  "eval_steps": 500,
6
+ "global_step": 36,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
+ {
12
+ "epoch": 0.8,
13
+ "grad_norm": 5.137752532958984,
14
+ "learning_rate": 4.0625000000000005e-05,
15
+ "loss": 1.2933,
16
+ "step": 10
17
+ },
18
  {
19
  "epoch": 0.96,
20
  "eval_accuracy": {
21
+ "accuracy": 0.5525
22
  },
23
+ "eval_logLoss": 1.009933590888977,
24
+ "eval_loss": 1.0099334716796875,
25
+ "eval_runtime": 92.538,
26
+ "eval_samples_per_second": 4.323,
27
+ "eval_steps_per_second": 0.14,
28
+ "step": 12
29
  },
30
  {
31
  "epoch": 1.6,
32
+ "grad_norm": 4.288869857788086,
33
  "learning_rate": 2.5e-05,
34
+ "loss": 0.9637,
35
+ "step": 20
36
  },
37
  {
38
+ "epoch": 2.0,
39
  "eval_accuracy": {
40
+ "accuracy": 0.6125
41
  },
42
+ "eval_logLoss": 0.871762752532959,
43
+ "eval_loss": 0.871762752532959,
44
+ "eval_runtime": 9.6171,
45
+ "eval_samples_per_second": 41.593,
46
+ "eval_steps_per_second": 1.352,
47
+ "step": 25
48
+ },
49
+ {
50
+ "epoch": 2.4,
51
+ "grad_norm": 6.406833171844482,
52
+ "learning_rate": 9.375000000000001e-06,
53
+ "loss": 0.9461,
54
+ "step": 30
55
  },
56
  {
57
  "epoch": 2.88,
58
  "eval_accuracy": {
59
+ "accuracy": 0.6225
60
  },
61
+ "eval_logLoss": 0.8781986236572266,
62
+ "eval_loss": 0.8781986832618713,
63
+ "eval_runtime": 10.2528,
64
+ "eval_samples_per_second": 39.014,
65
+ "eval_steps_per_second": 1.268,
66
+ "step": 36
67
  },
68
  {
69
  "epoch": 2.88,
70
+ "step": 36,
71
+ "total_flos": 1.1454599851514266e+17,
72
+ "train_loss": 1.034223583009508,
73
+ "train_runtime": 597.4423,
74
+ "train_samples_per_second": 8.034,
75
+ "train_steps_per_second": 0.06
76
  }
77
  ],
78
  "logging_steps": 10,
79
+ "max_steps": 36,
80
  "num_input_tokens_seen": 0,
81
  "num_train_epochs": 3,
82
  "save_steps": 500,
 
92
  "attributes": {}
93
  }
94
  },
95
+ "total_flos": 1.1454599851514266e+17,
96
  "train_batch_size": 32,
97
  "trial_name": null,
98
  "trial_params": null
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:776601c03cf5d73011085c6726d5efd93d6819be3f8baa0b4540e1fb6b0763b7
3
  size 5240
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9f0825e68bcb0186ea443bdd539e6b3ef6ceb12ea12325f938bafef7df257c92
3
  size 5240