djbp committed on
Commit
bce2193
·
verified ·
1 Parent(s): 09b2431

Training in progress, epoch 0

Browse files
all_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 8.0,
3
+ "total_flos": 1.9019421639416218e+17,
4
+ "train_loss": 2.6748404184977215,
5
+ "train_runtime": 2549.9123,
6
+ "train_samples_per_second": 3.749,
7
+ "train_steps_per_second": 0.012
8
+ }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:25adb1edd66215e1b4d731172fa87a7a4bb17ee0eb7d6015e40489d246080efb
3
  size 110398208
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:42758b103584d7cd49e63d3200625149d08137738e98ac59919396a9c4543afe
3
  size 110398208
runs/Jun27_07-26-45_c34ae8869574/events.out.tfevents.1719473207.c34ae8869574 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d648d825f11a0f482c52834586004804142e6de17315cfdd8187a4cc50b09eab
3
+ size 6361
runs/Jun27_07-36-11_c34ae8869574/events.out.tfevents.1719473776.c34ae8869574 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e771d4fc84d7ef0510c2f960aa174702843210a2b72ac09e24b62452a3811b55
3
+ size 7810
runs/Jun27_08-42-01_c3df91dfd599/events.out.tfevents.1719477728.c3df91dfd599 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2df81a7c4b1e1c5ef573f25786ff8164f9a2ae8763c0e33d957af5a9dbcd851e
3
+ size 6361
runs/Jun27_08-47-10_c3df91dfd599/events.out.tfevents.1719478034.c3df91dfd599 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b27dfcc0f4bc79894355421baa1e1b5f0306303b969d23024ae16878488efec0
3
+ size 8273
runs/Jun27_10-04-20_79e23ecbe329/events.out.tfevents.1719482662.79e23ecbe329 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d5c54d33a013507f6b06a4f04ca62301966108b0db4420afd425e0e14f9597ea
3
+ size 8224
train_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 8.0,
3
+ "total_flos": 1.9019421639416218e+17,
4
+ "train_loss": 2.6748404184977215,
5
+ "train_runtime": 2549.9123,
6
+ "train_samples_per_second": 3.749,
7
+ "train_steps_per_second": 0.012
8
+ }
trainer_state.json ADDED
@@ -0,0 +1,135 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.30022075055187636,
3
+ "best_model_checkpoint": "swin-tiny-patch4-window7-224-category-classification/checkpoint-26",
4
+ "epoch": 8.0,
5
+ "eval_steps": 500,
6
+ "global_step": 30,
7
+ "is_hyper_param_search": false,
8
+ "is_local_process_zero": true,
9
+ "is_world_process_zero": true,
10
+ "log_history": [
11
+ {
12
+ "epoch": 0.8,
13
+ "eval_accuracy": 0.05518763796909492,
14
+ "eval_loss": 3.007758617401123,
15
+ "eval_runtime": 188.9532,
16
+ "eval_samples_per_second": 4.795,
17
+ "eval_steps_per_second": 0.079,
18
+ "step": 3
19
+ },
20
+ {
21
+ "epoch": 1.8666666666666667,
22
+ "eval_accuracy": 0.1280353200883002,
23
+ "eval_loss": 2.8865292072296143,
24
+ "eval_runtime": 166.273,
25
+ "eval_samples_per_second": 5.449,
26
+ "eval_steps_per_second": 0.09,
27
+ "step": 7
28
+ },
29
+ {
30
+ "epoch": 2.6666666666666665,
31
+ "grad_norm": 4.288784980773926,
32
+ "learning_rate": 3.7037037037037037e-05,
33
+ "loss": 2.9474,
34
+ "step": 10
35
+ },
36
+ {
37
+ "epoch": 2.9333333333333336,
38
+ "eval_accuracy": 0.19646799116997793,
39
+ "eval_loss": 2.7917754650115967,
40
+ "eval_runtime": 156.11,
41
+ "eval_samples_per_second": 5.804,
42
+ "eval_steps_per_second": 0.096,
43
+ "step": 11
44
+ },
45
+ {
46
+ "epoch": 4.0,
47
+ "eval_accuracy": 0.23620309050772628,
48
+ "eval_loss": 2.694143056869507,
49
+ "eval_runtime": 155.6836,
50
+ "eval_samples_per_second": 5.819,
51
+ "eval_steps_per_second": 0.096,
52
+ "step": 15
53
+ },
54
+ {
55
+ "epoch": 4.8,
56
+ "eval_accuracy": 0.2582781456953642,
57
+ "eval_loss": 2.628232002258301,
58
+ "eval_runtime": 148.8415,
59
+ "eval_samples_per_second": 6.087,
60
+ "eval_steps_per_second": 0.101,
61
+ "step": 18
62
+ },
63
+ {
64
+ "epoch": 5.333333333333333,
65
+ "grad_norm": 4.339354515075684,
66
+ "learning_rate": 1.8518518518518518e-05,
67
+ "loss": 2.645,
68
+ "step": 20
69
+ },
70
+ {
71
+ "epoch": 5.866666666666667,
72
+ "eval_accuracy": 0.282560706401766,
73
+ "eval_loss": 2.5581247806549072,
74
+ "eval_runtime": 155.1024,
75
+ "eval_samples_per_second": 5.841,
76
+ "eval_steps_per_second": 0.097,
77
+ "step": 22
78
+ },
79
+ {
80
+ "epoch": 6.933333333333334,
81
+ "eval_accuracy": 0.30022075055187636,
82
+ "eval_loss": 2.515105962753296,
83
+ "eval_runtime": 149.6803,
84
+ "eval_samples_per_second": 6.053,
85
+ "eval_steps_per_second": 0.1,
86
+ "step": 26
87
+ },
88
+ {
89
+ "epoch": 8.0,
90
+ "grad_norm": 4.57526159286499,
91
+ "learning_rate": 0.0,
92
+ "loss": 2.4321,
93
+ "step": 30
94
+ },
95
+ {
96
+ "epoch": 8.0,
97
+ "eval_accuracy": 0.2980132450331126,
98
+ "eval_loss": 2.4982221126556396,
99
+ "eval_runtime": 169.9225,
100
+ "eval_samples_per_second": 5.332,
101
+ "eval_steps_per_second": 0.088,
102
+ "step": 30
103
+ },
104
+ {
105
+ "epoch": 8.0,
106
+ "step": 30,
107
+ "total_flos": 1.9019421639416218e+17,
108
+ "train_loss": 2.6748404184977215,
109
+ "train_runtime": 2549.9123,
110
+ "train_samples_per_second": 3.749,
111
+ "train_steps_per_second": 0.012
112
+ }
113
+ ],
114
+ "logging_steps": 10,
115
+ "max_steps": 30,
116
+ "num_input_tokens_seen": 0,
117
+ "num_train_epochs": 10,
118
+ "save_steps": 500,
119
+ "stateful_callbacks": {
120
+ "TrainerControl": {
121
+ "args": {
122
+ "should_epoch_stop": false,
123
+ "should_evaluate": false,
124
+ "should_log": false,
125
+ "should_save": true,
126
+ "should_training_stop": true
127
+ },
128
+ "attributes": {}
129
+ }
130
+ },
131
+ "total_flos": 1.9019421639416218e+17,
132
+ "train_batch_size": 64,
133
+ "trial_name": null,
134
+ "trial_params": null
135
+ }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3e5163abb6b92fa6e78aff6612725e85119767ac2a5b4d32eb6967c07c80cc20
3
  size 4731
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8f70c68887969d626f0f5fbfe9b053bb1874e07deaf580b932ca8af4ac3c26a5
3
  size 4731