Hanhpt23 committed on
Commit
b3ed003
·
verified ·
1 Parent(s): 13c3a95

Hanhpt23/Clip-Soil-patch32

Browse files
Files changed (5) hide show
  1. README.md +2 -0
  2. all_results.json +10 -10
  3. eval_results.json +5 -5
  4. train_results.json +6 -6
  5. trainer_state.json +62 -13
README.md CHANGED
@@ -13,6 +13,8 @@ should probably proofread and complete it, then remove this comment. -->
13
  # Clip-Soil-patch32
14
 
15
  This model is a fine-tuned version of [openai/clip-vit-base-patch32](https://huggingface.co/openai/clip-vit-base-patch32) on an unknown dataset.
 
 
16
 
17
  ## Model description
18
 
 
13
  # Clip-Soil-patch32
14
 
15
  This model is a fine-tuned version of [openai/clip-vit-base-patch32](https://huggingface.co/openai/clip-vit-base-patch32) on an unknown dataset.
16
+ It achieves the following results on the evaluation set:
17
+ - Loss: 5.9887
18
 
19
  ## Model description
20
 
all_results.json CHANGED
@@ -1,12 +1,12 @@
1
  {
2
- "epoch": 1.0,
3
- "eval_loss": 1.8086835145950317,
4
- "eval_runtime": 2.0062,
5
- "eval_samples_per_second": 33.894,
6
- "eval_steps_per_second": 4.486,
7
- "total_flos": 35598202755192.0,
8
- "train_loss": 2.0196751185825894,
9
- "train_runtime": 33.4326,
10
- "train_samples_per_second": 18.305,
11
- "train_steps_per_second": 2.303
12
  }
 
1
  {
2
+ "epoch": 50.0,
3
+ "eval_loss": 5.988685131072998,
4
+ "eval_runtime": 0.9434,
5
+ "eval_samples_per_second": 72.078,
6
+ "eval_steps_per_second": 9.54,
7
+ "total_flos": 1779910137759600.0,
8
+ "train_loss": 0.6525665847976486,
9
+ "train_runtime": 847.6015,
10
+ "train_samples_per_second": 36.102,
11
+ "train_steps_per_second": 4.542
12
  }
eval_results.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
- "epoch": 1.0,
3
- "eval_loss": 1.8086835145950317,
4
- "eval_runtime": 2.0062,
5
- "eval_samples_per_second": 33.894,
6
- "eval_steps_per_second": 4.486
7
  }
 
1
  {
2
+ "epoch": 50.0,
3
+ "eval_loss": 5.988685131072998,
4
+ "eval_runtime": 0.9434,
5
+ "eval_samples_per_second": 72.078,
6
+ "eval_steps_per_second": 9.54
7
  }
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 1.0,
3
- "total_flos": 35598202755192.0,
4
- "train_loss": 2.0196751185825894,
5
- "train_runtime": 33.4326,
6
- "train_samples_per_second": 18.305,
7
- "train_steps_per_second": 2.303
8
  }
 
1
  {
2
+ "epoch": 50.0,
3
+ "total_flos": 1779910137759600.0,
4
+ "train_loss": 0.6525665847976486,
5
+ "train_runtime": 847.6015,
6
+ "train_samples_per_second": 36.102,
7
+ "train_steps_per_second": 4.542
8
  }
trainer_state.json CHANGED
@@ -1,27 +1,76 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 1.0,
5
  "eval_steps": 500,
6
- "global_step": 77,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
- "epoch": 1.0,
13
- "step": 77,
14
- "total_flos": 35598202755192.0,
15
- "train_loss": 2.0196751185825894,
16
- "train_runtime": 33.4326,
17
- "train_samples_per_second": 18.305,
18
- "train_steps_per_second": 2.303
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
19
  }
20
  ],
21
  "logging_steps": 500,
22
- "max_steps": 77,
23
  "num_input_tokens_seen": 0,
24
- "num_train_epochs": 1,
25
  "save_steps": 500,
26
  "stateful_callbacks": {
27
  "TrainerControl": {
@@ -29,13 +78,13 @@
29
  "should_epoch_stop": false,
30
  "should_evaluate": false,
31
  "should_log": false,
32
- "should_save": false,
33
  "should_training_stop": false
34
  },
35
  "attributes": {}
36
  }
37
  },
38
- "total_flos": 35598202755192.0,
39
  "train_batch_size": 8,
40
  "trial_name": null,
41
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 50.0,
5
  "eval_steps": 500,
6
+ "global_step": 3850,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
+ "epoch": 6.4935064935064934,
13
+ "grad_norm": 17.624969482421875,
14
+ "learning_rate": 4.3506493506493503e-05,
15
+ "loss": 1.7452,
16
+ "step": 500
17
+ },
18
+ {
19
+ "epoch": 12.987012987012987,
20
+ "grad_norm": 15.936542510986328,
21
+ "learning_rate": 3.701298701298702e-05,
22
+ "loss": 1.1727,
23
+ "step": 1000
24
+ },
25
+ {
26
+ "epoch": 19.48051948051948,
27
+ "grad_norm": 22.365955352783203,
28
+ "learning_rate": 3.051948051948052e-05,
29
+ "loss": 0.8119,
30
+ "step": 1500
31
+ },
32
+ {
33
+ "epoch": 25.974025974025974,
34
+ "grad_norm": 19.36739730834961,
35
+ "learning_rate": 2.4025974025974027e-05,
36
+ "loss": 0.5254,
37
+ "step": 2000
38
+ },
39
+ {
40
+ "epoch": 32.467532467532465,
41
+ "grad_norm": 4.489462852478027,
42
+ "learning_rate": 1.7532467532467535e-05,
43
+ "loss": 0.3811,
44
+ "step": 2500
45
+ },
46
+ {
47
+ "epoch": 38.96103896103896,
48
+ "grad_norm": 0.12353431433439255,
49
+ "learning_rate": 1.103896103896104e-05,
50
+ "loss": 0.2244,
51
+ "step": 3000
52
+ },
53
+ {
54
+ "epoch": 45.45454545454545,
55
+ "grad_norm": 4.508783340454102,
56
+ "learning_rate": 4.5454545454545455e-06,
57
+ "loss": 0.1191,
58
+ "step": 3500
59
+ },
60
+ {
61
+ "epoch": 50.0,
62
+ "step": 3850,
63
+ "total_flos": 1779910137759600.0,
64
+ "train_loss": 0.6525665847976486,
65
+ "train_runtime": 847.6015,
66
+ "train_samples_per_second": 36.102,
67
+ "train_steps_per_second": 4.542
68
  }
69
  ],
70
  "logging_steps": 500,
71
+ "max_steps": 3850,
72
  "num_input_tokens_seen": 0,
73
+ "num_train_epochs": 50,
74
  "save_steps": 500,
75
  "stateful_callbacks": {
76
  "TrainerControl": {
 
78
  "should_epoch_stop": false,
79
  "should_evaluate": false,
80
  "should_log": false,
81
+ "should_save": true,
82
  "should_training_stop": false
83
  },
84
  "attributes": {}
85
  }
86
  },
87
+ "total_flos": 1779910137759600.0,
88
  "train_batch_size": 8,
89
  "trial_name": null,
90
  "trial_params": null