CatkinChen committed on
Commit
cb22ec8
·
verified ·
1 Parent(s): 48bc857

Add training data

Browse files
Files changed (1) hide show
  1. training_data.json +15 -39
training_data.json CHANGED
@@ -1,37 +1,13 @@
1
  {
2
  "train_losses": [
3
- 8522.687722167968,
4
- 5948.037609863281,
5
- 5299.650319824219,
6
- 5164.902270507812,
7
- 5124.975241699219,
8
- 4882.509072265625,
9
- 4695.139870605469,
10
- 4494.95626953125,
11
- 3769.9364306640623,
12
- 3455.5234362792967,
13
- 3113.4037646484376,
14
- 2894.6963244628905,
15
- 2755.5655737304687,
16
- 2669.2157153320313,
17
- 2610.3932897949217
18
  ],
19
  "test_losses": [
20
- 5174.157824707031,
21
- 4697.121484375,
22
- 4170.104797363281,
23
- 4119.477563476563,
24
- 4505.739526367188,
25
- 4108.995947265625,
26
- 4981.743469238281,
27
- 4981.943542480469,
28
- 5563.02421875,
29
- 6102.1019287109375,
30
- 6386.164367675781,
31
- 6654.9200439453125,
32
- 7023.874938964844,
33
- 7218.628796386719,
34
- 7328.070239257812
35
  ],
36
  "config": {
37
  "epochs": 15,
@@ -50,7 +26,7 @@
50
  "initial_dw_beta": 0.02,
51
  "final_dw_beta": 1.0,
52
  "dw_beta_shape": "linear",
53
- "warmup_epoch_ratio": 0.4
54
  },
55
  "free_bits": 0.15,
56
  "focal_loss_alpha": 0.75,
@@ -59,16 +35,16 @@
59
  "enable_dropout_on_latent": true,
60
  "enable_dropout_on_decoder": true,
61
  "early_stopping": {
62
- "enabled": false,
63
  "patience": 3,
64
  "min_delta": 0.01,
65
- "triggered": false,
66
- "best_epoch": null
67
  }
68
  },
69
- "final_train_loss": 2610.3932897949217,
70
- "final_test_loss": 7328.070239257812,
71
- "total_epochs": 15,
72
- "best_train_loss": 2610.3932897949217,
73
- "best_test_loss": 4108.995947265625
74
  }
 
1
  {
2
  "train_losses": [
3
+ 8604.43171875,
4
+ 5975.3112109375,
5
+ 5188.482888183594
 
 
 
 
 
 
 
 
 
 
 
 
6
  ],
7
  "test_losses": [
8
+ 5092.959655761719,
9
+ 4591.594555664063,
10
+ 4268.6180419921875
 
 
 
 
 
 
 
 
 
 
 
 
11
  ],
12
  "config": {
13
  "epochs": 15,
 
26
  "initial_dw_beta": 0.02,
27
  "final_dw_beta": 1.0,
28
  "dw_beta_shape": "linear",
29
+ "warmup_epoch_ratio": 0.2
30
  },
31
  "free_bits": 0.15,
32
  "focal_loss_alpha": 0.75,
 
35
  "enable_dropout_on_latent": true,
36
  "enable_dropout_on_decoder": true,
37
  "early_stopping": {
38
+ "enabled": true,
39
  "patience": 3,
40
  "min_delta": 0.01,
41
+ "triggered": true,
42
+ "best_epoch": 3
43
  }
44
  },
45
+ "final_train_loss": 5188.482888183594,
46
+ "final_test_loss": 4268.6180419921875,
47
+ "total_epochs": 3,
48
+ "best_train_loss": 5188.482888183594,
49
+ "best_test_loss": 4268.6180419921875
50
  }