CatkinChen commited on
Commit
9fe6ce1
·
verified ·
1 Parent(s): 00405b9

Add training data

Browse files
Files changed (1) hide show
  1. training_data.json +63 -44
training_data.json CHANGED
@@ -1,63 +1,82 @@
1
  {
2
  "train_losses": [
3
- 8840.943349609375,
4
- 5997.839943847656,
5
- 5144.925102539062,
6
- 5292.724506835937,
7
- 4626.860837402343,
8
- 4236.542509765625,
9
- 3929.224425048828,
10
- 3200.1126879882813,
11
- 2780.4872631835938,
12
- 2538.591198730469,
13
- 2381.423229980469,
14
- 2263.6071203613283,
15
- 2203.3307653808592,
16
- 2151.2380603027345,
17
- 2110.144202880859
18
  ],
19
  "test_losses": [
20
- 5255.883227539062,
21
- 4322.146154785156,
22
- 4260.568579101562,
23
- 4361.874780273438,
24
- 4510.580639648438,
25
- 5458.825817871094,
26
- 6068.390393066406,
27
- 6140.3800048828125,
28
- 6816.257507324219,
29
- 7403.943029785156,
30
- 8169.396142578125,
31
- 8850.116650390624,
32
- 8851.075305175782,
33
- 8749.574572753907,
34
- 9020.297473144532
35
  ],
36
  "config": {
37
  "epochs": 15,
38
- "batch_size": 1024,
39
  "max_learning_rate": 0.001,
40
  "sequence_size": 32,
41
  "shuffle_batches": true,
42
  "shuffle_within_batch": true,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
43
  "adaptive_weighting": {
44
  "initial_mi_beta": 0.0,
45
  "final_mi_beta": 0.0,
46
  "mi_beta_shape": "constant",
47
- "initial_tc_beta": 5.0,
48
- "final_tc_beta": 5.0,
49
  "tc_beta_shape": "constant",
50
- "initial_dw_beta": 0.02,
51
  "final_dw_beta": 1.0,
52
  "dw_beta_shape": "linear",
53
  "warmup_epoch_ratio": 0.2
54
  },
55
- "free_bits": 0.15,
56
- "focal_loss_alpha": 0.75,
57
- "focal_loss_gamma": 2.0,
58
- "dropout_rate": 0.1,
59
- "enable_dropout_on_latent": true,
60
- "enable_dropout_on_decoder": true,
 
61
  "early_stopping": {
62
  "enabled": false,
63
  "patience": 3,
@@ -66,9 +85,9 @@
66
  "best_epoch": null
67
  }
68
  },
69
- "final_train_loss": 2110.144202880859,
70
- "final_test_loss": 9020.297473144532,
71
  "total_epochs": 15,
72
- "best_train_loss": 2110.144202880859,
73
- "best_test_loss": 4260.568579101562
74
  }
 
1
  {
2
  "train_losses": [
3
+ 158443.7097314453,
4
+ 79525.31055175781,
5
+ 55150.76360839844,
6
+ 27544.720600585937,
7
+ 21215.07262207031,
8
+ 15201.550209960937,
9
+ 17076.67155517578,
10
+ 13131.717595214845,
11
+ 11821.861442871093,
12
+ 11532.774877929687,
13
+ 12098.519575195312,
14
+ 10800.846364746094,
15
+ 11168.50675048828,
16
+ 11143.719829101563,
17
+ 10742.088754882812
18
  ],
19
  "test_losses": [
20
+ 38101.2255859375,
21
+ 32535.043115234374,
22
+ 12535.003198242188,
23
+ 7116.39462890625,
24
+ 8404.210815429688,
25
+ 5529.595751953125,
26
+ 5309.565930175781,
27
+ 5373.602978515625,
28
+ 5507.798205566406,
29
+ 5121.186975097657,
30
+ 4946.643518066407,
31
+ 4945.580090332031,
32
+ 5142.907373046875,
33
+ 5019.152258300781,
34
+ 4867.249340820313
35
  ],
36
  "config": {
37
  "epochs": 15,
38
+ "batch_size": 32,
39
  "max_learning_rate": 0.001,
40
  "sequence_size": 32,
41
  "shuffle_batches": true,
42
  "shuffle_within_batch": true,
43
+ "vae_config": {
44
+ "latent_dim": 96,
45
+ "encoder_dropout": 0.1,
46
+ "decoder_dropout": 0.1,
47
+ "initial_mi_beta": 0.0,
48
+ "final_mi_beta": 0.0,
49
+ "mi_beta_shape": "constant",
50
+ "initial_tc_beta": 10.0,
51
+ "final_tc_beta": 10.0,
52
+ "tc_beta_shape": "constant",
53
+ "initial_dw_beta": 0.2,
54
+ "final_dw_beta": 1.0,
55
+ "dw_beta_shape": "linear",
56
+ "warmup_epoch_ratio": 0.2,
57
+ "free_bits": 0.15,
58
+ "focal_loss_alpha": 0.5,
59
+ "focal_loss_gamma": 2.0
60
+ },
61
  "adaptive_weighting": {
62
  "initial_mi_beta": 0.0,
63
  "final_mi_beta": 0.0,
64
  "mi_beta_shape": "constant",
65
+ "initial_tc_beta": 10.0,
66
+ "final_tc_beta": 10.0,
67
  "tc_beta_shape": "constant",
68
+ "initial_dw_beta": 0.2,
69
  "final_dw_beta": 1.0,
70
  "dw_beta_shape": "linear",
71
  "warmup_epoch_ratio": 0.2
72
  },
73
+ "regularization": {
74
+ "encoder_dropout": 0.1,
75
+ "decoder_dropout": 0.1,
76
+ "free_bits": 0.15,
77
+ "focal_loss_alpha": 0.5,
78
+ "focal_loss_gamma": 2.0
79
+ },
80
  "early_stopping": {
81
  "enabled": false,
82
  "patience": 3,
 
85
  "best_epoch": null
86
  }
87
  },
88
+ "final_train_loss": 10742.088754882812,
89
+ "final_test_loss": 4867.249340820313,
90
  "total_epochs": 15,
91
+ "best_train_loss": 10742.088754882812,
92
+ "best_test_loss": 4867.249340820313
93
  }