CatkinChen committed on
Commit
49ce502
·
verified ·
1 Parent(s): ac49d3a

Add training data

Browse files
Files changed (1) hide show
  1. training_data.json +44 -44
training_data.json CHANGED
@@ -1,37 +1,37 @@
1
  {
2
  "train_losses": [
3
- 158443.7097314453,
4
- 79525.31055175781,
5
- 55150.76360839844,
6
- 27544.720600585937,
7
- 21215.07262207031,
8
- 15201.550209960937,
9
- 17076.67155517578,
10
- 13131.717595214845,
11
- 11821.861442871093,
12
- 11532.774877929687,
13
- 12098.519575195312,
14
- 10800.846364746094,
15
- 11168.50675048828,
16
- 11143.719829101563,
17
- 10742.088754882812
18
  ],
19
  "test_losses": [
20
- 38101.2255859375,
21
- 32535.043115234374,
22
- 12535.003198242188,
23
- 7116.39462890625,
24
- 8404.210815429688,
25
- 5529.595751953125,
26
- 5309.565930175781,
27
- 5373.602978515625,
28
- 5507.798205566406,
29
- 5121.186975097657,
30
- 4946.643518066407,
31
- 4945.580090332031,
32
- 5142.907373046875,
33
- 5019.152258300781,
34
- 4867.249340820313
35
  ],
36
  "config": {
37
  "epochs": 15,
@@ -44,30 +44,30 @@
44
  "latent_dim": 96,
45
  "encoder_dropout": 0.1,
46
  "decoder_dropout": 0.1,
47
- "initial_mi_beta": 0.0,
48
- "final_mi_beta": 0.0,
49
  "mi_beta_shape": "constant",
50
- "initial_tc_beta": 10.0,
51
- "final_tc_beta": 10.0,
52
  "tc_beta_shape": "constant",
53
  "initial_dw_beta": 0.2,
54
  "final_dw_beta": 1.0,
55
- "dw_beta_shape": "linear",
56
  "warmup_epoch_ratio": 0.2,
57
  "free_bits": 0.15,
58
  "focal_loss_alpha": 0.5,
59
  "focal_loss_gamma": 2.0
60
  },
61
  "adaptive_weighting": {
62
- "initial_mi_beta": 0.0,
63
- "final_mi_beta": 0.0,
64
  "mi_beta_shape": "constant",
65
- "initial_tc_beta": 10.0,
66
- "final_tc_beta": 10.0,
67
  "tc_beta_shape": "constant",
68
  "initial_dw_beta": 0.2,
69
  "final_dw_beta": 1.0,
70
- "dw_beta_shape": "linear",
71
  "warmup_epoch_ratio": 0.2
72
  },
73
  "regularization": {
@@ -85,9 +85,9 @@
85
  "best_epoch": null
86
  }
87
  },
88
- "final_train_loss": 10742.088754882812,
89
- "final_test_loss": 4867.249340820313,
90
  "total_epochs": 15,
91
- "best_train_loss": 10742.088754882812,
92
- "best_test_loss": 4867.249340820313
93
  }
 
1
  {
2
  "train_losses": [
3
+ 151209.8428808594,
4
+ 96542.593515625,
5
+ 64421.11040039062,
6
+ 33749.90318359375,
7
+ 19004.055146484374,
8
+ 16831.15723876953,
9
+ 15080.03873046875,
10
+ 12901.305888671875,
11
+ 12439.551579589845,
12
+ 11211.600803222656,
13
+ 12005.076337890625,
14
+ 9869.182932128906,
15
+ 9778.175876464844,
16
+ 9639.344291992187,
17
+ 9386.756044921874
18
  ],
19
  "test_losses": [
20
+ 58844.00859375,
21
+ 26590.416088867187,
22
+ 6761.0640869140625,
23
+ 5468.9392578125,
24
+ 5257.670593261719,
25
+ 4997.675915527344,
26
+ 5334.108666992188,
27
+ 4735.450335693359,
28
+ 4672.923291015625,
29
+ 4978.906188964844,
30
+ 4423.438391113281,
31
+ 4382.65751953125,
32
+ 4135.9177734375,
33
+ 4164.897058105469,
34
+ 4150.397497558593
35
  ],
36
  "config": {
37
  "epochs": 15,
 
44
  "latent_dim": 96,
45
  "encoder_dropout": 0.1,
46
  "decoder_dropout": 0.1,
47
+ "initial_mi_beta": 1.0,
48
+ "final_mi_beta": 1.0,
49
  "mi_beta_shape": "constant",
50
+ "initial_tc_beta": 5.0,
51
+ "final_tc_beta": 5.0,
52
  "tc_beta_shape": "constant",
53
  "initial_dw_beta": 0.2,
54
  "final_dw_beta": 1.0,
55
+ "dw_beta_shape": "custom",
56
  "warmup_epoch_ratio": 0.2,
57
  "free_bits": 0.15,
58
  "focal_loss_alpha": 0.5,
59
  "focal_loss_gamma": 2.0
60
  },
61
  "adaptive_weighting": {
62
+ "initial_mi_beta": 1.0,
63
+ "final_mi_beta": 1.0,
64
  "mi_beta_shape": "constant",
65
+ "initial_tc_beta": 5.0,
66
+ "final_tc_beta": 5.0,
67
  "tc_beta_shape": "constant",
68
  "initial_dw_beta": 0.2,
69
  "final_dw_beta": 1.0,
70
+ "dw_beta_shape": "custom",
71
  "warmup_epoch_ratio": 0.2
72
  },
73
  "regularization": {
 
85
  "best_epoch": null
86
  }
87
  },
88
+ "final_train_loss": 9386.756044921874,
89
+ "final_test_loss": 4150.397497558593,
90
  "total_epochs": 15,
91
+ "best_train_loss": 9386.756044921874,
92
+ "best_test_loss": 4135.9177734375
93
  }