CatkinChen commited on
Commit
3bdd0a9
·
verified ·
1 Parent(s): 43fc0fb

Add training data

Browse files
Files changed (1) hide show
  1. training_data.json +40 -40
training_data.json CHANGED
@@ -1,37 +1,37 @@
1
  {
2
  "train_losses": [
3
- 2100.769680175781,
4
- 1210.195811767578,
5
- 1176.4252709960938,
6
- 1143.586368408203,
7
- 1115.7994873046875,
8
- 1091.0681024169921,
9
- 1068.894476928711,
10
- 1061.0595739746093,
11
- 1048.5140423583985,
12
- 1030.019833984375,
13
- 1021.6400866699219,
14
- 1014.914428100586,
15
- 1012.0101983642578,
16
- 1008.9616821289062,
17
- 1007.0355267333985
18
  ],
19
  "test_losses": [
20
- 1278.497021484375,
21
- 1241.6509338378905,
22
- 1210.9466491699218,
23
- 1211.009942626953,
24
- 1160.8113220214843,
25
- 1111.9551544189453,
26
- 1074.8253112792968,
27
- 1102.0312622070312,
28
- 1043.075909423828,
29
- 1020.9971008300781,
30
- 1005.1833709716797,
31
- 1002.2283630371094,
32
- 997.1159881591797,
33
- 993.3500823974609,
34
- 993.1695037841797
35
  ],
36
  "config": {
37
  "epochs": 15,
@@ -47,14 +47,14 @@
47
  "initial_mi_beta": 1.0,
48
  "final_mi_beta": 1.0,
49
  "mi_beta_shape": "constant",
50
- "initial_tc_beta": 10.0,
51
  "final_tc_beta": 10.0,
52
- "tc_beta_shape": "constant",
53
  "initial_dw_beta": 0.2,
54
  "final_dw_beta": 1.0,
55
  "dw_beta_shape": "custom",
56
  "warmup_epoch_ratio": 0.2,
57
- "free_bits": 0.15,
58
  "focal_loss_alpha": 0.5,
59
  "focal_loss_gamma": 2.0
60
  },
@@ -62,9 +62,9 @@
62
  "initial_mi_beta": 1.0,
63
  "final_mi_beta": 1.0,
64
  "mi_beta_shape": "constant",
65
- "initial_tc_beta": 10.0,
66
  "final_tc_beta": 10.0,
67
- "tc_beta_shape": "constant",
68
  "initial_dw_beta": 0.2,
69
  "final_dw_beta": 1.0,
70
  "dw_beta_shape": "custom",
@@ -73,7 +73,7 @@
73
  "regularization": {
74
  "encoder_dropout": 0.1,
75
  "decoder_dropout": 0.1,
76
- "free_bits": 0.15,
77
  "focal_loss_alpha": 0.5,
78
  "focal_loss_gamma": 2.0
79
  },
@@ -85,9 +85,9 @@
85
  "best_epoch": null
86
  }
87
  },
88
- "final_train_loss": 1007.0355267333985,
89
- "final_test_loss": 993.1695037841797,
90
  "total_epochs": 15,
91
- "best_train_loss": 1007.0355267333985,
92
- "best_test_loss": 993.1695037841797
93
  }
 
1
  {
2
  "train_losses": [
3
+ 2136.5024682617186,
4
+ 1198.3308361816407,
5
+ 1161.5707946777343,
6
+ 1123.9894409179688,
7
+ 1090.3879553222657,
8
+ 1057.5052581787108,
9
+ 1034.7834246826171,
10
+ 1018.692387084961,
11
+ 1008.2613201904297,
12
+ 1000.2829901123047,
13
+ 993.2367407226562,
14
+ 987.9076995849609,
15
+ 984.4344122314453,
16
+ 982.5031854248047,
17
+ 980.7457598876953
18
  ],
19
  "test_losses": [
20
+ 1273.5531799316407,
21
+ 1226.4591247558594,
22
+ 1197.41689453125,
23
+ 1164.7423767089845,
24
+ 1098.9119689941406,
25
+ 1046.8178466796876,
26
+ 1028.4834930419922,
27
+ 1017.2713775634766,
28
+ 1018.4531524658203,
29
+ 1009.554721069336,
30
+ 1002.5865447998046,
31
+ 985.553515625,
32
+ 986.9031860351563,
33
+ 991.0865600585937,
34
+ 990.1863067626953
35
  ],
36
  "config": {
37
  "epochs": 15,
 
47
  "initial_mi_beta": 1.0,
48
  "final_mi_beta": 1.0,
49
  "mi_beta_shape": "constant",
50
+ "initial_tc_beta": 0.0,
51
  "final_tc_beta": 10.0,
52
+ "tc_beta_shape": "custom",
53
  "initial_dw_beta": 0.2,
54
  "final_dw_beta": 1.0,
55
  "dw_beta_shape": "custom",
56
  "warmup_epoch_ratio": 0.2,
57
+ "free_bits": 0.75,
58
  "focal_loss_alpha": 0.5,
59
  "focal_loss_gamma": 2.0
60
  },
 
62
  "initial_mi_beta": 1.0,
63
  "final_mi_beta": 1.0,
64
  "mi_beta_shape": "constant",
65
+ "initial_tc_beta": 0.0,
66
  "final_tc_beta": 10.0,
67
+ "tc_beta_shape": "custom",
68
  "initial_dw_beta": 0.2,
69
  "final_dw_beta": 1.0,
70
  "dw_beta_shape": "custom",
 
73
  "regularization": {
74
  "encoder_dropout": 0.1,
75
  "decoder_dropout": 0.1,
76
+ "free_bits": 0.75,
77
  "focal_loss_alpha": 0.5,
78
  "focal_loss_gamma": 2.0
79
  },
 
85
  "best_epoch": null
86
  }
87
  },
88
+ "final_train_loss": 980.7457598876953,
89
+ "final_test_loss": 990.1863067626953,
90
  "total_epochs": 15,
91
+ "best_train_loss": 980.7457598876953,
92
+ "best_test_loss": 985.553515625
93
  }