CatkinChen commited on
Commit
80c3c17
·
verified ·
1 Parent(s): 0008c97

Add training data

Browse files
Files changed (1) hide show
  1. training_data.json +38 -37
training_data.json CHANGED
@@ -1,44 +1,43 @@
1
  {
2
  "train_losses": [
3
- 7049.438330078125,
4
- 5887.628120117188,
5
- 5277.642026367187,
6
- 4594.689287109375,
7
- 3546.2805078125,
8
- 1424.719789428711,
9
- 1127.6089764404296,
10
- 840.4840567016602,
11
- 688.1939489746094,
12
- 602.3454461669921,
13
- 562.8847897338867,
14
- 533.8131185913086,
15
- 522.2901638793945,
16
- 515.8702670288086,
17
- 507.2388348388672
18
  ],
19
  "test_losses": [
20
- 5279.287158203125,
21
- 4462.337194824218,
22
- 4125.337866210937,
23
- 3586.261376953125,
24
- 2795.8281372070314,
25
- 1348.6051147460937,
26
- 1711.0676147460938,
27
- 2111.490283203125,
28
- 2405.6600982666014,
29
- 2786.551837158203,
30
- 2962.615338134766,
31
- 3259.63317565918,
32
- 3414.8231872558595,
33
- 3715.608850097656,
34
- 3996.8146850585936
35
  ],
36
  "config": {
37
  "epochs": 15,
38
  "batch_size": 32,
39
  "learning_rate": 0.0005,
40
  "sequence_size": 32,
41
- "include_inventory": false,
42
  "adaptive_weighting": {
43
  "initial_weight_emb": 1.5,
44
  "final_weight_emb": 0.0,
@@ -47,14 +46,16 @@
47
  "final_weight_raw": 1.0,
48
  "weight_raw_shape": "linear",
49
  "initial_kl_beta": 0.0001,
50
- "final_kl_beta": 0.5,
51
  "kl_beta_shape": "cosine",
52
  "warmup_epoch_ratio": 0.4
53
- }
 
 
54
  },
55
- "final_train_loss": 507.2388348388672,
56
- "final_test_loss": 3996.8146850585936,
57
  "total_epochs": 15,
58
- "best_train_loss": 507.2388348388672,
59
- "best_test_loss": 1348.6051147460937
60
  }
 
1
  {
2
  "train_losses": [
3
+ 6835.843090820313,
4
+ 5569.674467773438,
5
+ 4928.053500976563,
6
+ 4278.040825195312,
7
+ 3407.1733154296876,
8
+ 1707.017879638672,
9
+ 1678.5513446044922,
10
+ 1690.340132446289,
11
+ 1636.4783825683594,
12
+ 1561.4304962158203,
13
+ 1430.3591986083984,
14
+ 1286.2933282470703,
15
+ 1134.876439819336,
16
+ 999.4317224121094,
17
+ 912.4670324707031
18
  ],
19
  "test_losses": [
20
+ 4925.1087646484375,
21
+ 4224.336853027344,
22
+ 3812.184326171875,
23
+ 3274.811474609375,
24
+ 2596.8716430664062,
25
+ 1195.6449188232423,
26
+ 1303.003598022461,
27
+ 1479.3368133544923,
28
+ 1686.8121704101563,
29
+ 1969.0001953125,
30
+ 2295.1075073242187,
31
+ 2735.835479736328,
32
+ 2956.7591918945313,
33
+ 3227.5116333007813,
34
+ 3502.591668701172
35
  ],
36
  "config": {
37
  "epochs": 15,
38
  "batch_size": 32,
39
  "learning_rate": 0.0005,
40
  "sequence_size": 32,
 
41
  "adaptive_weighting": {
42
  "initial_weight_emb": 1.5,
43
  "final_weight_emb": 0.0,
 
46
  "final_weight_raw": 1.0,
47
  "weight_raw_shape": "linear",
48
  "initial_kl_beta": 0.0001,
49
+ "final_kl_beta": 0.4,
50
  "kl_beta_shape": "cosine",
51
  "warmup_epoch_ratio": 0.4
52
+ },
53
+ "total_correlation_beta_multiplier": 15.0,
54
+ "free_bits": 0.15
55
  },
56
+ "final_train_loss": 912.4670324707031,
57
+ "final_test_loss": 3502.591668701172,
58
  "total_epochs": 15,
59
+ "best_train_loss": 912.4670324707031,
60
+ "best_test_loss": 1195.6449188232423
61
  }