File size: 2,113 Bytes
c617722
 
 
 
 
d108cd5
25c6e51
c617722
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
9ef7c0a
ddefc59
7cd7c4d
c617722
7cd7c4d
 
ddefc59
 
 
 
7cb5a03
 
ddefc59
dc7232b
898c960
dc7232b
ddefc59
 
7cb5a03
ddefc59
dc7232b
ddefc59
 
 
c617722
7cb5a03
 
7cd7c4d
dc7232b
898c960
dc7232b
ddefc59
f12eee8
7cb5a03
41a0d34
25c6e51
ddefc59
 
 
dc7232b
ddefc59
 
 
7cd7c4d
cc774a5
7cd7c4d
 
cc774a5
 
7cd7c4d
c617722
dc7232b
 
 
 
9ef7c0a
c617722
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
{
  "model_type": "MultiModalHackVAE",
  "framework": "PyTorch",
  "task": "representation-learning",
  "dataset": "NetHack Learning Dataset",
  "latent_dim": 96,
  "lowrank_dim": 0,
  "architecture": "Multi-modal Variational Autoencoder for NetHack game states",
  "author": "Xu Chen",
  "description": "Advanced NetHack VAE",
  "tags": [
    "nethack",
    "reinforcement-learning",
    "multimodal",
    "world-modeling",
    "vae"
  ],
  "use_cases": [
    "Game state representation learning",
    "RL agent state abstraction",
    "NetHack gameplay analysis"
  ],
  "training_config": {
    "epochs": 15,
    "batch_size": 32,
    "max_learning_rate": 0.001,
    "sequence_size": 32,
    "shuffle_batches": true,
    "shuffle_within_batch": true,
    "vae_config": {
      "latent_dim": 96,
      "encoder_dropout": 0.1,
      "decoder_dropout": 0.1,
      "initial_mi_beta": 1.0,
      "final_mi_beta": 1.0,
      "mi_beta_shape": "constant",
      "initial_tc_beta": 0.0,
      "final_tc_beta": 10.0,
      "tc_beta_shape": "custom",
      "initial_dw_beta": 0.2,
      "final_dw_beta": 1.0,
      "dw_beta_shape": "custom",
      "warmup_epoch_ratio": 0.2,
      "free_bits": 0.75,
      "focal_loss_alpha": 0.5,
      "focal_loss_gamma": 2.0
    },
    "adaptive_weighting": {
      "initial_mi_beta": 1.0,
      "final_mi_beta": 1.0,
      "mi_beta_shape": "constant",
      "initial_tc_beta": 0.0,
      "final_tc_beta": 10.0,
      "tc_beta_shape": "custom",
      "initial_dw_beta": 0.2,
      "final_dw_beta": 1.0,
      "dw_beta_shape": "custom",
      "warmup_epoch_ratio": 0.2
    },
    "regularization": {
      "encoder_dropout": 0.1,
      "decoder_dropout": 0.1,
      "free_bits": 0.75,
      "focal_loss_alpha": 0.5,
      "focal_loss_gamma": 2.0
    },
    "early_stopping": {
      "enabled": false,
      "patience": 3,
      "min_delta": 0.01,
      "triggered": false,
      "best_epoch": null
    }
  },
  "final_train_loss": 980.7457598876953,
  "final_test_loss": 990.1863067626953,
  "best_train_loss": 980.7457598876953,
  "best_test_loss": 985.553515625,
  "total_epochs": 15
}