# Run configuration: "any-order-flow" trainer on the "safe-drugs" dataset.
#
# NOTE(review): the nesting below was reconstructed from the key names after
# the file lost its indentation. In particular, `loss_fn` and the keys that
# follow it are assumed to belong to `training`, and `wandb` is assumed to be
# a top-level section. Confirm against the code that reads this config.

trainer: "any-order-flow"
dataset: "safe-drugs"

# Hugging Face dataset identifier and the column holding the SMILES strings.
hf_dataset:
  name: "datamol-io/safe-gpt"
  smiles_column: "smiles"

# Network hyperparameters.
model:
  hidden_size: 768
  n_heads: 12
  cond_dim: 128
  dropout: 0.05
  n_blocks: 12
  torch_dtype: "float32"

# Interpolant settings; both schedules are linear.
interpolant:
  type: "any-order"
  # Left null here; presumably filled in at runtime (e.g. from the
  # tokenizer) -- TODO confirm.
  tokens: null
  pad_token: null
  mask_token: null
  max_length: 256
  insert_schedule:
    type: "linear"
  unmask_schedule:
    type: "linear"

# Optimization, hardware and checkpointing settings.
training:
  only_embed_insert: true
  # NOTE(review): batch_size (2048) is larger than
  # per_gpu_batch_size * devices * nodes (64 * 2 * 1); presumably the gap is
  # covered by gradient accumulation -- confirm in the trainer.
  batch_size: 2048
  per_gpu_batch_size: 64
  cpus: 4
  # Written with a decimal point on purpose: YAML 1.1 loaders such as PyYAML
  # resolve a bare `3e-4` as a string, not a float.
  learning_rate: 3.0e-4
  nodes: 1
  devices: 2
  max_steps: 500000
  weight_decay: 0.03
  checkpoint_dir: "checkpoints/pretrain_mol"
  save_top_k: 3
  save_every_n_steps: 1000

  # Loss variant used for each of the two prediction heads.
  loss_fn:
    unmask: "elbo"
    insert: "expectation"
  reset_lr: false
  warmup_steps: 2000
  ema_decay: 0.9999
  filter_max_length: false

# Weights & Biases logging.
wandb:
  entity: null
  project: "a2d2-mol"
  name: "a2d2-mol"
  path: "./wandb"