File size: 569 Bytes
975624b
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
import torch

# Module-level configuration constants (device selection, loss and training
# hyperparameters, dataset, logging and compute settings).

# Use CUDA when a GPU is available, otherwise fall back to the CPU.
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")

# Loss hyperparameters
# NOTE(review): 0.25 lies outside the range noted as optimal (1/32 ~ 1/8);
# confirm this value is intentional.
t_p = 0.25  # optimal: 1/8 ~ 1/32
zeta = 3  # optimal: 2 ~ 5
# m = 0.2

# Training hyperparameters
min_epochs = 3
max_epochs = 30
learning_rate = 5e-5
unfreeze_ratio = 1  # presumably the fraction of the model to unfreeze -- TODO confirm
mlm_weight = 0.5  # optimal: 0.5 ~ 0.75

# Dataset
batch_size = 100
split_ratio = 0.2  # presumably the held-out fraction of the data -- TODO confirm

# Logger
log_every_n_steps = 50
# NOTE: the "ckcpt" spelling is kept on purpose; renaming it would break any
# code that reads this constant by name.
ckcpt_every_n_steps = 5000

# Compute related
# Derived from `device` so the two settings can never disagree: a hard-coded
# "gpu" would contradict the CPU fallback above on hosts without CUDA.
accelerator = "gpu" if device.type == "cuda" else "cpu"
devices = 1  # number of devices of the selected accelerator type
# NOTE(review): fp16 mixed precision is primarily a CUDA feature; confirm the
# consumer of this setting handles it when running on the CPU fallback.
precision = "16-mixed"