File size: 569 Bytes
import torch
# Central configuration values: device selection, loss/training hyperparameters,
# dataset settings, logging cadence and compute options.

# Select the CUDA device when a GPU is available; otherwise fall back to the CPU.
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")

# Loss
# NOTE(review): 0.25 lies outside the 1/8 ~ 1/32 range recorded as optimal
# below -- confirm this value is intended.
t_p = 0.25  # optimal: 1/8 ~ 1/32
zeta = 3  # optimal: 2 ~ 5
# m = 0.2

# Training hyperparameters
min_epochs = 3
max_epochs = 30
learning_rate = 5e-5
unfreeze_ratio = 1
mlm_weight = 0.5  # optimal: 0.5 ~ 0.75

# Dataset
batch_size = 100
split_ratio = 0.2

# Logger
log_every_n_steps = 50
# The "ckcpt" spelling is kept as-is because other modules may reference this name.
ckcpt_every_n_steps = 5000

# Compute related
# Derived from `device` so both settings always agree: previously this was
# hard-coded to "gpu" even when `device` had fallen back to the CPU.
# NOTE(review): these names look like PyTorch Lightning Trainer arguments --
# confirm against the training script that consumes them.
accelerator = "gpu" if device.type == "cuda" else "cpu"
devices = 1  # number of devices to use (GPUs when accelerator is "gpu")
# NOTE(review): fp16 mixed precision targets GPUs; confirm how the trainer
# treats this value on the CPU fallback.
precision = "16-mixed"
|