CalliReader / config /configu.py
gtang666's picture
Codes
ed1622f verified
import torch
import os
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
# 路径配置
VIT_MODEL_PATH = '/home/luoyx/InternVL/CalliReader/params/vit_model.pt'
MLP1_PATH = '/home/luoyx/InternVL/CalliReader/params/params/mlp1.pth'
TOK_EMBEDDING_PATH = '/home/luoyx/InternVL/CalliReader/params/token_embedding.pth'
TOKENIZER_PATH = 'InternVL'
NORM_PARAMS_PATH='/home/luoyx/InternVL/CalliReader/params/gauss_norm_mu_sigma.pth'
NORM_TOK_EMBEDDING_PATH='/home/luoyx/InternVL/CalliReader/params/gauss_norm.pth'
NEW_1000_TOK_EMBEDDING_PATH='/home/luoyx/InternVL/CalliReader/params/new1000_token_embedding.pth'
INTERNVL_PATH='InternVL'
IMAGENET_MEAN = (0.485, 0.456, 0.406)
IMAGENET_STD = (0.229, 0.224, 0.225)
SEED=42
# 训练配置
BATCH_SIZE = 256
USE_WARMUP=False
LR = 1e-4 # original 1e-4
WEIGHT_DECAY = 1e-5
WARMUP_STEPS = 2000 # *4 = total training steps
NUM_EPOCHS = 13
NUM_WORKERS = 4
TRAIN_INTER = 10
VAL_INTER = 500
DOWNSAMPLE_RATIO = 0.5
NUM_LAYERS=4
GRAD_ACCU = 1
MODEL_NAME = 'PERCEIVER'
# 数据路径
TRAIN_DATA_PATH = ""
VAL_DATA_PATH = ''
TEST_DATA_PATH = ''
TRAIN_RATIO = 1#0.556 #0.02
VAL_RATIO = 0.2#0.1
# 36000 steps 8 cards 20 epochs, ~ 0.52 data ratio
# LOGS andSAVE_NAME
# 每一次跑新的实验切记一定需要修改!!!!
LOG_NAME = ''
SAVE_NAME = LOG_NAME+'.pth'
# DDP
WORLD_SIZE = torch.cuda.device_count()
# 如果我们要加载训练一半的模型,两个都不能是none!!
# LOAD CHECKPOINT AND RESUME TRAINING
# PERCEIVER_CHECKPOINT ="/home/luoyx/InternVL/CalliReader/params/perceiver_4_n01_1e-4_new.pth"
# RESUME = 26500
PERCEIVER_CHECKPOINT ='/home/luoyx/InternVL/CalliReader/params/callialign.pth'
RESUME = 50000
ORDERFORMER_CHECKPOINT='/home/luoyx/InternVL/CalliReader/params/orderformer.pth'
YOLO_CHECKPOINT="/home/luoyx/InternVL/CalliReader/params/best.pt"