"""Project-wide configuration constants.

Defines the compute device, asset and checkpoint paths, normalization
statistics, training hyperparameters, dataset settings and logging names
as plain module-level values.
"""

import os

import torch

# Compute device: use CUDA when PyTorch reports it as available, otherwise
# fall back to the CPU.
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")

# ---------------------------------------------------------------------------
# Model asset locations.
# NOTE(review): these are absolute paths under one user's home directory;
# they must be edited when running on another machine.
# ---------------------------------------------------------------------------
VIT_MODEL_PATH = "/home/luoyx/InternVL/CalliReader/params/vit_model.pt"

# NOTE(review): this path contains a nested ``params/params`` directory,
# unlike the sibling paths below -- confirm it is intentional.
MLP1_PATH = "/home/luoyx/InternVL/CalliReader/params/params/mlp1.pth"

TOK_EMBEDDING_PATH = "/home/luoyx/InternVL/CalliReader/params/token_embedding.pth"

# Relative name; same value as INTERNVL_PATH below.
TOKENIZER_PATH = "InternVL"

NORM_PARAMS_PATH = "/home/luoyx/InternVL/CalliReader/params/gauss_norm_mu_sigma.pth"

NORM_TOK_EMBEDDING_PATH = "/home/luoyx/InternVL/CalliReader/params/gauss_norm.pth"

NEW_1000_TOK_EMBEDDING_PATH = "/home/luoyx/InternVL/CalliReader/params/new1000_token_embedding.pth"

INTERNVL_PATH = "InternVL"

# ---------------------------------------------------------------------------
# Image normalization statistics and random seed.
# ---------------------------------------------------------------------------
# Three-element mean / std tuples; the values match the commonly used
# ImageNet RGB channel statistics.
IMAGENET_MEAN = (0.485, 0.456, 0.406)
IMAGENET_STD = (0.229, 0.224, 0.225)

# Seed value; presumably fed to the RNGs for reproducibility -- confirm at
# the call site.
SEED = 42

# ---------------------------------------------------------------------------
# Training hyperparameters.
# ---------------------------------------------------------------------------
BATCH_SIZE = 256

# Warm-up switch and length; WARMUP_STEPS is presumably only consulted when
# USE_WARMUP is True -- confirm in the training loop.
USE_WARMUP = False
WARMUP_STEPS = 2000

# Optimizer settings.
LR = 1e-4
WEIGHT_DECAY = 1e-5

NUM_EPOCHS = 13
NUM_WORKERS = 4

# Intervals for training / validation; presumably counted in steps and used
# for logging and evaluation respectively -- confirm against the trainer.
TRAIN_INTER = 10
VAL_INTER = 500

DOWNSAMPLE_RATIO = 0.5
NUM_LAYERS = 4

# Gradient accumulation factor (1 presumably means no accumulation).
GRAD_ACCU = 1

MODEL_NAME = "PERCEIVER"

# ---------------------------------------------------------------------------
# Dataset locations and split ratios.
# ---------------------------------------------------------------------------
# All three paths are empty placeholders and must be filled in before use.
TRAIN_DATA_PATH = ""
VAL_DATA_PATH = ""
TEST_DATA_PATH = ""

# NOTE(review): the two ratios do not sum to 1, so they are presumably
# independent sampling fractions rather than a partition -- confirm.
TRAIN_RATIO = 1
VAL_RATIO = 0.2

# ---------------------------------------------------------------------------
# Logging / checkpoint naming.
# ---------------------------------------------------------------------------
# Empty by default; set a run name here.
LOG_NAME = ""

# Derived from LOG_NAME by appending ".pth". With the empty default above
# this evaluates to just ".pth".
SAVE_NAME = LOG_NAME + ".pth"

# ---------------------------------------------------------------------------
# Distributed setup.
# ---------------------------------------------------------------------------
# Number of CUDA devices PyTorch reports at import time (0 on a CPU-only
# machine).
WORLD_SIZE = torch.cuda.device_count()

# ---------------------------------------------------------------------------
# Checkpoints.
# NOTE(review): absolute, machine-specific paths -- adjust per deployment.
# ---------------------------------------------------------------------------
PERCEIVER_CHECKPOINT = "/home/luoyx/InternVL/CalliReader/params/callialign.pth"

# Presumably the step/iteration count to resume from -- confirm at the
# call site.
RESUME = 50000

ORDERFORMER_CHECKPOINT = "/home/luoyx/InternVL/CalliReader/params/orderformer.pth"

YOLO_CHECKPOINT = "/home/luoyx/InternVL/CalliReader/params/best.pt"