"""Experiment configuration constants.

Holds the data index paths, model and training settings, and the run name
plus output file names that are derived from those settings.
"""

import os

# ---------------------------------------------------------------------------
# Data
# ---------------------------------------------------------------------------
# Both are empty strings here. Presumably they should point at the training
# and evaluation index files -- TODO confirm against the data-loading code.
DATA_TRAIN_INDEX_PATH = ""
DATA_EVAL_INDEX_PATH = ""

# ---------------------------------------------------------------------------
# Model
# ---------------------------------------------------------------------------
# NOTE(review): the meanings below are inferred from the names only; verify
# against the model definition before relying on them.
PATCH_STREAM = True
PATCH_SIZE = 16
PATCH_LENGTH = 2048
CHAR_NUM_LAYERS = 3
PATCH_NUM_LAYERS = 12
HIDDEN_SIZE = 768

# ---------------------------------------------------------------------------
# Training
# ---------------------------------------------------------------------------
BATCH_SIZE = 4
LEARNING_RATE = 1e-4
NUM_EPOCHS = 128
ACCUMULATION_STEPS = 1
# NOTE(review): 0 presumably acts as a special "disabled/full" value -- confirm
# against the training code that reads it.
PATCH_SAMPLING_BATCH_SIZE = 0
LOAD_FROM_CHECKPOINT = False
WANDB_LOGGING = False
# Placeholder value; avoid committing a real key to version control.
WANDB_KEY = '<your_wandb_key>'

# ---------------------------------------------------------------------------
# Derived run name and output files
# ---------------------------------------------------------------------------
EXP_TAG = 'pretrain'

# Parentheses are used for line joining instead of trailing backslashes: a
# backslash only joins the very next physical line, so any blank line or
# trailing whitespace after it turns the expression into a syntax error.
NAME = (
    EXP_TAG
    + "_p_size_" + str(PATCH_SIZE)
    + "_p_length_" + str(PATCH_LENGTH)
    + "_p_layers_" + str(PATCH_NUM_LAYERS)
    + "_c_layers_" + str(CHAR_NUM_LAYERS)
    + "_h_size_" + str(HIDDEN_SIZE)
    + "_lr_" + str(LEARNING_RATE)
    + "_batch_" + str(BATCH_SIZE)
)

# Output file names and the W&B run name all embed the run name above.
WEIGHTS_PATH = "weights_notagen_" + NAME + ".pth"
LOGS_PATH = "logs_notagen_" + NAME + ".txt"
WANDB_NAME = NAME