"""Project settings: data index paths, model sizes, training options.

Everything here is a plain module-level constant.  The last section derives
a run name from the hyper-parameters and reuses it for the weights file,
the log file and the Weights & Biases run name.
"""

import os

# --- Data -------------------------------------------------------------------
# Both paths are empty by default and need to be filled in before use.
# Presumably each points at an index file listing the samples of the
# corresponding split -- confirm against the data-loading code.
DATA_TRAIN_INDEX_PATH = ""
DATA_EVAL_INDEX_PATH = ""

# --- Model ------------------------------------------------------------------
# NOTE(review): the names suggest a patch-level stack combined with a
# character-level stack; the exact meaning of each value is defined by the
# model code, which is not part of this file.
PATCH_STREAM = True
PATCH_SIZE = 16
PATCH_LENGTH = 1024
CHAR_NUM_LAYERS = 6
PATCH_NUM_LAYERS = 20
HIDDEN_SIZE = 1280

# --- Training ---------------------------------------------------------------
BATCH_SIZE = 1
LEARNING_RATE = 1e-5
NUM_EPOCHS = 64
ACCUMULATION_STEPS = 1
# NOTE(review): 0 presumably means "no patch sampling" -- verify in the
# training script before relying on it.
PATCH_SAMPLING_BATCH_SIZE = 0
LOAD_FROM_CHECKPOINT = False
WANDB_LOGGING = False
# Placeholder value; replace it locally and avoid committing a real key.
WANDB_KEY = '<your_wandb_key>'

# --- Run naming and output files --------------------------------------------
PRETRAINED_PATH = ""
EXP_TAG = ''

# The run name encodes the main hyper-parameters so that artefacts from
# different runs do not overwrite each other.  Adjacent f-string literals
# inside the parentheses are joined at compile time, which avoids fragile
# backslash line continuations.
NAME = (
    f"{EXP_TAG}"
    f"_p_size_{PATCH_SIZE}"
    f"_p_length_{PATCH_LENGTH}"
    f"_p_layers_{PATCH_NUM_LAYERS}"
    f"_c_layers_{CHAR_NUM_LAYERS}"
    f"_h_size_{HIDDEN_SIZE}"
    f"_lr_{LEARNING_RATE}"
    f"_batch_{BATCH_SIZE}"
)

# NAME always begins with "_" (even when EXP_TAG is empty), so the file names
# below contain a double underscore after "notagen"; kept as-is so existing
# checkpoints and logs are still found under the same names.
WEIGHTS_PATH = "weights_notagen_" + NAME + ".pth"
LOGS_PATH = "logs_notagen_" + NAME + ".txt"
WANDB_NAME = NAME