import torch


class CFG:
    """Static hyperparameter/configuration namespace.

    All settings are plain class attributes, so they can be read without
    instantiating the class (e.g. ``CFG.batch_size``). The grouping comments
    below are inferred from the attribute names only; the code that consumes
    these values is not part of this module.
    """

    # --- Run and data-loading settings ---
    debug: bool = False
    batch_size: int = 32
    num_workers: int = 2

    # --- Optimisation settings ---
    # Separate learning rates are declared for the head and for each encoder.
    head_lr: float = 1e-3
    image_encoder_lr: float = 1e-4
    text_encoder_lr: float = 1e-5
    weight_decay: float = 1e-3
    # NOTE(review): presumably the patience / decay factor of an LR scheduler
    # -- confirm against the training loop.
    patience: int = 1
    factor: float = 0.8
    epochs: int = 1
    # Resolved once, when the class body is executed: CUDA if available,
    # otherwise CPU.
    device: torch.device = torch.device(
        "cuda" if torch.cuda.is_available() else "cpu"
    )

    # --- Encoder identifiers and sizes ---
    model_name: str = 'resnet50'
    # NOTE(review): presumably the feature width produced by `model_name`
    # -- confirm.
    image_embedding: int = 2048
    text_encoder_model: str = "distilbert-base-uncased"
    # NOTE(review): presumably the hidden size of `text_encoder_model`
    # -- confirm.
    text_embedding: int = 768
    text_tokenizer: str = "distilbert-base-uncased"
    # NOTE(review): presumably the maximum tokenised sequence length
    # -- confirm.
    max_length: int = 200

    # --- Encoder behaviour flags ---
    pretrained: bool = True
    trainable: bool = True
    # NOTE(review): presumably a scaling temperature applied in the loss
    # -- confirm.
    temperature: float = 1.0

    # NOTE(review): presumably the input image side length in pixels
    # -- confirm.
    size: int = 224

    # --- Projection settings ---
    num_projection_layers: int = 1
    projection_dim: int = 256
    dropout: float = 0.1