ReGeo

File size: 5,770 Bytes

085b09f

{
    "ResumeFromPreviousRun": "/home/tobias.rothlin/data/TrainingSnapshots/Regression_2",
    "DatasetConfig": {
        "base_model": "openai/clip-vit-large-patch14-336",
        "augmentaion_pipeline": [
            {
                "name": "RandomRotation",
                "params": {
                    "degrees": 10
                }
            },
            {
                "name": "ColorJitter",
                "params": {
                    "brightness": 0.5,
                    "contrast": 0.2,
                    "saturation": 0.4,
                    "hue": 0.01
                }
            },
            {
                "name": "RandomPerspective",
                "params": {
                    "distortion_scale": 0.2,
                    "p": 0.5
                }
            }
        ],
        "normalize_labels": true,
        "use_cached_dataloader": false,
        "load_for_contrast_learning": false,
        "use_pre_calculated_embeddings": false,
        "load_pooling_output": false,
        "use_gaussian_smoothing": true,
        "workers": 4
    },
    "DataLoaderConfig": {
        "Train": {
            "batch_size": 64,
            "shuffle": true,
            "num_workers": 8,
            "pin_memory": true,
            "prefetch_factor": 20
        },
        "Test": {
            "batch_size": 64,
            "shuffle": true,
            "num_workers": 8,
            "pin_memory": true,
            "prefetch_factor": 20
        }
    },
    "ModelConfig": {
        "use_location_head": true,
        "use_similarity_head": false,
        "freeze_base_model": true,
        "LocationHeadClip": {
            "mean_locatation_head_output": false,
            "layers": [
                {
                    "d_model": 1024,
                    "nhead": 8
                },
                {
                    "d_model": 1024,
                    "nhead": 8
                }
            ],
            "linear_layer_mapping": {
                "in_features": 1024,
                "out_features": 1024
            }
        },
        "RegressionHead": {
            "layer_group": [
                [
                    {
                        "type": "Linear",
                        "in_features": 1024,
                        "out_features": 1024
                    },
                    {
                        "type": "Dropout",
                        "p": 0.3
                    },
                    {
                        "type": "LayerNorm",
                        "normalized_shape": 1024
                    },
                    {
                        "type": "ReLU"
                    }
                ],
                [
                    {
                        "type": "Linear",
                        "in_features": 1024,
                        "out_features": 512
                    },
                    {
                        "type": "Dropout",
                        "p": 0.2
                    },
                    {
                        "type": "LayerNorm",
                        "normalized_shape": 512
                    },
                    {
                        "type": "ReLU"
                    }
                ],
                [
                    {
                        "type": "Linear",
                        "in_features": 512,
                        "out_features": 256
                    },
                    {
                        "type": "Dropout",
                        "p": 0.1
                    },
                    {
                        "type": "LayerNorm",
                        "normalized_shape": 256
                    },
                    {
                        "type": "ReLU"
                    }
                ],
                [
                    {
                        "type": "Linear",
                        "in_features": 256,
                        "out_features": 64
                    },
                    {
                        "type": "Dropout",
                        "p": 0.1
                    },
                    {
                        "type": "LayerNorm",
                        "normalized_shape": 64
                    },
                    {
                        "type": "ReLU"
                    }
                ],
                [
                    {
                        "type": "Linear",
                        "in_features": 64,
                        "out_features": 32
                    },
                    {
                        "type": "Dropout",
                        "p": 0.1
                    },
                    {
                        "type": "LayerNorm",
                        "normalized_shape": 32
                    },
                    {
                        "type": "ReLU"
                    }
                ],
                [
                    {
                        "type": "Linear",
                        "in_features": 32,
                        "out_features": 2
                    },
                    {
                        "type": "Tanh"
                    }
                ]
            ]
        }
    },
    "TrainingConfig": {
        "Epochs": 6,
        "SaveEvery": 10000,
        "RunName": "Regression_Best_Long",
        "SnapshotPath": "/home/tobias.rothlin/data/TrainingSnapshots",
        "LogMLFlow": false,
        "MLFlowExperimentName": "ClipLocationDecoder",
        "GradientAccumulationSteps": 1,
        "ContrastLearningStrategy": null,
        "LearningRate": 5e-05,
        "Amsgrad": true,
        "WeightDecay": 0.0001,
        "Betas": [
            0.9,
            0.98
        ],
        "Gamma": 0.9
    }
}