{
    "dataset_reader": {
        "type": "s2s_manual_reader",
        "source_token_indexer": {
            "tokens": {
                "type": "pretrained_transformer",
                "do_lowercase": false,
                "model_name": "./roberta"
            }
        },
        "target_token_indexer": {
            "tokens": {
                "type": "single_id"
            }
        },
        "tokenizer": {
            "word_splitter": {
                "type": "just_spaces"
            }
        }
    },
    "iterator": {
        "type": "basic",
        "batch_size": 32
    },
    "model": {
        "type": "geo_s2s",
        "beam_size": 10,
        "encoder": {
            "dropout": 0.5,
            "emb_dim": 768,
            "hid_dim": 512,
            "input_dim": 21128
        },
        "knowledge_points_ratio": 0,
        "max_decoding_steps": 16,
        "resnet_pretrained": "./",
        "scheduled_sampling_ratio": 0,
        "source_embedder": {
            "token_embedders": {}
        },
        "target_embedding_dim": 512
    },
    "train_data_path": "./GeoQA-Data/GeoQA-Pro/pro_train.pk",
    "validation_data_path": "./GeoQA-Data/GeoQA-Pro/pro_dev.pk",
    "test_data_path": "./GeoQA-Data/GeoQA-Pro/pro_test.pk",
    "trainer": {
        "cuda_device": 0,
        "grad_norm": 10,
        "learning_rate_scheduler": {
            "type": "reduce_on_plateau",
            "factor": 0.6,
            "mode": "max",
            "patience": 5
        },
        "num_epochs": 100,
        "optimizer": {
            "type": "adam",
            "lr": 0.001,
            "parameter_groups": [
                [
                    [
                        "mcan",
                        "merge_att",
                        "channel_transform",
                        "attflat_img",
                        "attflat_lang",
                        "decode_transform"
                    ],
                    {
                        "lr": 1e-05
                    }
                ],
                [
                    [
                        "resnet"
                    ],
                    {
                        "lr": 1e-05
                    }
                ],
                [
                    [
                        "source_embedder",
                        "encoder.embedding"
                    ],
                    {
                        "lr": 2e-05
                    }
                ],
                [
                    [
                        "encoder.concat_trans",
                        "encoder.concat_trans_",
                        "encoder.lstm_embedding",
                        "encoder.trans",
                        "encoder.norm",
                        "encoder.concat_norm"
                    ],
                    {
                        "lr": 0.001
                    }
                ]
            ]
        },
        "validation_metric": "+acc"
    },
    "evaluate_on_test": true
}