File size: 2,352 Bytes
c29bad5
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
{
  "monitor_metric": "eval_MRR@NM",
  "trainer_kwargs": {
    "class_name": "IR"
  },
  "trainee_kwargs": {
    "class_name": "CLIP_Encoder",
    "freeze_prefixes": [],
    "use_attention": false,
    "symmetric_CL": false,
    "weighted_loss": false,
    "image_type": false,
    "mlm_type": false,
    "tie_weights": false,
    "loss": {
      "class_name": "NLLLoss",
      "align_uniform": true
    }
  },
  "data_module_kwargs": {
    "class_name": "cross_modal_DataModule",
    "data_processor": {
      "class_name": "evqa_data_processor",
      "dataset_path": "../../data/evqa/",
      "kb_path": "../../data/evqa/passages",
      "entity_kb_path": "../../data/evqa/kb",
      "viquae_dataset_path": "../../data/viquae_dataset/"
    },
    "input_key": "question",
    "passage_key": "passage",
    "relevant_indices_key": "BM25_provenance_indices",
    "irrelevant_indices_key": "BM25_irrelevant_indices",
    "use_image": true,
    "add_positives": false,
    "cross_modal_viquae_valid": false,
    "use_mep": false,
    "use_mlm": false,
    "use_CL": true,
    "augmented": false,
    "random_mask": false,
    "dataloader_kwargs": {
      "num_workers": 6,
      "prefetch_factor": 2
    },
    "tokenizer_kwargs": {
      "class_name": "CLIPTokenizer",
      "pretrained_model_name_or_path": "clip-vit-base-patch32_tokenizer"
    },
    "tokenization_kwargs": {
      "max_length": 77,
      "padding": "longest"
    },
    "image_processor_kwargs": {
      "class_name": "ImageFormatter_evqa",
      "feature_extractor_kwargs": {
        "class_name": "CLIPFeatureExtractor",
        "pretrained_model_name_or_path": "clip-vit-base-patch32_FE"
      }
    }
  },
  "text_encoder_kwargs": {
    "class_name": "CLIP_Text_Encoder",
    "checkpoint_name": "text_encoder",
    "base_encoder_kwargs": {
      "class_name": "CLIPModel",
      "pretrained_model_name_or_path": "/home/data/meerqat/my_transformers_cache/clip-vit-base-patch32"
    },
    "inference_path": "saved_models/CLIP_evqa/text_encoder"
  },
  "image_encoder_kwargs": {
    "class_name": "CLIP_Image_Encoder",
    "checkpoint_name": "image_encoder",
    "base_encoder_kwargs": {
      "class_name": "CLIPModel",
      "pretrained_model_name_or_path": "/home/data/meerqat/my_transformers_cache/clip-vit-base-patch32"
    },
    "inference_path": "saved_models/CLIP_evqa/image_encoder"
  }
}