File size: 6,618 Bytes
6df4d35
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
{
  "max_seq_length": 256,
  "question_max_seq_length": 256,
  "RC": false,
  "coco": false,
  "flickr": false,
  "aokvqa": false,
  "grad_check": true,
  "MJL": false,
  "debug_run_time": false,
  "debug_output": false,
  "only_neighbors": false,
  "full_kb": false,
  "image_eval": false,
  "embedding_column": "my_DPR_few_shot",
  "output_ds": null,
  "output_kb": null,
  "embed": false,
  "data_path": null,
  "train_batch_size": 1,
  "eval_batch_size": 1,
  "viquae_dev_batch_size": 1000,
  "transformer_model_name": "bert-base-uncased",
  "gradient_accumulation_steps": 1,
  "warmup_proportion": 0.1,
  "weight_decay": 0.01,
  "lr_decay": false,
  "adam_beta1": 0.9,
  "adam_beta2": 0.999,
  "warmup_steps": 4,
  "adam_epsilon": 1e-08,
  "num_train_epochs": 20,
  "learning_rate": 5e-06,
  "dropout": 0.5,
  "bert_hidden_size": 768,
  "MM": null,
  "use_graph_P": null,
  "use_graph_Q": null,
  "syntactic_P": null,
  "syntactic_Q": null,
  "NS": false,
  "IC_Q": false,
  "IC_P": false,
  "gcn_lr": 2e-05,
  "clip_lr": null,
  "dpr_lr": null,
  "head_lr": 2e-06,
  "func": "cat",
  "graph_pooling": "mean",
  "max_nbr_nodes": 2,
  "num_neib": 1,
  "neib_depth": 1,
  "undirect": false,
  "node_hidden_size": 128,
  "max_num_relations": null,
  "max_num_syntactic_relations": null,
  "map_wikidataRelCode_to_idx": null,
  "graph_layout": "fr",
  "residual": false,
  "num_gcn": null,
  "node_alias_max_len": 32,
  "attention": false,
  "num_paths": 1,
  "kg_embed": false,
  "graph_only": false,
  "freeze": false,
  "sanity_run": false,
  "scale_losses": false,
  "check_answers": false,
  "load_4bit": false,
  "load_8bit": false,
  "device_id": null,
  "drop_last": false,
  "disable_checkpointing": false,
  "samples": null,
  "sample_id": null,
  "datasets_root_dir": "../datasets",
  "ds": "../datasets/textee/wikievents",
  "supp_train_ds": null,
  "guidelines": "new_Llama-31-8B-Instruct_annotation_guidelines",
  "num_trainable_params": null,
  "num_all_param": null,
  "trainable_ratio": null,
  "train_sanity_run": false,
  "enhanced_question": false,
  "use_entity_type": false,
  "filter_edges": false,
  "draw": false,
  "layer_norm": false,
  "filters_3": 768,
  "tensor_neurons": 16,
  "output_dir": "saved_models/wikievents/GoLLIE-7B/code_generator/train/2025-09-26/19-34-03",
  "main_dir": "/fscratch/oadjali/EEE",
  "experiment_dir": "/fscratch/oadjali/EEE/saved_models/wikievents/GoLLIE-7B/code_generator/train/2025-09-26/19-34-03",
  "experiment_name": null,
  "search": null,
  "input_key": null,
  "train_input_key": null,
  "train_search_run": null,
  "val_search_run": null,
  "test_search_run": null,
  "no_resize": false,
  "xlnet": false,
  "tune_loss": false,
  "tune_dev": true,
  "tune_valid_loss": false,
  "sanity_val_steps": 0,
  "cpu": false,
  "keep_in_memory": false,
  "nbr_gpus": 1,
  "N": 0,
  "nbr_workers": 1,
  "num_proc": 1,
  "acc": "gpu",
  "fast_dev_run": null,
  "local_cache": "../my_transformers_cache",
  "IMAGE_PATH": null,
  "transformer_path": null,
  "resume_from": null,
  "answer_generator": "HiTZ/GoLLIE-7B",
  "query_model": null,
  "context_model": null,
  "answer_generator_2": null,
  "checkpoint": null,
  "query_checkpoint": null,
  "checkpoint_2": null,
  "non_strict_load": true,
  "trainer_checkpoint": null,
  "linear_MEP_checkpoint": null,
  "linear_MLM_checkpoint": null,
  "config": "experiments/event_extraction/config_code_generator.json",
  "context_checkpoint": null,
  "grad_accum": 1,
  "cls_token": "[CLS]",
  "sep_token": "[SEP]",
  "pad_token": "[PAD]",
  "cls_token_at_end": false,
  "mask_padding_with_zero": true,
  "pad_on_left": false,
  "sequence_a_segment_id": 0,
  "pad_token_segment_id": 0,
  "cls_token_segment_id": 0,
  "pad_token_label_id": 0,
  "pad_token_id": 0,
  "past_index": -1,
  "world_size": 1,
  "use_lstm": false,
  "use_entity": false,
  "use_question_graph": false,
  "use_question_objects": false,
  "EFeat": null,
  "NFeat": null,
  "ltn": false,
  "use_kelm": false,
  "unshared": false,
  "mlm": false,
  "test": false,
  "validate": false,
  "eval_on_start": false,
  "predict": null,
  "split_dpr": false,
  "rename_model": false,
  "mask_rate": 0.15,
  "pretrained_triviaq": false,
  "error_analysis": false,
  "debug": false,
  "stop_debug": false,
  "entity_linking": false,
  "entity_linking_split": false,
  "build_entity_paths": null,
  "object_detection": null,
  "update_wikidata_ids": null,
  "update_None_ids": null,
  "dependency_parsing": null,
  "image_captionning": null,
  "build_graph": false,
  "from_bert": false,
  "fast": false,
  "get_examples": false,
  "get_statistics": null,
  "word_vocab_size": 0,
  "char_vocab_size": 0,
  "max_word_len": 30,
  "device": "cuda",
  "embedding_matrix": null,
  "new_vocab_embeddings": null,
  "w2v_file": "word_vector_200d.vec",
  "word_emb_dim": 200,
  "char_lstm": false,
  "char_cnn": false,
  "seed": 42,
  "tune_batch_size": false,
  "val_check_interval": null,
  "model_names": null,
  "build_hf_local_cache": true,
  "strategy": null,
  "monitor_metric": "mean_f1",
  "precision": 32,
  "no_lora": false,
  "early_stopping": true,
  "reduce_on_plateau": true,
  "num_generations": 2,
  "num_passages": 5,
  "k_schemes": 10,
  "use_liger_loss": false,
  "kl_beta": 0.0,
  "TI_alpha": 1.0,
  "TC_alpha": 1.0,
  "AI_alpha": 1.0,
  "AC_alpha": 1.0,
  "schema_retrieval_val": false,
  "schema_retrieval_train": false,
  "EE_2steps": false,
  "EE_SL": false,
  "save_ckpt": false,
  "lora_config": {
    "peft_type": "LORA",
    "auto_mapping": null,
    "base_model_name_or_path": null,
    "revision": null,
    "task_type": "CAUSAL_LM",
    "inference_mode": false,
    "r": 8,
    "target_modules": [
      "q_proj",
      "v_proj"
    ],
    "lora_alpha": 16,
    "lora_dropout": 0.05,
    "fan_in_fan_out": false,
    "bias": "none",
    "use_rslora": false,
    "modules_to_save": null,
    "init_lora_weights": true,
    "layers_to_transform": null,
    "layers_pattern": null,
    "rank_pattern": {},
    "alpha_pattern": {},
    "megatron_config": null,
    "megatron_core": "megatron.core",
    "loftq_config": {},
    "use_dora": false
  },
  "quantization_config": null,
  "hf": false,
  "slurm_scipt_path": null,
  "enabled_args": "  --train_batch_size 1\n  --eval_batch_size 1\n  --num_train_epochs 20\n  --nbr_gpus 1\n  --learning_rate 5e-6\n  --grad_check\n  --config experiments/event_extraction/config_code_generator.json\n  --non_strict_load\n  --ds ../datasets/textee/wikievents\n  --answer_generator HiTZ/GoLLIE-7B\n  --guidelines new_Llama-31-8B-Instruct_annotation_guidelines\n  --k_schemes 10\n  --num_passages 5"
}