squad_tuned_luke_peft_adapter / adapter_config.json
botcon's picture
Training in progress, epoch 1
d51685d
{
  "auto_mapping": null,
  "base_model_name_or_path": "studio-ousia/luke-base",
  "bias": "none",
  "fan_in_fan_out": false,
  "inference_mode": true,
  "init_lora_weights": true,
  "layers_pattern": null,
  "layers_to_transform": null,
  "lora_alpha": 32,
  "lora_dropout": 0.1,
  "modules_to_save": null,
  "peft_type": "LORA",
  "r": 8,
  "revision": null,
  "target_modules": [
    "luke.encoder.layer.0.attention.self.query",
    "luke.encoder.layer.0.attention.self.key",
    "luke.encoder.layer.0.attention.self.value",
    "luke.encoder.layer.1.attention.self.query",
    "luke.encoder.layer.1.attention.self.key",
    "luke.encoder.layer.1.attention.self.value",
    "luke.encoder.layer.2.attention.self.query",
    "luke.encoder.layer.2.attention.self.key",
    "luke.encoder.layer.2.attention.self.value",
    "luke.encoder.layer.3.attention.self.query",
    "luke.encoder.layer.3.attention.self.key",
    "luke.encoder.layer.3.attention.self.value",
    "luke.encoder.layer.4.attention.self.query",
    "luke.encoder.layer.4.attention.self.key",
    "luke.encoder.layer.4.attention.self.value",
    "luke.encoder.layer.5.attention.self.query",
    "luke.encoder.layer.5.attention.self.key",
    "luke.encoder.layer.5.attention.self.value",
    "luke.encoder.layer.6.attention.self.query",
    "luke.encoder.layer.6.attention.self.key",
    "luke.encoder.layer.6.attention.self.value",
    "luke.encoder.layer.7.attention.self.query",
    "luke.encoder.layer.7.attention.self.key",
    "luke.encoder.layer.7.attention.self.value",
    "luke.encoder.layer.8.attention.self.query",
    "luke.encoder.layer.8.attention.self.key",
    "luke.encoder.layer.8.attention.self.value",
    "luke.encoder.layer.9.attention.self.query",
    "luke.encoder.layer.9.attention.self.key",
    "luke.encoder.layer.9.attention.self.value",
    "luke.encoder.layer.10.attention.self.query",
    "luke.encoder.layer.10.attention.self.key",
    "luke.encoder.layer.10.attention.self.value",
    "luke.encoder.layer.11.attention.self.query",
    "luke.encoder.layer.11.attention.self.key",
    "luke.encoder.layer.11.attention.self.value",
    "luke.encoder.layer.11.output.dense",
    "qa_outputs"
  ],
  "task_type": "QUESTION_ANS"
}