LQAJudge-codereview / exp_args.json
Narmeen07's picture
Upload exp_args.json with huggingface_hub
a61dd32 verified
{
"target_model_name": "meta-llama/Llama-3.1-8B-Instruct",
"load_model_checkpoint": "",
"train_system": "",
"train_stimulus_completion": "",
"train_stimulus": "data/martian_data/pipeline_output/training_files/train_stimulus.json",
"train_control": "",
"train_qa": "data/martian_data/pipeline_output/training_files/train_qa.json",
"train_with_verb_mask": "user",
"add_thought_tokens": false,
"nudge_persona": false,
"modify_chat_template": true,
"filter": "",
"train_percent": 1.0,
"eval_ppl": true,
"eval_system": "",
"eval_stimulus_completion": "",
"eval_stimulus": "data/martian_data/pipeline_output/training_files/eval_stimulus.json",
"eval_control": "",
"eval_qa": "data/martian_data/pipeline_output/training_files/eval_qa.json",
"eval_every_n_steps": 200,
"output_dir": "out/codereview",
"save_model": true,
"save_every_n_steps": 200,
"use_wandb": true,
"run_name": "",
"shift_position_ids": true,
"min_layer_to_read": 15,
"max_layer_to_read": 16,
"layer_to_write": 0,
"module_setup": "read-vary_write-fixed_n-fixed",
"num_layers_to_read": 1,
"num_layers_to_sample": 1,
"batch_size_training": 1,
"gradient_accumulation_steps": 8,
"gradient_clipping": false,
"gradient_clipping_threshold": 1.0,
"num_epochs": 5,
"num_workers_dataloader": 1,
"lr": 3e-05,
"ema_decay": 1,
"warmup_steps": 50,
"weight_decay": 0.01,
"gamma": 0.85,
"seed": 42,
"peft_method": "lora",
"use_peft": true,
"use_fsdp": false,
"checkpoint_dir": "out/codereview/006/checkpoints"
}