Gen-oze's picture
Upload LoRA adapter (README written by author)
12094e7 verified
{
"run_id": "ds=u-10bei_structured_data_with_cot_dataset_512_v2_lr=1e-4_r=64_a=128_drop=0.03_wd=0.05_len=512_seed=3407_t=q_proj_k_proj_v_proj_o_proj_gate_proj_up_proj_down_proj_20260206_145038",
"run_id_source": "AUTO",
"created_at": "20260206_145038",
"base_model": "Qwen/Qwen3-4B-Instruct-2507",
"hf_repo_base": "your_id/your-lora-repo",
"hf_repo_id": "your_id/your-lora-repo-4a3a03d8",
"dataset_id": "u-10bei/structured_data_with_cot_dataset_512_v2",
"max_seq_len": "512",
"seed": "3407",
"lr": "1e-4",
"lora": {
"r": "64",
"alpha": "128",
"dropout": "0.03",
"target_modules": "q_proj,k_proj,v_proj,o_proj,gate_proj,up_proj,down_proj"
},
"train": {
"epochs": "2",
"per_device_train_bs": "2",
"per_device_eval_bs": "2",
"grad_accum": "8",
"warmup_ratio": "0.03",
"weight_decay": "0.05",
"max_steps": "-1",
"logging_steps": "10",
"eval_steps": "25",
"save_steps": "50",
"save_total_limit": "2"
},
"local_lora_dir": "/content/lora_runs/ds=u-10bei_structured_data_with_cot_dataset_512_v2_lr=1e-4_r=64_a=128_drop=0.03_wd=0.05_len=512_seed=3407_t=q_proj_k_proj_v_proj_o_proj_gate_proj_up_proj_down_proj_20260206_145038",
"drive_output_root": "/content/drive/MyDrive/LLM2025/OUTPUT",
"drive_adapter_dir": "/content/drive/MyDrive/LLM2025/OUTPUT/adapters/ds=u-10bei_structured_data_with_cot_dataset_512_v2_lr=1e-4_r=64_a=128_drop=0.03_wd=0.05_len=512_seed=3407_t=q_proj_k_proj_v_proj_o_proj_gate_proj_up_proj_down_proj_20260206_145038",
"drive_run_dir": "/content/drive/MyDrive/LLM2025/OUTPUT/runs/ds=u-10bei_structured_data_with_cot_dataset_512_v2_lr=1e-4_r=64_a=128_drop=0.03_wd=0.05_len=512_seed=3407_t=q_proj_k_proj_v_proj_o_proj_gate_proj_up_proj_down_proj_20260206_145038",
"drive_log_dir": "/content/drive/MyDrive/LLM2025/OUTPUT/logs/ds=u-10bei_structured_data_with_cot_dataset_512_v2_lr=1e-4_r=64_a=128_drop=0.03_wd=0.05_len=512_seed=3407_t=q_proj_k_proj_v_proj_o_proj_gate_proj_up_proj_down_proj_20260206_145038"
}