project_agora / paper.toml
ilessio-aiflowlab's picture
[AGORA] MVP validation artifacts + configs + report
342bee4 verified
# AGORA Planner LoRA Training Config — Paper-aligned
# Based on RoboOS-NeXT (arXiv:2510.26536)
[training]
batch_size = "auto"
learning_rate = 0.0001
epochs = 3
optimizer = "adamw"
weight_decay = 0.01
scheduler = "cosine"
warmup_steps = 50
precision = "bf16"
gradient_accumulation = 1
max_grad_norm = 1.0
seed = 42
[model]
base_model = "Qwen/Qwen2.5-1.5B-Instruct"
lora_r = 16
lora_alpha = 32
lora_dropout = 0.05
target_modules = ["q_proj", "v_proj", "k_proj", "o_proj"]
[data]
train_samples = 5000
eval_samples = 200
train_path = "/mnt/artifacts-datai/logs/project_agora/planning_train.jsonl"
eval_path = "/mnt/artifacts-datai/logs/project_agora/planning_eval.jsonl"
num_workers = 4
pin_memory = true
[checkpoint]
output_dir = "/mnt/artifacts-datai/checkpoints/project_agora"
save_every_n_steps = 200
keep_top_k = 2
metric = "eval_loss"
mode = "min"
[early_stopping]
enabled = true
patience = 10
min_delta = 0.0001
[logging]
log_dir = "/mnt/artifacts-datai/logs/project_agora"
tensorboard_dir = "/mnt/artifacts-datai/tensorboard/project_agora"