{ "loss_mode": "adaptive_std", "model_type": "film_hybrid", "dataset_type": "mixed_condition", "condition_mode": "embedding", "cond_dim": 256, "freeze_cap_encoder": false, "pretrained_cap_encoder": null, "adaptive_use_predicted_cond": true, "predicted_cond_supervision_weight": 1.5, "predicted_cond_supervision_loss": "smooth_l1", "metadata_path": "/pfs/lyj/dataset/t2i_rm/stage2_rollout/stage2_metadata.json", "rl_iter_metadata_path": "/pfs/lyj/dataset/t2i_rm/stage2_rollout/rl_iter_v2/combined_sdxl_flux_metadata.json", "ogd_std_path": "/pfs/lyj/t2i/HPSv3/data/ogd_std_qwen3vl.json", "tiers": [ "sd15", "sdxl", "qwen_image" ], "rl_tier": null, "max_rl_step": 1000, "val_size": 500, "max_images_per_group": 6, "labeled_json_list": [ "/pfs/lyj/dataset/t2i_rm/dataset/2.24/2.24aesthetic_clean_filter_both.json" ], "sup_weight": 5.0, "labeled_loss_type": "uncertainty", "sup_warmup_steps": 0, "rank_weight": 2.0, "ranking_loss_type": "bt", "pairs_per_prompt": 3, "ranking_pair_mode": "cross_model_only", "loss_type": "max_std_unsup", "std_weight": 1.0, "std_floor": -2.0, "adaptive_weight": 2.0, "adaptive_margin": 0.35, "adaptive_priority_mode": "strong_cap_high_iter", "warmup_steps": 500, "adaptive_eps": 1e-06, "std_constraint_enable": true, "std_constraint_mode": "ratio", "std_constraint_weight": 0.5, "std_constraint_warmup_steps": 500, "std_bound_min": 0.05, "std_bound_min_gap": 0.06, "std_bound_lower_base": 0.08, "std_bound_lower_cap_coef": 0.08, "std_bound_lower_iter_coef": 0.6, "std_bound_lower_ogd_coef": 0.5, "std_bound_upper_base": 0.35, "std_bound_upper_cap_coef": 0.15, "std_bound_upper_iter_coef": 0.6, "std_bound_upper_ogd_coef": 1.25, "std_target_enable": false, "std_target_weight": 0.0, "std_ratio_constraint_enable": true, "std_ratio_constraint_weight": 3.0, "std_ratio_constraint_warmup_steps": 300, "std_ratio_lower_base": 0.85, "std_ratio_lower_cap_coef": 0.0, "std_ratio_lower_iter_coef": 0.25, "std_ratio_upper_base": 1.15, "std_ratio_upper_cap_coef": 0.0, "std_ratio_upper_iter_coef": 0.45, "std_ratio_min": 0.3, "std_ratio_min_gap": 0.05, "std_ratio_space": "raw", "std_ratio_target_enable": true, "std_ratio_target_weight": 5.0, "std_ratio_target_base": 1.0, "std_ratio_target_cap_coef": 0.0, "std_ratio_target_iter_coef": 0.4, "std_ratio_target_margin_base": 0.1, "std_ratio_target_margin_cap_coef": 0.0, "std_ratio_target_margin_iter_coef": 0.05, "rm_head_type": "ranknet", "lora_enable": false, "vision_lora": false, "freeze_vision_tower": true, "freeze_llm": true, "tune_merger": true, "train_rm_head": true, "model_name_or_path": "/pfs/lyj/models/Qwen3-VL-8B-Instruct", "load_from_pretrained": "/pfs/lyj/t2i/HPSv3/output_models/HPSv3_8B_Qwen3VL_ogd_train_20260325_195334", "load_from_pretrained_step": 2992, "max_pixels": 200704, "min_pixels": 200704, "with_instruction": true, "use_special_tokens": true, "reward_token": "special", "output_dim": 2, "output_dir": "output_models", "per_device_train_batch_size": 4, "per_device_eval_batch_size": 8, "gradient_accumulation_steps": 1, "num_train_epochs": 3, "learning_rate": 1e-05, "warmup_ratio": 0.05, "lr_scheduler_type": "cosine", "gradient_checkpointing": true, "gradient_checkpointing_kwargs": { "use_reentrant": false }, "vision_lr": null, "merger_lr": 5e-06, "rm_head_lr": null, "special_token_lr": null, "reward_l2_coef": 0.03, "kl_coef": 0.0, "test_json_list": [ [ "HPDv3 Test", [ "/pfs/lyj/dataset/HPDv3/test.abs.json" ] ], [ "Own Aesthetic Test", [ "/pfs/lyj/dataset/t2i_rm/dataset/2.24/2.24aesthetic_test.json" ] ], [ "Own PromptFollow Test", [ "/pfs/lyj/dataset/t2i_rm/dataset/2.24/2.24promptfollow_test.json" ] ] ], "eval_train_json": "/pfs/lyj/dataset/t2i_rm/dataset/2.24/2.24aesthetic_clean_filter_both.json", "eval_train_size": 10000, "eval_strategy": "steps", "logging_steps": 10, "eval_steps": 500, "save_steps": 1000, "vis_steps": 200, "report_to": "none", "bf16": true, "torch_dtype": "bfloat16", "deepspeed": "hpsv3/config/ds_config/zero2.json", "save_only_model": true, "save_full_model": true, "dataloader_num_workers": 2 }