HPSv3-PlusPlus / config.json
Junjun2333's picture
Upload config.json with huggingface_hub
6c9122e verified
Raw
History Blame Contribute Delete
4.4 kB
{
"loss_mode": "adaptive_std",
"model_type": "film_hybrid",
"dataset_type": "mixed_condition",
"condition_mode": "embedding",
"cond_dim": 256,
"freeze_cap_encoder": false,
"pretrained_cap_encoder": null,
"adaptive_use_predicted_cond": true,
"predicted_cond_supervision_weight": 1.5,
"predicted_cond_supervision_loss": "smooth_l1",
"metadata_path": "/pfs/lyj/dataset/t2i_rm/stage2_rollout/stage2_metadata.json",
"rl_iter_metadata_path": "/pfs/lyj/dataset/t2i_rm/stage2_rollout/rl_iter_v2/combined_sdxl_flux_metadata.json",
"ogd_std_path": "/pfs/lyj/t2i/HPSv3/data/ogd_std_qwen3vl.json",
"tiers": [
"sd15",
"sdxl",
"qwen_image"
],
"rl_tier": null,
"max_rl_step": 1000,
"val_size": 500,
"max_images_per_group": 6,
"labeled_json_list": [
"/pfs/lyj/dataset/t2i_rm/dataset/2.24/2.24aesthetic_clean_filter_both.json"
],
"sup_weight": 5.0,
"labeled_loss_type": "uncertainty",
"sup_warmup_steps": 0,
"rank_weight": 2.0,
"ranking_loss_type": "bt",
"pairs_per_prompt": 3,
"ranking_pair_mode": "cross_model_only",
"loss_type": "max_std_unsup",
"std_weight": 1.0,
"std_floor": -2.0,
"adaptive_weight": 2.0,
"adaptive_margin": 0.35,
"adaptive_priority_mode": "strong_cap_high_iter",
"warmup_steps": 500,
"adaptive_eps": 1e-06,
"std_constraint_enable": true,
"std_constraint_mode": "ratio",
"std_constraint_weight": 0.5,
"std_constraint_warmup_steps": 500,
"std_bound_min": 0.05,
"std_bound_min_gap": 0.06,
"std_bound_lower_base": 0.08,
"std_bound_lower_cap_coef": 0.08,
"std_bound_lower_iter_coef": 0.6,
"std_bound_lower_ogd_coef": 0.5,
"std_bound_upper_base": 0.35,
"std_bound_upper_cap_coef": 0.15,
"std_bound_upper_iter_coef": 0.6,
"std_bound_upper_ogd_coef": 1.25,
"std_target_enable": false,
"std_target_weight": 0.0,
"std_ratio_constraint_enable": true,
"std_ratio_constraint_weight": 3.0,
"std_ratio_constraint_warmup_steps": 300,
"std_ratio_lower_base": 0.85,
"std_ratio_lower_cap_coef": 0.0,
"std_ratio_lower_iter_coef": 0.25,
"std_ratio_upper_base": 1.15,
"std_ratio_upper_cap_coef": 0.0,
"std_ratio_upper_iter_coef": 0.45,
"std_ratio_min": 0.3,
"std_ratio_min_gap": 0.05,
"std_ratio_space": "raw",
"std_ratio_target_enable": true,
"std_ratio_target_weight": 5.0,
"std_ratio_target_base": 1.0,
"std_ratio_target_cap_coef": 0.0,
"std_ratio_target_iter_coef": 0.4,
"std_ratio_target_margin_base": 0.1,
"std_ratio_target_margin_cap_coef": 0.0,
"std_ratio_target_margin_iter_coef": 0.05,
"rm_head_type": "ranknet",
"lora_enable": false,
"vision_lora": false,
"freeze_vision_tower": true,
"freeze_llm": true,
"tune_merger": true,
"train_rm_head": true,
"model_name_or_path": "/pfs/lyj/models/Qwen3-VL-8B-Instruct",
"load_from_pretrained": "/pfs/lyj/t2i/HPSv3/output_models/HPSv3_8B_Qwen3VL_ogd_train_20260325_195334",
"load_from_pretrained_step": 2992,
"max_pixels": 200704,
"min_pixels": 200704,
"with_instruction": true,
"use_special_tokens": true,
"reward_token": "special",
"output_dim": 2,
"output_dir": "output_models",
"per_device_train_batch_size": 4,
"per_device_eval_batch_size": 8,
"gradient_accumulation_steps": 1,
"num_train_epochs": 3,
"learning_rate": 1e-05,
"warmup_ratio": 0.05,
"lr_scheduler_type": "cosine",
"gradient_checkpointing": true,
"gradient_checkpointing_kwargs": {
"use_reentrant": false
},
"vision_lr": null,
"merger_lr": 5e-06,
"rm_head_lr": null,
"special_token_lr": null,
"reward_l2_coef": 0.03,
"kl_coef": 0.0,
"test_json_list": [
[
"HPDv3 Test",
[
"/pfs/lyj/dataset/HPDv3/test.abs.json"
]
],
[
"Own Aesthetic Test",
[
"/pfs/lyj/dataset/t2i_rm/dataset/2.24/2.24aesthetic_test.json"
]
],
[
"Own PromptFollow Test",
[
"/pfs/lyj/dataset/t2i_rm/dataset/2.24/2.24promptfollow_test.json"
]
]
],
"eval_train_json": "/pfs/lyj/dataset/t2i_rm/dataset/2.24/2.24aesthetic_clean_filter_both.json",
"eval_train_size": 10000,
"eval_strategy": "steps",
"logging_steps": 10,
"eval_steps": 500,
"save_steps": 1000,
"vis_steps": 200,
"report_to": "none",
"bf16": true,
"torch_dtype": "bfloat16",
"deepspeed": "hpsv3/config/ds_config/zero2.json",
"save_only_model": true,
"save_full_model": true,
"dataloader_num_workers": 2
}