qwen_classify_model / fru92_ls_5e_6_e5 /training_info.json
madehua
Upload folder using huggingface_hub
dcffe88 verified
{
"step": 179,
"epoch": 4,
"config": {
"model": {
"pretrained_name": "/llm_reco/dehua/model/Qwen2.5-VL-7B-Instruct",
"num_labels": 92
},
"loss": {
"type": "label_smoothing",
"smoothing": 0.1,
"temperature": 1.0
},
"datasets": {
"dataset_configs": {
"fru92": {
"num_classes": 92,
"description": "fru92 dataset",
"eval_ratio": 1
}
},
"enable_logits_masking": false,
"shuffle_datasets": false
},
"data": {
"train_jsonl": "/llm_reco/dehua/code/qwen_classify/data/dataset_food_label/fru92_train.jsonl",
"val_jsonl": "/llm_reco/dehua/code/qwen_classify/data/dataset_food_label/fru92_test.jsonl"
},
"training": {
"epochs": 5,
"lr": "5e-6",
"weight_decay": 0.01,
"warmup_steps": 0.1,
"output_dir": "/mmu_mllm_hdd_2/madehua/model/qwen_classify/fru92_ls_5e_6",
"logging_steps": 10000,
"save_steps": 50,
"eval_steps": 50,
"save_hf_format": true,
"save_deepspeed_format": false,
"num_workers": 32,
"use_fused_adam": true,
"lr_scheduler": {
"type": "cosine",
"final_lr_ratio": 0.1,
"num_cycles": 0.5
},
"best_model_tracking": {
"enabled": true,
"metric": "overall_accuracy",
"mode": "max",
"save_best_only": true
},
"evaluation": {
"partial_eval_during_training": true,
"full_eval_at_end": true,
"eval_best_model_only": true
},
"num_epochs": 5,
"learning_rate": "5e-6"
},
"deepspeed": "configs/ds_s2.json",
"wandb": {
"enabled": true,
"project": "qwen_classification",
"run_name": "fru92_cosine_5e_6_ls",
"tags": [
"qwen",
"deepspeed",
"classification",
"cosine_hold",
"single_dataset"
],
"notes": "Qwen2.5-VL Food101 classification with cosine+hold scheduler",
"log_dataset_metrics": false,
"log_overall_metrics": true
},
"accelerate": {
"bf16": true
},
"output_dir": "/mmu_mllm_hdd_2/madehua/model/qwen_classify/fru92_ls_5e_6",
"logging_steps": 10000,
"save_steps": 50,
"eval_steps": 50,
"save_hf_format": true,
"save_deepspeed_format": false
},
"dataset_metrics": {},
"is_best_model": true,
"best_metric_value": 0.9421112982405848,
"timestamp": 1753206968.9056048
}