qwen3-4b-sft-test / metadata.json
CocoRoF's picture
Upload metadata.json with huggingface_hub
7b95c93 verified
raw
history blame contribute delete
428 Bytes
{
"base_model": "Qwen/Qwen3-1.7B",
"training_method": "unknown",
"commit_msg": "Initial commit for Qwen3 4b SFT training",
"user_name": "CocoRoF",
"use_deepspeed": true,
"use_peft": false,
"use_sfttrainer": true,
"use_dpotrainer": false,
"use_ppotrainer": false,
"use_grpotrainer": false,
"use_kl_sfttrainer": false,
"use_stableadamw": false,
"use_attn_implementation": true
}