prometheus04
/

qwen3-4b-code-finetuned

	{
	"model": "Qwen/Qwen3-4B",
	"dataset": "microsoft/rStar-Coder (synthetic_sft)",
	"samples": 10000,
	"epochs": 1,
	"lora_rank": 32,
	"lora_alpha": 64,
	"batch_size": 2,
	"gradient_accumulation": 8,
	"learning_rate": 0.0002,
	"max_seq_length": 4096,
	"results": {
	"humaneval_base": 68.9,
	"humaneval_plus": 64.0,
	"mbpp_base": 58.2,
	"mbpp_plus": 50.8
	}
	}