DomainEmbedder / metadata.json
EphAsad's picture
Upload 19 files
485908e verified
{
"version": "DomainEmbedder-v2.6",
"step": 4000,
"base_model": "FireDevourerEmbedder-RL-v3.6",
"avg_reward": 1.5269566774368286,
"accuracy": 92.5,
"all_scores": {
"avg_reward": 1.5269566774368286,
"accuracy": 92.5
},
"timestamp": "2026-02-10T02:01:18.178319",
"method": "TRUE LoRA (PEFT) + SUPERVISED RL + CURRICULUM",
"config": {
"lora_rank": 16,
"lora_alpha": 32,
"lora_target_modules": [
"query",
"value"
],
"rl_algorithm": "Supervised A2C Policy Gradient",
"rl_total_steps": 5000,
"rl_gamma": 0.99,
"rl_entropy_coef": 0.1,
"correctness_bonus": 1.0,
"correctness_penalty": 0.5,
"curriculum_learning": true,
"domains": [
"medical",
"legal",
"code",
"finance",
"scientific"
]
},
"files": {
"base_model": "FireDevourerEmbedder-RL-v3.6.pt",
"rl_policy": "rl_policy.pt",
"lora_adapters": {
"medical": "medical_lora/",
"legal": "legal_lora/",
"code": "code_lora/",
"finance": "finance_lora/",
"scientific": "scientific_lora/"
}
}
}