---
# Metadata front matter. Key names appear to follow the Hugging Face Hub
# model-card schema -- TODO confirm against the consuming tool.
license: apache-2.0
datasets:
  - OpenMed/Medical-Reasoning-SFT-GPT-OSS-120B
language:
  - ro
metrics:
  - accuracy
base_model:
  - deepseek-ai/DeepSeek-V3.2
# NOTE(review): new_version names the same repo as base_model above, so this
# entry would present its own base as its successor -- confirm this is intended.
new_version: deepseek-ai/DeepSeek-V3.2
# NOTE(review): the only listed dataset has "SFT" in its name, while the
# pipeline tag says reinforcement-learning -- verify the tag is correct.
pipeline_tag: reinforcement-learning
library_name: adapter-transformers
# NOTE(review): these tags do not obviously match the dataset listed above
# (named "Medical-Reasoning") -- confirm they are intended.
tags:
  - chemistry
  - finance
  - music
---