license: apache-2.0
datasets:
- OpenMed/Medical-Reasoning-SFT-GPT-OSS-120B
language:
- ro
metrics:
- accuracy
base_model:
- deepseek-ai/DeepSeek-V3.2
new_version: deepseek-ai/DeepSeek-V3.2
pipeline_tag: reinforcement-learning
library_name: adapter-transformers
tags:
- chemistry
- finance
- music