ayushKishor committed on
Commit
a70f2fd
·
1 Parent(s): d679523

Use Nemotron 3 Nano Omni reasoning model

Browse files
Files changed (1) hide show
  1. mp1/pluto/modes.py +2 -2
mp1/pluto/modes.py CHANGED
@@ -82,7 +82,7 @@ def _build_registry() -> dict[str, ModeConfig]:
82
  ),
83
  "MODE_REASONING": ModeConfig(
84
  mode_name="MODE_REASONING",
85
- model_id="nvidia/llama-3.3-nemotron-super-49b-v1",
86
  temperature=0.3,
87
  max_tokens=4096,
88
  compute_profile="high-reasoning",
@@ -107,7 +107,7 @@ def _build_registry() -> dict[str, ModeConfig]:
107
  # Keep MODE_GEMINI name for backward compat — maps to Super
108
  "MODE_GEMINI": ModeConfig(
109
  mode_name="MODE_GEMINI",
110
- model_id="nvidia/llama-3.3-nemotron-super-49b-v1",
111
  temperature=0.0,
112
  max_tokens=4096,
113
  compute_profile="high-throughput",
 
82
  ),
83
  "MODE_REASONING": ModeConfig(
84
  mode_name="MODE_REASONING",
85
+ model_id="nvidia/nemotron-3-nano-omni-30b-a3b-reasoning",
86
  temperature=0.3,
87
  max_tokens=4096,
88
  compute_profile="high-reasoning",
 
107
  # Keep MODE_GEMINI name for backward compat — maps to Super
108
  "MODE_GEMINI": ModeConfig(
109
  mode_name="MODE_GEMINI",
110
+ model_id="nvidia/nemotron-3-nano-omni-30b-a3b-reasoning",
111
  temperature=0.0,
112
  max_tokens=4096,
113
  compute_profile="high-throughput",