nvidia
/

llama-nv-embed-reasoning-3b

@@ -1,7 +1,7 @@
 # SPDX-FileCopyrightText: Copyright (c) 2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
 # SPDX-License-Identifier: Apache-2.0
 """
-MTEB encoder and ModelMeta for nvidia/llama-embed-nemotron-reasoning-3b.
 """
 from mteb.models.model_meta import ModelMeta
@@ -30,8 +30,8 @@ BRIGHT_TASK_INSTRUCTIONS = {
 BRIGHT_PASSAGE_PREFIX = "passage: "
-class LlamaEmbedNemotronReasoning(LlamaEmbedNemotron):
-    """LlamaEmbedNemotron for reasoning with BRIGHT benchmark prompts."""
     def __init__(self, model_name: str, revision: str, device: str | None = None, **kwargs) -> None:
         super().__init__(model_name, revision=revision, device=device)
@@ -63,10 +63,10 @@ class LlamaEmbedNemotronReasoning(LlamaEmbedNemotron):
             prefix = self.format_instruction(instruction, prompt_type)
         return self._extract_embeddings(inputs, instruction=prefix, **kwargs)
-LLAMA_EMBED_NEMOTRON_REASONING_3B_META = ModelMeta(
-    loader=LlamaEmbedNemotronReasoning,
     loader_kwargs=dict(max_seq_length=8192),
-    name="nvidia/llama-embed-nemotron-reasoning-3b",
     model_type=["dense"],
     languages=llama_embed_nemotron_evaluated_languages,
     open_weights=True,
@@ -75,9 +75,9 @@ LLAMA_EMBED_NEMOTRON_REASONING_3B_META = ModelMeta(
     n_parameters=3_212_749_824,
     memory_usage_mb=6000,
     embed_dim=3072,
-    license="https://huggingface.co/nvidia/llama-embed-nemotron-reasoning-3b/blob/main/LICENSE",
     max_tokens=8192,
-    reference="https://huggingface.co/nvidia/llama-embed-nemotron-reasoning-3b",
     similarity_fn_name="cosine",
     framework=["PyTorch", "Transformers"],
     use_instructions=True,

 # SPDX-FileCopyrightText: Copyright (c) 2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
 # SPDX-License-Identifier: Apache-2.0
 """
+MTEB encoder and ModelMeta for nvidia/llama-nv-embed-reasoning-3b.
 """
 from mteb.models.model_meta import ModelMeta
 BRIGHT_PASSAGE_PREFIX = "passage: "
+class LlamaNvEmbedReasoning(LlamaEmbedNemotron):
+    """LlamaNvEmbedReasoning for reasoning with BRIGHT benchmark prompts."""
     def __init__(self, model_name: str, revision: str, device: str | None = None, **kwargs) -> None:
         super().__init__(model_name, revision=revision, device=device)
             prefix = self.format_instruction(instruction, prompt_type)
         return self._extract_embeddings(inputs, instruction=prefix, **kwargs)
+LLAMA_NV_EMBED_REASONING_3B_META = ModelMeta(
+    loader=LlamaNvEmbedReasoning,
     loader_kwargs=dict(max_seq_length=8192),
+    name="nvidia/llama-nv-embed-reasoning-3b",
     model_type=["dense"],
     languages=llama_embed_nemotron_evaluated_languages,
     open_weights=True,
     n_parameters=3_212_749_824,
     memory_usage_mb=6000,
     embed_dim=3072,
+    license="https://huggingface.co/nvidia/llama-nv-embed-reasoning-3b/blob/main/LICENSE",
     max_tokens=8192,
+    reference="https://huggingface.co/nvidia/llama-nv-embed-reasoning-3b",
     similarity_fn_name="cosine",
     framework=["PyTorch", "Transformers"],
     use_instructions=True,