Feature Extraction
Transformers
Safetensors
sentence-transformers
English
nvembed
mteb
custom_code
Eval Results (legacy)
Instructions to use nvidia/NV-Embed-v2 with libraries, inference providers, notebooks, and local apps. Follow these links to get started.
- Libraries
- Transformers
How to use nvidia/NV-Embed-v2 with Transformers:
# Use a pipeline as a high-level helper from transformers import pipeline pipe = pipeline("feature-extraction", model="nvidia/NV-Embed-v2", trust_remote_code=True)# Load model directly from transformers import AutoModel model = AutoModel.from_pretrained("nvidia/NV-Embed-v2", trust_remote_code=True, dtype="auto") - sentence-transformers
How to use nvidia/NV-Embed-v2 with sentence-transformers:
from sentence_transformers import SentenceTransformer model = SentenceTransformer("nvidia/NV-Embed-v2", trust_remote_code=True) sentences = [ "The weather is lovely today.", "It's so sunny outside!", "He drove to the stadium." ] embeddings = model.encode(sentences) similarities = model.similarity(embeddings, embeddings) print(similarities.shape) # [3, 3] - Notebooks
- Google Colab
- Kaggle
Update modeling_nvembed.py
#44
by nihalnayak - opened
- modeling_nvembed.py +0 -2
modeling_nvembed.py
CHANGED
|
@@ -8,7 +8,6 @@ from contextlib import nullcontext
|
|
| 8 |
from transformers import AutoModel, PreTrainedTokenizerFast, BatchEncoding, DataCollatorWithPadding
|
| 9 |
from transformers.modeling_utils import PreTrainedModel
|
| 10 |
from transformers.models.auto import AutoTokenizer
|
| 11 |
-
from transformers.models.mistral.modeling_mistral import MISTRAL_INPUTS_DOCSTRING
|
| 12 |
from transformers.modeling_outputs import BaseModelOutputWithPast
|
| 13 |
from transformers.modeling_attn_mask_utils import _prepare_4d_attention_mask, _prepare_4d_attention_mask_for_sdpa
|
| 14 |
from transformers import MistralModel, MistralConfig
|
|
@@ -39,7 +38,6 @@ class BidirectionalMistralModel(MistralModel):
|
|
| 39 |
layer.self_attn.is_causal = False
|
| 40 |
self._attn_implementation = "eager"
|
| 41 |
|
| 42 |
-
@add_start_docstrings_to_model_forward(MISTRAL_INPUTS_DOCSTRING)
|
| 43 |
def forward(
|
| 44 |
self,
|
| 45 |
input_ids: torch.LongTensor = None,
|
|
|
|
| 8 |
from transformers import AutoModel, PreTrainedTokenizerFast, BatchEncoding, DataCollatorWithPadding
|
| 9 |
from transformers.modeling_utils import PreTrainedModel
|
| 10 |
from transformers.models.auto import AutoTokenizer
|
|
|
|
| 11 |
from transformers.modeling_outputs import BaseModelOutputWithPast
|
| 12 |
from transformers.modeling_attn_mask_utils import _prepare_4d_attention_mask, _prepare_4d_attention_mask_for_sdpa
|
| 13 |
from transformers import MistralModel, MistralConfig
|
|
|
|
| 38 |
layer.self_attn.is_causal = False
|
| 39 |
self._attn_implementation = "eager"
|
| 40 |
|
|
|
|
| 41 |
def forward(
|
| 42 |
self,
|
| 43 |
input_ids: torch.LongTensor = None,
|