Update handler.py
Browse files - handler.py +1 -1
handler.py
CHANGED
|
@@ -4,7 +4,7 @@ class EndpointHandler:
|
|
| 4 |
def __init__(self, path=""):
|
| 5 |
# Here is the magic override that bypasses the Hugging Face bug
|
| 6 |
print("Initializing Nemotron 8B with trust_remote_code=True...")
|
| 7 |
-
self.model = SentenceTransformer("nvidia/llama-embed-nemotron-8b", trust_remote_code=True)
|
| 8 |
print("Model loaded successfully!")
|
| 9 |
|
| 10 |
def __call__(self, data):
|
|
|
|
| 4 |
def __init__(self, path=""):
|
| 5 |
# Here is the magic override that bypasses the Hugging Face bug
|
| 6 |
print("Initializing Nemotron 8B with trust_remote_code=True...")
|
| 7 |
+
self.model = SentenceTransformer("nvidia/llama-embed-nemotron-8b", trust_remote_code=True,model_kwargs={"attn_implementation": "eager"})
|
| 8 |
print("Model loaded successfully!")
|
| 9 |
|
| 10 |
def __call__(self, data):
|