rohannsinghal
/

nemotron-custom-handler

Model card Files Files and versions

rohannsinghal committed on Mar 19

Commit

1d35377

·

verified ·

1 Parent(s): 803fdb2

Create handler.py

Files changed (1) hide show

handler.py +21 -0

handler.py ADDED Viewed

	@@ -0,0 +1,21 @@

+from sentence_transformers import SentenceTransformer
class EndpointHandler:
    """Callable request handler that embeds text with a SentenceTransformer model.

    The model is loaded once in ``__init__``; each call encodes the request's
    text and returns the embeddings as plain Python lists.
    """

    def __init__(self, path=""):
        """Load the embedding model.

        Args:
            path: Accepted for interface compatibility but not used; the model
                is always loaded by its hub id below.
        """
        # The hub id is hard-coded and trust_remote_code=True is passed on
        # purpose: the original author notes this works around a Hugging Face
        # loading bug, so `path` is deliberately ignored.
        print("Initializing Nemotron 8B with trust_remote_code=True...")
        self.model = SentenceTransformer("nvidia/llama-embed-nemotron-8b", trust_remote_code=True)
        print("Model loaded successfully!")

    def __call__(self, data):
        """Encode the text carried by a request and return its embeddings.

        Args:
            data: Either a dict holding the text under the ``"inputs"`` key,
                or the text itself (a string or a list of strings). A dict
                without ``"inputs"`` is forwarded to the model unchanged, as
                before.

        Returns:
            Whatever ``self.model.encode(...)`` produces, converted with
            ``.tolist()`` so it is made of standard Python lists.
        """
        if isinstance(data, dict):
            # Read with get() rather than pop() so the caller's request dict
            # is not mutated as a side effect of handling it.
            inputs = data.get("inputs", data)
        else:
            # A bare string/list payload has no usable .pop("inputs", ...);
            # treat it as the text to embed instead of raising.
            inputs = data
        embeddings = self.model.encode(inputs)
        return embeddings.tolist()