Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
|
@@ -19,22 +19,14 @@ class ParrotletRetriever:
|
|
| 19 |
|
| 20 |
# Load tokenizer and model
|
| 21 |
self.tokenizer = AutoTokenizer.from_pretrained(model_name, token=HF_TOKEN)
|
| 22 |
-
self.model = AutoModel.from_pretrained(model_name, trust_remote_code=True, token=HF_TOKEN)
|
| 23 |
self.model.to(self.device)
|
| 24 |
self.model.eval()
|
| 25 |
|
| 26 |
-
# Pinecone initialization (unchanged)
|
| 27 |
self.pinecone_namespace = os.environ.get("NAMESPACE")
|
| 28 |
self.pinecone_client = Pinecone(api_key=os.environ.get("PINECONE_API_KEY"))
|
| 29 |
self.pinecone_index = self.pinecone_client.Index(host=os.environ.get("PINECONE_HOST"))
|
| 30 |
|
| 31 |
-
print(f"Connected to Pinecone index: {index_name}")
|
| 32 |
-
if self.pinecone_namespace:
|
| 33 |
-
print(f"🔹 Using namespace: {self.pinecone_namespace}")
|
| 34 |
-
|
| 35 |
-
# --------------------------
|
| 36 |
-
# Mean Pooling
|
| 37 |
-
# --------------------------
|
| 38 |
def mean_pooling(self, model_output, attention_mask):
|
| 39 |
"""Mean pooling for sentence embeddings."""
|
| 40 |
token_embeddings = model_output[0]
|
|
|
|
| 19 |
|
| 20 |
# Load tokenizer and model
|
| 21 |
self.tokenizer = AutoTokenizer.from_pretrained(model_name, token=HF_TOKEN)
|
| 22 |
+
self.model = AutoModel.from_pretrained(model_name, trust_remote_code=True, token=os.getenv("HF_TOKEN"))
|
| 23 |
self.model.to(self.device)
|
| 24 |
self.model.eval()
|
| 25 |
|
|
|
|
| 26 |
self.pinecone_namespace = os.environ.get("NAMESPACE")
|
| 27 |
self.pinecone_client = Pinecone(api_key=os.environ.get("PINECONE_API_KEY"))
|
| 28 |
self.pinecone_index = self.pinecone_client.Index(host=os.environ.get("PINECONE_HOST"))
|
| 29 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 30 |
def mean_pooling(self, model_output, attention_mask):
|
| 31 |
"""Mean pooling for sentence embeddings."""
|
| 32 |
token_embeddings = model_output[0]
|