Spaces:
Sleeping
Sleeping
Commit
·
a2fb673
1
Parent(s):
b8415ff
small
Browse files
app.py
CHANGED
|
@@ -136,13 +136,13 @@ class RepLlamaModel:
|
|
| 136 |
batch_dict = create_batch_dict(self.tokenizer, batch_texts, always_add_eos="last")
|
| 137 |
batch_dict = {key: value.cuda() for key, value in batch_dict.items()}
|
| 138 |
|
| 139 |
-
|
| 140 |
-
|
| 141 |
-
|
| 142 |
-
|
| 143 |
-
|
| 144 |
-
|
| 145 |
-
|
| 146 |
|
| 147 |
self.model = self.model.cpu()
|
| 148 |
return np.concatenate(all_embeddings, axis=0)
|
|
|
|
| 136 |
batch_dict = create_batch_dict(self.tokenizer, batch_texts, always_add_eos="last")
|
| 137 |
batch_dict = {key: value.cuda() for key, value in batch_dict.items()}
|
| 138 |
|
| 139 |
+
with torch.cuda.amp.autocast():
|
| 140 |
+
with torch.no_grad():
|
| 141 |
+
outputs = self.model(**batch_dict)
|
| 142 |
+
embeddings = pool(outputs.last_hidden_state, batch_dict['attention_mask'], 'last')
|
| 143 |
+
embeddings = F.normalize(embeddings, p=2, dim=-1)
|
| 144 |
+
logger.info(f"Encoded shape: {embeddings.shape}, Norm of first embedding: {torch.norm(embeddings[0]).item()}")
|
| 145 |
+
all_embeddings.append(embeddings.cpu().numpy())
|
| 146 |
|
| 147 |
self.model = self.model.cpu()
|
| 148 |
return np.concatenate(all_embeddings, axis=0)
|