Spaces:

ignitariumcloud
/

TI_demo_E2E

Sleeping

arjunanand13 committed on Jun 12, 2025

Commit

5321ee9

verified ·

1 Parent(s): 3366453

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -50,7 +50,17 @@ class DocumentRetrievalAndGeneration:
     def create_faiss_index(self):
         all_texts = [split.page_content for split in self.all_splits]
-        embeddings = self.encode_texts(all_texts)
         index = faiss.IndexFlatL2(embeddings.shape[1])
         index.add(embeddings)
         gpu_resource = faiss.StandardGpuResources()

     def create_faiss_index(self):
         all_texts = [split.page_content for split in self.all_splits]
+        batch_size = 32
+        all_embeddings = []
+        for i in range(0, len(all_texts), batch_size):
+            batch_texts = all_texts[i:i+batch_size]
+            batch_embeddings = self.encode_texts(batch_texts)
+            all_embeddings.append(batch_embeddings)
+            print(f"Processed batch {i//batch_size + 1}/{(len(all_texts) + batch_size - 1)//batch_size}")
+        embeddings = np.vstack(all_embeddings)
         index = faiss.IndexFlatL2(embeddings.shape[1])
         index.add(embeddings)
         gpu_resource = faiss.StandardGpuResources()