NavyDevilDoc committed on
Commit
06e0412
·
verified ·
1 Parent(s): 39f313e

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +10 -2
app.py CHANGED
@@ -124,8 +124,16 @@ class PersistentSearchEngine:
124
  self.collection = self.client.get_or_create_collection(name=collection_name)
125
 
126
  # 2. Load Models
127
- self.bi_encoder = SentenceTransformer('all-MiniLM-L6-v2')
128
- self.cross_encoder = CrossEncoder('cross-encoder/ms-marco-MiniLM-L-6-v2')
 
 
 
 
 
 
 
 
129
 
130
  # 3. Initialize/Load BM25 (Sparse)
131
  self.bm25 = None
 
124
  self.collection = self.client.get_or_create_collection(name=collection_name)
125
 
126
  # 2. Load Models
127
+ # We force the device to CPU to avoid "meta tensor" errors in Docker
128
+ device = "cpu"
129
+ self.bi_encoder = SentenceTransformer('all-MiniLM-L6-v2', device=device)
130
+
131
+ # We disable "low_cpu_mem_usage" so the weights are fully loaded into memory instead of being left as empty placeholders on the "meta" device
132
+ self.cross_encoder = CrossEncoder(
133
+ 'cross-encoder/ms-marco-MiniLM-L-6-v2',
134
+ device=device,
135
+ automodel_args={"low_cpu_mem_usage": False}
136
+ )
137
 
138
  # 3. Initialize/Load BM25 (Sparse)
139
  self.bm25 = None