Update services/pdf_service.py
Browse files
- services/pdf_service.py +7 -1
services/pdf_service.py
CHANGED
|
@@ -146,11 +146,17 @@ class PDFService:
|
|
| 146 |
|
| 147 |
score = 1 - distances[0][i] # Convert distance to similarity score
|
| 148 |
print(f"Chunk Index: {idx}, Distance: {distances[0][i]}, Score: {score}")
|
|
|
|
|
|
|
| 149 |
if score < min_score:
|
| 150 |
-
|
|
|
|
|
|
|
| 151 |
|
| 152 |
chunk = self.chunks[idx].copy()
|
| 153 |
chunk['score'] = score
|
|
|
|
|
|
|
| 154 |
results.append(chunk)
|
| 155 |
|
| 156 |
# Sort by score and take top_k
|
|
|
|
| 146 |
|
| 147 |
score = 1 - distances[0][i] # Convert distance to similarity score
|
| 148 |
print(f"Chunk Index: {idx}, Distance: {distances[0][i]}, Score: {score}")
|
| 149 |
+
print("----- score < min_score")
|
| 150 |
+
print(score < min_score)
|
| 151 |
if score < min_score:
|
| 152 |
+
print("skipped ---- ")
|
| 153 |
+
|
| 154 |
+
#continue # Skip low scores
|
| 155 |
|
| 156 |
chunk = self.chunks[idx].copy()
|
| 157 |
chunk['score'] = score
|
| 158 |
+
print("---- chuck " )
|
| 159 |
+
print(chunk)
|
| 160 |
results.append(chunk)
|
| 161 |
|
| 162 |
# Sort by score and take top_k
|