Spaces: Sleeping
Update scrape_3gpp.py
Browse files
- scrape_3gpp.py (+2 -2)
scrape_3gpp.py
CHANGED
|
@@ -449,8 +449,8 @@ def extractionPrincipale(url, excel_file=None, status_list=None, progress=gr.Pro
|
|
| 449 |
tabLine.append([pdfPage,selectedText,key])
|
| 450 |
print(f"Selected line in keywords is: {line}")
|
| 451 |
for r in tabLine:
|
| 452 |
-
|
| 453 |
-
|
| 454 |
|
| 455 |
# Add more categories as needed
|
| 456 |
contenu = "\n".join(extracted_content)
|
|
|
|
| 449 |
tabLine.append([pdfPage,selectedText,key])
|
| 450 |
print(f"Selected line in keywords is: {line}")
|
| 451 |
for r in tabLine:
|
| 452 |
+
extracted_content.append(f'PDF Page number {r[0]} extracted text from the KEYWORD {r[2]} : \n')
|
| 453 |
+
extracted_content.append(' '.join(r[1]))
|
| 454 |
|
| 455 |
# Add more categories as needed
|
| 456 |
contenu = "\n".join(extracted_content)
|