Spaces:
Sleeping
Sleeping
Update scrape_3gpp.py
Browse files- scrape_3gpp.py +2 -2
scrape_3gpp.py
CHANGED
@@ -449,8 +449,8 @@ def extractionPrincipale(url, excel_file=None, status_list=None, progress=gr.Pro
|
|
449 |
tabLine.append([pdfPage,selectedText,key])
|
450 |
print(f"Selected line in keywords is: {line}")
|
451 |
for r in tabLine:
|
452 |
-
|
453 |
-
|
454 |
|
455 |
# Add more categories as needed
|
456 |
contenu = "\n".join(extracted_content)
|
|
|
449 |
tabLine.append([pdfPage,selectedText,key])
|
450 |
print(f"Selected line in keywords is: {line}")
|
451 |
for r in tabLine:
|
452 |
+
extracted_content.append(f'PDF Page number {r[0]} extracted text from the KEYWORD {r[2]} : \n')
|
453 |
+
extracted_content.append(' '.join(r[1]))
|
454 |
|
455 |
# Add more categories as needed
|
456 |
contenu = "\n".join(extracted_content)
|