Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
@@ -131,6 +131,7 @@ def process_directory(directory):
|
|
131 |
with open(file_path, 'rb') as f:
|
132 |
if file_ext in ['.rst', '.md', '.txt', '.html', '.json', '.yaml', '.py']:
|
133 |
text = f.read().decode('utf-8')
|
|
|
134 |
elif file_ext == '.pdf':
|
135 |
reader = PdfReader(f)
|
136 |
text = ""
|
@@ -145,7 +146,8 @@ def process_directory(directory):
|
|
145 |
|
146 |
all_texts.append(text)
|
147 |
file_references.append(file_path)
|
148 |
-
|
|
|
149 |
return all_texts, file_references
|
150 |
|
151 |
|
|
|
131 |
with open(file_path, 'rb') as f:
|
132 |
if file_ext in ['.rst', '.md', '.txt', '.html', '.json', '.yaml', '.py']:
|
133 |
text = f.read().decode('utf-8')
|
134 |
+
print(f"Extracted text from {file_path}:\n{text[:200]}...\n")
|
135 |
elif file_ext == '.pdf':
|
136 |
reader = PdfReader(f)
|
137 |
text = ""
|
|
|
146 |
|
147 |
all_texts.append(text)
|
148 |
file_references.append(file_path)
|
149 |
+
|
150 |
+
print(f"All extracted texts:\n{all_texts}")
|
151 |
return all_texts, file_references
|
152 |
|
153 |
|