bupa1018 committed on
Commit
5b5d449
·
1 Parent(s): 157ebd3

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +3 -1
app.py CHANGED
@@ -131,6 +131,7 @@ def process_directory(directory):
131
  with open(file_path, 'rb') as f:
132
  if file_ext in ['.rst', '.md', '.txt', '.html', '.json', '.yaml', '.py']:
133
  text = f.read().decode('utf-8')
 
134
  elif file_ext == '.pdf':
135
  reader = PdfReader(f)
136
  text = ""
@@ -145,7 +146,8 @@ def process_directory(directory):
145
 
146
  all_texts.append(text)
147
  file_references.append(file_path)
148
-
 
149
  return all_texts, file_references
150
 
151
 
 
131
  with open(file_path, 'rb') as f:
132
  if file_ext in ['.rst', '.md', '.txt', '.html', '.json', '.yaml', '.py']:
133
  text = f.read().decode('utf-8')
134
+ print(f"Extracted text from {file_path}:\n{text[:200]}...\n")
135
  elif file_ext == '.pdf':
136
  reader = PdfReader(f)
137
  text = ""
 
146
 
147
  all_texts.append(text)
148
  file_references.append(file_path)
149
+
150
+ print(f"All extracted texts:\n{all_texts}")
151
  return all_texts, file_references
152
 
153