Rulga committed on
Commit
58849bb
·
1 Parent(s): feee140

Enhance document loading process with detailed logging and improved error handling

Browse files
Files changed (1) hide show
  1. api/fastapi_server.py +9 -2
api/fastapi_server.py CHANGED
@@ -232,19 +232,26 @@ def build_knowledge_base():
232
  # Create folder in advance
233
  os.makedirs(VECTOR_STORE_PATH, exist_ok=True)
234
 
235
- # Load documents
236
  for url in URLS:
237
  try:
 
238
  loader = WebBaseLoader(url)
239
  docs = loader.load()
 
240
  documents.extend(docs)
241
  print(f"Loaded {url}")
242
  except Exception as e:
243
  print(f"Failed to load {url}: {str(e)}")
 
244
  continue
245
 
 
 
246
  if not documents:
247
- raise HTTPException(status_code=500, detail="No documents loaded!")
 
 
248
 
249
  # Split into chunks
250
  text_splitter = RecursiveCharacterTextSplitter(
 
232
  # Create folder in advance
233
  os.makedirs(VECTOR_STORE_PATH, exist_ok=True)
234
 
235
+ # Load documents with detailed logging
236
  for url in URLS:
237
  try:
238
+ print(f"Attempting to load {url}")
239
  loader = WebBaseLoader(url)
240
  docs = loader.load()
241
+ print(f"Successfully loaded {url}, got {len(docs)} documents")
242
  documents.extend(docs)
243
  print(f"Loaded {url}")
244
  except Exception as e:
245
  print(f"Failed to load {url}: {str(e)}")
246
+ print(f"Full error: {traceback.format_exc()}")
247
  continue
248
 
249
+ print(f"Total documents loaded: {len(documents)}")
250
+
251
  if not documents:
252
+ error_msg = "No documents loaded! Check if the URLs are accessible and contain valid content."
253
+ print(error_msg)
254
+ raise HTTPException(status_code=500, detail=error_msg)
255
 
256
  # Split into chunks
257
  text_splitter = RecursiveCharacterTextSplitter(