acecalisto3 committed on
Commit
a4e9047
·
verified ·
1 Parent(s): 1b70f99

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +4 -2
app.py CHANGED
@@ -46,7 +46,7 @@ class Config:
46
  CHUNK_SIZE = 512
47
  MAX_WORKERS = 5
48
  INDEXED_URLS = {
49
- "https://drive.google.com/file/d/1d5kkqaQkdiA2SwJ0JFrTuKO9zauiUtFz/**/view?usp=sharing"
50
  }
51
 
52
  class ResourceItem:
@@ -153,8 +153,9 @@ class SchoolChatbot:
153
  crawler = RobustCrawler()
154
  response = crawler.crawl_with_exponential_backoff(url)
155
  if not response:
 
156
  return
157
-
158
  content_type = response.headers.get("Content-Type", "").lower()
159
 
160
  try:
@@ -165,6 +166,7 @@ class SchoolChatbot:
165
  elif "application/pdf" in content_type:
166
  self.extract_pdf_content(url, response.content)
167
  else:
 
168
  self.store_resource(url, response.text, 'unknown')
169
  except Exception as e:
170
  logger.error(f"Error processing {url}: {e}")
 
46
  CHUNK_SIZE = 512
47
  MAX_WORKERS = 5
48
  INDEXED_URLS = {
49
+ "https://drive.google.com/file/d/1d5kkqaQkdiA2SwJ0JFrTuKO9zauiUtFz/view?usp=sharing"
50
  }
51
 
52
  class ResourceItem:
 
153
  crawler = RobustCrawler()
154
  response = crawler.crawl_with_exponential_backoff(url)
155
  if not response:
156
+ logger.error(f"Failed to retrieve content from {url}. Please check the URL and permissions.")
157
  return
158
+
159
  content_type = response.headers.get("Content-Type", "").lower()
160
 
161
  try:
 
166
  elif "application/pdf" in content_type:
167
  self.extract_pdf_content(url, response.content)
168
  else:
169
+ logger.warning(f"Unknown content type for {url}: {content_type}")
170
  self.store_resource(url, response.text, 'unknown')
171
  except Exception as e:
172
  logger.error(f"Error processing {url}: {e}")