Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
@@ -46,7 +46,7 @@ class Config:
|
|
46 |
CHUNK_SIZE = 512
|
47 |
MAX_WORKERS = 5
|
48 |
INDEXED_URLS = {
|
49 |
-
"https://drive.google.com/file/d/1d5kkqaQkdiA2SwJ0JFrTuKO9zauiUtFz
|
50 |
}
|
51 |
|
52 |
class ResourceItem:
|
@@ -153,8 +153,9 @@ class SchoolChatbot:
|
|
153 |
crawler = RobustCrawler()
|
154 |
response = crawler.crawl_with_exponential_backoff(url)
|
155 |
if not response:
|
|
|
156 |
return
|
157 |
-
|
158 |
content_type = response.headers.get("Content-Type", "").lower()
|
159 |
|
160 |
try:
|
@@ -165,6 +166,7 @@ class SchoolChatbot:
|
|
165 |
elif "application/pdf" in content_type:
|
166 |
self.extract_pdf_content(url, response.content)
|
167 |
else:
|
|
|
168 |
self.store_resource(url, response.text, 'unknown')
|
169 |
except Exception as e:
|
170 |
logger.error(f"Error processing {url}: {e}")
|
|
|
46 |
CHUNK_SIZE = 512
|
47 |
MAX_WORKERS = 5
|
48 |
INDEXED_URLS = {
|
49 |
+
"https://drive.google.com/file/d/1d5kkqaQkdiA2SwJ0JFrTuKO9zauiUtFz/view?usp=sharing"
|
50 |
}
|
51 |
|
52 |
class ResourceItem:
|
|
|
153 |
crawler = RobustCrawler()
|
154 |
response = crawler.crawl_with_exponential_backoff(url)
|
155 |
if not response:
|
156 |
+
logger.error(f"Failed to retrieve content from {url}. Please check the URL and permissions.")
|
157 |
return
|
158 |
+
|
159 |
content_type = response.headers.get("Content-Type", "").lower()
|
160 |
|
161 |
try:
|
|
|
166 |
elif "application/pdf" in content_type:
|
167 |
self.extract_pdf_content(url, response.content)
|
168 |
else:
|
169 |
+
logger.warning(f"Unknown content type for {url}: {content_type}")
|
170 |
self.store_resource(url, response.text, 'unknown')
|
171 |
except Exception as e:
|
172 |
logger.error(f"Error processing {url}: {e}")
|