Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
@@ -17,20 +17,19 @@ client = OpenAI(
|
|
17 |
|
18 |
# Define constants for pagination
|
19 |
RESULTS_PER_PAGE = 10
|
20 |
-
TOTAL_RESULTS =
|
21 |
|
22 |
def fetch_search_results(query):
|
23 |
-
"""Fetch search results from the LLM without streaming."""
|
24 |
if not query.strip():
|
25 |
return None, "Please enter a search query."
|
26 |
|
27 |
prompt = f"""
|
28 |
-
You are a highly accurate search engine designed to provide reliable and
|
29 |
-
|
30 |
-
- '
|
31 |
-
- '
|
32 |
-
|
33 |
-
Format the response as a JSON array of objects, where each object has 'title', 'snippet', and 'url' fields. Ensure the results are diverse, directly relevant to the query, and avoid any hallucinated or fabricated content. Double-check your URLs to match real entities or resources.
|
34 |
"""
|
35 |
|
36 |
try:
|
@@ -82,7 +81,7 @@ def check_url():
|
|
82 |
favicon_url = favicon_tag['href'] if favicon_tag and 'href' in favicon_tag.attrs else None
|
83 |
if favicon_url and not favicon_url.startswith('http'):
|
84 |
favicon_url = urljoin(url, favicon_url) # Resolve relative URLs
|
85 |
-
return jsonify({'broken': False, 'favicon': favicon_url or '🌐'})
|
86 |
else:
|
87 |
return jsonify({'broken': True, 'favicon': None})
|
88 |
except requests.RequestException:
|
|
|
17 |
|
18 |
# Define constants for pagination
|
19 |
RESULTS_PER_PAGE = 10
|
20 |
+
TOTAL_RESULTS = 30 # Generate 30 results to allow pagination
|
21 |
|
22 |
def fetch_search_results(query):
|
23 |
+
"""Fetch search results from the LLM without streaming, minimizing hallucinations."""
|
24 |
if not query.strip():
|
25 |
return None, "Please enter a search query."
|
26 |
|
27 |
prompt = f"""
|
28 |
+
You are a highly accurate search engine designed to provide reliable, factual, and verifiable results. For the given query '{query}', generate {TOTAL_RESULTS} search results. Each result must include:
|
29 |
+
- 'title': A concise, accurate title directly relevant to the query, reflecting real-world content.
|
30 |
+
- 'snippet': A short, factual summary (2-3 sentences) based strictly on real-world knowledge, avoiding any speculation.
|
31 |
+
- 'url': A valid, existing URL from well-known, real websites or domains that you are certain exist based on your training data (e.g., wikipedia.org, python.org, nytimes.com, stackoverflow.com). Strictly prohibit any fictional, random, or fabricated URLs; only include URLs you can verify as real and accessible. Absolutely no made-up domains or paths are allowed—use only URLs tied to actual entities or resources.
|
32 |
+
Format the response as a JSON array of objects, where each object has 'title', 'snippet', and 'url' fields. Ensure the results are diverse, directly relevant to the query, and free of any hallucinated or fabricated content. Before including a URL, verify it matches a real website or resource you know exists from your training data.
|
|
|
33 |
"""
|
34 |
|
35 |
try:
|
|
|
81 |
favicon_url = favicon_tag['href'] if favicon_tag and 'href' in favicon_tag.attrs else None
|
82 |
if favicon_url and not favicon_url.startswith('http'):
|
83 |
favicon_url = urljoin(url, favicon_url) # Resolve relative URLs
|
84 |
+
return jsonify({'broken': False, 'favicon': favicon_url or '🌐'})
|
85 |
else:
|
86 |
return jsonify({'broken': True, 'favicon': None})
|
87 |
except requests.RequestException:
|