Spaces:
Running
Running
import logging | |
import json | |
from typing import Optional, List | |
from open_webui.retrieval.web.main import SearchResult, get_filtered_results | |
from open_webui.env import SRC_LOG_LEVELS | |
log = logging.getLogger(__name__) | |
log.setLevel(SRC_LOG_LEVELS["RAG"]) | |
def search_sougou( | |
sougou_api_sid: str, | |
sougou_api_sk: str, | |
query: str, | |
count: int, | |
filter_list: Optional[List[str]] = None, | |
) -> List[SearchResult]: | |
from tencentcloud.common.common_client import CommonClient | |
from tencentcloud.common import credential | |
from tencentcloud.common.exception.tencent_cloud_sdk_exception import ( | |
TencentCloudSDKException, | |
) | |
from tencentcloud.common.profile.client_profile import ClientProfile | |
from tencentcloud.common.profile.http_profile import HttpProfile | |
try: | |
cred = credential.Credential(sougou_api_sid, sougou_api_sk) | |
http_profile = HttpProfile() | |
http_profile.endpoint = "tms.tencentcloudapi.com" | |
client_profile = ClientProfile() | |
client_profile.http_profile = http_profile | |
params = json.dumps({"Query": query, "Cnt": 20}) | |
common_client = CommonClient( | |
"tms", "2020-12-29", cred, "", profile=client_profile | |
) | |
results = [ | |
json.loads(page) | |
for page in common_client.call_json("SearchPro", json.loads(params))[ | |
"Response" | |
]["Pages"] | |
] | |
sorted_results = sorted( | |
results, key=lambda x: x.get("scour", 0.0), reverse=True | |
) | |
if filter_list: | |
sorted_results = get_filtered_results(sorted_results, filter_list) | |
return [ | |
SearchResult( | |
link=result.get("url"), | |
title=result.get("title"), | |
snippet=result.get("passage"), | |
) | |
for result in sorted_results[:count] | |
] | |
except TencentCloudSDKException as err: | |
log.error(f"Error in Sougou search: {err}") | |
return [] | |