2024-05-06 04:27:46 +00:00
|
|
|
import json
|
|
|
|
import logging
|
2024-08-14 12:46:31 +00:00
|
|
|
from typing import Optional
|
2024-05-06 04:27:46 +00:00
|
|
|
|
2024-08-27 22:10:27 +00:00
|
|
|
import requests
|
2024-12-12 02:05:42 +00:00
|
|
|
from open_webui.retrieval.web.main import SearchResult, get_filtered_results
|
2024-09-04 14:54:48 +00:00
|
|
|
from open_webui.env import SRC_LOG_LEVELS
|
2024-05-06 04:27:46 +00:00
|
|
|
|
|
|
|
log = logging.getLogger(__name__)
|
|
|
|
log.setLevel(SRC_LOG_LEVELS["RAG"])
|
|
|
|
|
|
|
|
|
2024-06-17 21:32:23 +00:00
|
|
|
def search_serper(
|
2024-08-14 12:46:31 +00:00
|
|
|
api_key: str, query: str, count: int, filter_list: Optional[list[str]] = None
|
2024-06-17 21:32:23 +00:00
|
|
|
) -> list[SearchResult]:
|
2024-05-06 04:27:46 +00:00
|
|
|
"""Search using serper.dev's API and return the results as a list of SearchResult objects.
|
|
|
|
|
|
|
|
Args:
|
|
|
|
api_key (str): A serper.dev API key
|
|
|
|
query (str): The query to search for
|
|
|
|
"""
|
|
|
|
url = "https://google.serper.dev/search"
|
|
|
|
|
|
|
|
payload = json.dumps({"q": query})
|
|
|
|
headers = {"X-API-KEY": api_key, "Content-Type": "application/json"}
|
|
|
|
|
|
|
|
response = requests.request("POST", url, headers=headers, data=payload)
|
|
|
|
response.raise_for_status()
|
|
|
|
|
|
|
|
json_response = response.json()
|
|
|
|
results = sorted(
|
|
|
|
json_response.get("organic", []), key=lambda x: x.get("position", 0)
|
|
|
|
)
|
2024-06-17 07:37:26 +00:00
|
|
|
if filter_list:
|
|
|
|
results = get_filtered_results(results, filter_list)
|
2024-05-06 04:27:46 +00:00
|
|
|
return [
|
|
|
|
SearchResult(
|
2024-05-06 08:39:25 +00:00
|
|
|
link=result["link"],
|
2024-05-06 04:27:46 +00:00
|
|
|
title=result.get("title"),
|
|
|
|
snippet=result.get("description"),
|
|
|
|
)
|
2024-06-17 07:37:26 +00:00
|
|
|
for result in results[:count]
|
2024-05-06 04:27:46 +00:00
|
|
|
]
|