Spaces:
Paused
Paused
| import logging | |
| import requests | |
| from open_webui.retrieval.web.main import SearchResult | |
| from open_webui.env import SRC_LOG_LEVELS | |
| from yarl import URL | |
| log = logging.getLogger(__name__) | |
| log.setLevel(SRC_LOG_LEVELS["RAG"]) | |
| def search_jina(api_key: str, query: str, count: int) -> list[SearchResult]: | |
| """ | |
| Search using Jina's Search API and return the results as a list of SearchResult objects. | |
| Args: | |
| query (str): The query to search for | |
| count (int): The number of results to return | |
| Returns: | |
| list[SearchResult]: A list of search results | |
| """ | |
| jina_search_endpoint = "https://s.jina.ai/" | |
| headers = { | |
| "Accept": "application/json", | |
| "Content-Type": "application/json", | |
| "Authorization": api_key, | |
| "X-Retain-Images": "none", | |
| } | |
| payload = {"q": query, "count": count if count <= 10 else 10} | |
| url = str(URL(jina_search_endpoint)) | |
| response = requests.post(url, headers=headers, json=payload) | |
| response.raise_for_status() | |
| data = response.json() | |
| results = [] | |
| for result in data["data"]: | |
| results.append( | |
| SearchResult( | |
| link=result["url"], | |
| title=result.get("title"), | |
| snippet=result.get("content"), | |
| ) | |
| ) | |
| return results | |