serper.py 1.21 KB
Newer Older
1
2
import json
import logging
3
from typing import List
4
5
import requests

6
from apps.rag.search.main import SearchResult, filter_by_whitelist
Timothy J. Baek's avatar
Timothy J. Baek committed
7
from config import SRC_LOG_LEVELS
8
9
10
11
12

log = logging.getLogger(__name__)
log.setLevel(SRC_LOG_LEVELS["RAG"])


13
def search_serper(api_key: str, query: str, count: int, whitelist:List[str]) -> list[SearchResult]:
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
    """Search using serper.dev's API and return the results as a list of SearchResult objects.

    Args:
        api_key (str): A serper.dev API key
        query (str): The query to search for
    """
    url = "https://google.serper.dev/search"

    payload = json.dumps({"q": query})
    headers = {"X-API-KEY": api_key, "Content-Type": "application/json"}

    response = requests.request("POST", url, headers=headers, data=payload)
    response.raise_for_status()

    json_response = response.json()
    results = sorted(
        json_response.get("organic", []), key=lambda x: x.get("position", 0)
    )
32
    filtered_results = filter_by_whitelist(results, whitelist)
33
34
    return [
        SearchResult(
35
            link=result["link"],
36
37
38
            title=result.get("title"),
            snippet=result.get("description"),
        )
39
        for result in filtered_results[:count]
40
    ]