from typing import List import discord from bs4 import BeautifulSoup from dataclasses import dataclass from requests import get from urllib.parse import urlencode, unquote_plus @dataclass class SearchResult: status_code: int query: str results: List[str] def __post_init__(self): self.query = unquote_plus(self.query[2:]) def google_search(query) -> SearchResult: """ Function to get Google search results """ headers = { 'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/74.0.3729.169 Safari/537.36' } query = urlencode({"q": query}) # Get 20 results in case some of them are None resp = get("https://www.google.com/search?{}&num=20&hl=en".format(query), headers=headers) if resp.status_code != 200: return SearchResult(resp.status_code, query, []) bs = BeautifulSoup(resp.text, "html.parser") def getContent(element): """ Function to find links & titles in the HTML of a
element """ link = element.find("a", href=True) title = element.find("h3") if link is None or not link["href"].startswith(("http://", "https://",)) or title is None: return None return link["href"], title.text divs = bs.find_all("div", attrs={"class": "g"}) results = list(getContent(d) for d in divs) # Filter out Nones results = list(filter(lambda x: x is not None, results)) # Map to urls links = [] for (l, t) in results: links.append(f"[{t}]({l})") return SearchResult(200, query, links[:10]) def create_google_embed(result: SearchResult) -> discord.Embed: embed = discord.Embed(colour=discord.Colour.blue()) embed.set_author(name="Google Search") # Empty list of results if len(result.results) == 0: embed.colour = discord.Colour.red() embed.description = "Geen resultaten gevonden." return embed # Add results into a field links = [] for index, link in enumerate(result.results): links.append(f"{index + 1}: {link}") embed.description = "\n".join(links) # Add query into embed if len(result.query) > 256: embed.title = result.query[:253] + "..." else: embed.title = result.query return embed