mirror of https://github.com/stijndcl/didier
90 lines
2.3 KiB
Python
90 lines
2.3 KiB
Python
from typing import List
|
|
|
|
import discord
|
|
from bs4 import BeautifulSoup
|
|
from dataclasses import dataclass
|
|
from requests import get
|
|
from urllib.parse import urlencode, unquote_plus
|
|
|
|
|
|
@dataclass
|
|
class SearchResult:
|
|
status_code: int
|
|
query: str
|
|
results: List[str]
|
|
|
|
def __post_init__(self):
|
|
self.query = unquote_plus(self.query[2:])
|
|
|
|
|
|
def google_search(query) -> SearchResult:
|
|
"""
|
|
Function to get Google search results
|
|
"""
|
|
headers = {
|
|
'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/74.0.3729.169 Safari/537.36'
|
|
}
|
|
|
|
query = urlencode({"q": query})
|
|
|
|
# Get 20 results in case some of them are None
|
|
resp = get("https://www.google.com/search?{}&num=20&hl=en".format(query), headers=headers)
|
|
|
|
if resp.status_code != 200:
|
|
return SearchResult(resp.status_code, query, [])
|
|
|
|
bs = BeautifulSoup(resp.text, "html.parser")
|
|
|
|
def getContent(element):
|
|
"""
|
|
Function to find links & titles in the HTML of a <div> element
|
|
"""
|
|
link = element.find("a", href=True)
|
|
title = element.find("h3")
|
|
|
|
if link is None or not link["href"].startswith(("http://", "https://",)) or title is None:
|
|
return None
|
|
|
|
return link["href"], title.text
|
|
|
|
divs = bs.find_all("div", attrs={"class": "g"})
|
|
|
|
results = list(getContent(d) for d in divs)
|
|
|
|
# Filter out Nones
|
|
results = list(filter(lambda x: x is not None, results))
|
|
|
|
# Map to urls
|
|
links = []
|
|
for (l, t) in results:
|
|
links.append(f"[{t}]({l})")
|
|
|
|
return SearchResult(200, query, links[:10])
|
|
|
|
|
|
def create_google_embed(result: SearchResult) -> discord.Embed:
|
|
embed = discord.Embed(colour=discord.Colour.blue())
|
|
embed.set_author(name="Google Search")
|
|
|
|
# Empty list of results
|
|
if len(result.results) == 0:
|
|
embed.colour = discord.Colour.red()
|
|
embed.description = "Geen resultaten gevonden."
|
|
return embed
|
|
|
|
# Add results into a field
|
|
links = []
|
|
|
|
for index, link in enumerate(result.results):
|
|
links.append(f"{index + 1}: {link}")
|
|
|
|
embed.description = "\n".join(links)
|
|
|
|
# Add query into embed
|
|
if len(result.query) > 256:
|
|
embed.title = result.query[:253] + "..."
|
|
else:
|
|
embed.title = result.query
|
|
|
|
return embed
|