# Scrapur/search.py

import re
from urllib.parse import quote

import requests
from lxml import html, etree


def search_site(search_string: str, timeout: float = 10.0):
    """Search prehrajto.cz and return the videos listed on the result page.

    Args:
        search_string: Raw (not yet URL-encoded) query text.
        timeout: Seconds to wait for the HTTP response; passed straight to
            ``requests.get`` so a stalled server cannot hang the caller.

    Returns:
        A list with one dict per result link, each holding:
        ``'title'`` (the link's ``title`` attribute with ``+``, ``-`` and
        ``.`` turned into spaces, or ``""`` when the attribute is absent),
        ``'href'`` (the link's ``href`` attribute as found in the page) and
        ``'thumbnail'`` (``src`` of the first matching thumbnail image, or
        ``None`` when the link contains none).
    """
    # Percent-encode the whole query as a single path segment; replacing only
    # spaces would let characters such as "?", "#", "%" or "/" alter the URL.
    search = quote(search_string, safe="")
    headers = {
        "User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/96.0.4664.110 Safari/537.36"
    }
    search_res = requests.get(
        f"https://prehrajto.cz/hledej/{search}",
        headers=headers,
        timeout=timeout,
    )
    tree = html.fromstring(search_res.content)
    links = tree.xpath('.//a[contains(@class, "video video--small video--link")]')
    if not links:
        print("EMPTYYY")

    # One translation table instead of three chained str.replace calls.
    separators = str.maketrans("+-.", "   ")
    results = []
    for link in links:
        # A missing title attribute yields None; fall back to an empty title.
        title = (link.get("title") or "").translate(separators)
        href = link.get("href")
        thumbs = link.xpath(
            './/img[contains(concat(" ", normalize-space(@class), " "), " thumb thumb1 ")]'
        )
        # Tolerate results without a thumbnail instead of raising IndexError.
        thumbnail = thumbs[0].get("src") if thumbs else None
        results.append({
            'title': title,
            'href': href,
            'thumbnail': thumbnail,
        })
    return results

def get_video_url(href: str, timeout: float = 10.0):
    """Fetch a prehrajto.cz video page and return the first storage URL in it.

    Args:
        href: Path of the video page relative to the site root; leading
            slashes are ignored so the request URL never contains ``//``.
        timeout: Seconds to wait for the HTTP response; passed straight to
            ``requests.get``.

    Returns:
        The text captured by the storage-URL pattern, exactly as it appears
        in the page source (no unescaping is applied).

    Raises:
        ValueError: If the page contains no text matching the pattern.
    """
    # Send the same browser-like User-Agent that search_site uses so both
    # requests present themselves to the site consistently.
    headers = {
        "User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/96.0.4664.110 Safari/537.36"
    }
    path = href.lstrip("/")
    video_site = requests.get(
        f"https://prehrajto.cz/{path}",
        headers=headers,
        timeout=timeout,
    )
    # Only an ASCII URL is extracted, so a stray undecodable byte elsewhere
    # in the page should not abort the lookup.
    page = video_site.content.decode("utf-8", errors="replace")
    match = re.search(r'(https:.{0,6}?storage.+?)"', page)
    if match is None:
        raise ValueError(f"no storage URL found in page for href {href!r}")
    return match.group(1)