iptv/M3U8/scrapers/tvpass.py

import re
from pathlib import Path

import httpx

from .utils import Cache, Time, get_logger, leagues

# Logger for this scraper, named after the module.
log = get_logger(__name__)

# Scraped events, mutated in place by scrape(): display key -> stream entry.
# NOTE(review): entries also carry a "timestamp" taken from
# Time.now().timestamp(), so the value type is probably wider than `str` —
# confirm before tightening this annotation.
urls: dict[str, dict[str, str]] = {}

# Playlist endpoint requested by fetch_m3u8().
BASE_URL = "https://tvpass.org/playlist/m3u"

# On-disk cache stored in the "caches" directory next to this module.
# NOTE(review): exp=86_400 is presumably a lifetime in seconds (one day) —
# confirm against the Cache implementation.
CACHE_FILE = Cache(Path(__file__).parent / "caches" / "tvpass.json", exp=86_400)


async def fetch_m3u8(client: httpx.AsyncClient) -> list[str]:
    """Download the playlist at ``BASE_URL`` and return it split into lines.

    Any exception raised while issuing the request or while checking the
    response status is logged and converted into an empty list, so callers
    only need to test the result for truthiness.
    """
    try:
        response = await client.get(BASE_URL)
        response.raise_for_status()
    except Exception as e:
        # Best-effort fetch: report the failure and let the caller carry on.
        log.error(f'Failed to fetch "{BASE_URL}": {e}')
        return []
    else:
        return response.text.splitlines()


# Attribute extractors for "#EXTINF" lines, compiled once instead of per line.
_TVG_ID_RE = re.compile(r'tvg-id="([^"]*)"')
_TVG_NAME_RE = re.compile(r'tvg-name="([^"]*)"')
_GROUP_TITLE_RE = re.compile(r'group-title="([^"]*)"')


def _parse_event(extinf: str, url: str) -> "tuple[str, str, str] | None":
    """Extract ``(sport, event, channel)`` from an ``#EXTINF`` line and its URL.

    Returns ``None`` when the pair is not a usable event entry: the line has a
    non-empty ``tvg-id``, the URL does not end in ``/hd``, or the ``tvg-name``
    / ``group-title`` attributes are missing (or ``tvg-name`` is empty).
    """
    id_match = _TVG_ID_RE.search(extinf)
    if id_match and id_match[1]:
        # Only entries without a tvg-id are collected.
        return None

    if not url.endswith("/hd"):
        return None

    name_match = _TVG_NAME_RE.search(extinf)
    group_match = _GROUP_TITLE_RE.search(extinf)
    # A missing attribute yields None from search(); skip such malformed
    # entries instead of crashing on `None[1]`.
    if not (name_match and name_match[1] and group_match):
        return None

    tvg_name = name_match[1]
    sport = group_match[1].upper().strip()

    # Drop the trailing "(...)" suffix of the name. If there is no "(" at all,
    # keep the whole name rather than producing an empty title, which would
    # make every such entry collide on the same key.
    head, sep, _ = tvg_name.rpartition("(")
    event = (head if sep else tvg_name).strip()

    # The URL ends in "/hd", so the channel is the segment right before it.
    channel = url.split("/")[-2]

    return sport, event, channel


async def scrape(client: httpx.AsyncClient) -> None:
    """Populate the module-level ``urls`` mapping with events from the playlist.

    If ``CACHE_FILE.load()`` returns a truthy value, it is merged into
    ``urls`` and no request is made. Otherwise the playlist is fetched with
    ``fetch_m3u8``; each ``#EXTINF`` line is paired with the line that follows
    it, and entries accepted by ``_parse_event`` are stored under the key
    ``"[SPORT] event (TVP)"``. The resulting mapping is then written back to
    the cache.

    Args:
        client: HTTP client passed through to ``fetch_m3u8``.
    """
    if cached := CACHE_FILE.load():
        urls.update(cached)
        log.info(f"Loaded {len(urls)} event(s) from cache")
        return

    log.info(f'Scraping from "{BASE_URL}"')

    now = Time.now().timestamp()

    if not (data := await fetch_m3u8(client)):
        log.warning("No M3U8 data received")
        return

    # Pair every line with its successor; zip() stops before the final line,
    # so a trailing "#EXTINF" without a URL line cannot index out of range.
    for extinf, url in zip(data, data[1:]):
        if not extinf.startswith("#EXTINF"):
            continue

        if not (parsed := _parse_event(extinf, url)):
            continue

        sport, event, channel = parsed

        tvg_id, logo = leagues.info(sport)

        urls[f"[{sport}] {event} (TVP)"] = {
            "url": f"http://origin.thetvapp.to/hls/{channel}/mono.m3u8",
            "logo": logo,
            "id": tvg_id or "Live.Event.us",
            "base": "https://tvpass.org",
            "timestamp": now,
        }

    CACHE_FILE.write(urls)

    log.info(f"Cached {len(urls)} event(s)")