# iptv/M3U8/scrapers/tvpass.py

import re

import httpx

from .utils import Cache, Time, get_logger, leagues

# Module-level logger, named after this module.
log = get_logger(__name__)

# Shared store of scraped events, filled in by scrape(). Keys are the event
# keys built in get_events(); each value is a dict with the "url", "logo",
# "id", "base" and "timestamp" fields.
urls: dict[str, dict[str, str | float]] = {}

# Cache backing scrape(); scrape() returns early when load() yields data.
# NOTE(review): exp=86_400 presumably means a 24-hour expiry in seconds -
# confirm against the Cache implementation in .utils.
CACHE_FILE = Cache("tvpass.json", exp=86_400)

# Playlist endpoint fetched by get_data().
BASE_URL = "https://tvpass.org/playlist/m3u"

# Short source tag appended in parentheses to every event key.
TAG = "TVP"


async def get_data(client: httpx.AsyncClient) -> list[str]:
    """Download the playlist at ``BASE_URL`` and return it split into lines.

    Args:
        client: HTTP client used to issue the GET request.

    Returns:
        The lines of the response body, or an empty list when the request
        raises or the response status is an error (the failure is logged).
    """
    try:
        response = await client.get(BASE_URL)
        response.raise_for_status()
    except Exception as e:
        # Best-effort fetch: report the failure and hand back nothing to parse.
        log.error(f'Failed to fetch "{BASE_URL}": {e}')
        return []
    else:
        playlist_lines = response.text.splitlines()
        return playlist_lines


async def get_events(client: httpx.AsyncClient) -> dict[str, dict[str, str | float]]:
    """Build event entries from the playlist returned by ``get_data``.

    An ``#EXTINF`` line becomes an event only when all of the following hold:

    * its ``tvg-id`` attribute is missing or empty,
    * it has a non-empty ``tvg-name`` attribute,
    * it has a ``group-title`` attribute,
    * the line right after it (the stream URL) ends with ``/sd``.

    Entries that fail any of these checks are skipped rather than raising, so
    a single malformed playlist entry cannot abort the whole scrape.

    Args:
        client: HTTP client forwarded to ``get_data``.

    Returns:
        Mapping of ``"[SPORT] event (TAG)"`` keys to dicts holding the
        ``url``, ``logo``, ``id``, ``base`` and ``timestamp`` of each event.
        Empty when the playlist is empty or contains no matching entries.
    """
    now = Time.now().timestamp()

    events: dict[str, dict[str, str | float]] = {}

    data = await get_data(client)

    # Pair each line with the one that follows it. A trailing "#EXTINF" line
    # has no URL after it and is dropped by zip() instead of indexing past the
    # end of the list.
    for line, url in zip(data, data[1:]):
        if not line.startswith("#EXTINF"):
            continue

        tvg_id_match = re.search(r'tvg-id="([^"]*)"', line)

        # Entries that carry a tvg-id are not collected here.
        if tvg_id_match and tvg_id_match[1]:
            continue

        if not url.endswith("/sd"):
            continue

        tvg_name_match = re.search(r'tvg-name="([^"]*)"', line)
        group_title_match = re.search(r'group-title="([^"]*)"', line)

        # re.search returns None when the attribute is absent; skip the entry
        # instead of subscripting None.
        if not tvg_name_match or not group_title_match:
            continue

        tvg_name = tvg_name_match[1]

        if not tvg_name:
            continue

        sport = group_title_match[1].upper().strip()

        # Drop the last parenthesised suffix of the name; when the name has no
        # "(" at all, keep it whole rather than producing an empty event name.
        head, paren, _ = tvg_name.rpartition("(")
        event = (head if paren else tvg_name).strip()

        key = f"[{sport}] {event} ({TAG})"

        # The URL ends with "/sd", so the segment before it names the channel.
        channel = url.split("/")[-2]

        tvg_id, logo = leagues.info(sport)

        events[key] = {
            "url": f"http://origin.thetvapp.to/hls/{channel}/mono.m3u8",
            "logo": logo,
            "id": tvg_id or "Live.Event.us",
            "base": "https://tvpass.org",
            "timestamp": now,
        }

    return events


async def scrape(client: httpx.AsyncClient) -> None:
    """Fill the module-level ``urls`` mapping from the cache or the playlist.

    When ``CACHE_FILE.load()`` yields data it is merged into ``urls`` and no
    request is made. Otherwise the events are collected with ``get_events``,
    merged into ``urls`` and the result is written back to the cache.

    Args:
        client: HTTP client forwarded to ``get_events``.
    """
    cached = CACHE_FILE.load()

    if not cached:
        # Nothing usable in the cache: scrape and store the result.
        log.info(f'Scraping from "{BASE_URL}"')

        fresh = await get_events(client)
        urls.update(fresh)

        CACHE_FILE.write(urls)

        log.info(f"Collected and cached {len(urls)} new event(s)")
        return

    urls.update(cached)
    log.info(f"Loaded {len(urls)} event(s) from cache")
e 2025-08-19 10:54:50 -04:00			`import re`

			`import httpx`

e 2025-10-01 11:57:49 -04:00			`from .utils import Cache, Time, get_logger, leagues`
e 2025-08-30 16:45:19 -04:00
e 2025-10-01 12:37:19 -04:00			`log = get_logger(__name__)`
e 2025-08-30 16:45:19 -04:00
e 2025-11-13 12:43:55 -05:00			`urls: dict[str, dict[str, str \| float]] = {}`
e 2025-08-19 10:54:50 -04:00
e 2025-11-13 12:43:55 -05:00			`CACHE_FILE = Cache("tvpass.json", exp=86_400)`
e 2025-08-19 10:54:50 -04:00
e 2025-11-13 12:43:55 -05:00			`BASE_URL = "https://tvpass.org/playlist/m3u"`
e 2025-08-28 19:43:35 -04:00
e 2025-12-01 14:46:31 -05:00			`TAG = "TVP"`

e 2025-08-30 16:45:19 -04:00
e 2025-11-19 18:58:52 -05:00			`async def get_data(client: httpx.AsyncClient) -> list[str]:`
e 2025-08-19 10:54:50 -04:00			`try:`
e 2025-09-03 03:14:52 -04:00			`r = await client.get(BASE_URL)`
e 2025-08-19 10:54:50 -04:00			`r.raise_for_status()`
			`except Exception as e:`
e 2025-10-01 11:57:49 -04:00			`log.error(f'Failed to fetch "{BASE_URL}": {e}')`
e 2025-11-13 12:43:55 -05:00
e 2025-09-04 19:53:27 -04:00			`return []`
e 2025-08-19 10:54:50 -04:00
			`return r.text.splitlines()`


e 2025-11-19 18:58:52 -05:00			`async def get_events(client: httpx.AsyncClient) -> dict[str, dict[str, str \| float]]:`
e 2025-10-01 18:34:18 -04:00			`now = Time.now().timestamp()`

e 2025-11-19 18:58:52 -05:00			`events = {}`

			`data = await get_data(client)`
e 2025-10-01 11:57:49 -04:00
update M3U8 2025-11-21 13:32:09 -05:00			`for i, line in enumerate(data, start=1):`
e 2025-08-27 10:26:56 -04:00			`if line.startswith("#EXTINF"):`
			`tvg_id_match = re.search(r'tvg-id="([^"]*)"', line)`
e 2025-09-29 13:42:51 -04:00			`tvg_name_match = re.search(r'tvg-name="([^"]*)"', line)`
e 2025-08-28 12:18:30 -04:00			`group_title_match = re.search(r'group-title="([^"]*)"', line)`
e 2025-08-19 10:54:50 -04:00
e 2025-09-29 13:42:51 -04:00			`tvg = tvg_id_match[1] if tvg_id_match else None`
e 2025-08-19 10:54:50 -04:00
update M3U8 2025-11-21 13:32:09 -05:00			`if not tvg and (url := data[i]).endswith("/sd"):`
e 2025-09-29 13:42:51 -04:00			`if tvg_name := tvg_name_match[1]:`
			`sport = group_title_match[1].upper().strip()`
e 2025-08-19 10:54:50 -04:00
e 2025-09-29 13:42:51 -04:00			`event = "(".join(tvg_name.split("(")[:-1]).strip()`
e 2025-08-19 10:54:50 -04:00
e 2025-12-01 14:46:31 -05:00			`key = f"[{sport}] {event} ({TAG})"`
e 2025-09-13 04:42:55 -04:00
e 2025-09-20 23:26:18 -04:00			`channel = url.split("/")[-2]`

e 2025-09-24 12:30:55 -04:00			`tvg_id, logo = leagues.info(sport)`
e 2025-09-21 10:28:15 -04:00
e 2025-11-19 18:58:52 -05:00			`events[key] = {`
e 2025-09-20 23:26:18 -04:00			`"url": f"http://origin.thetvapp.to/hls/{channel}/mono.m3u8",`
e 2025-09-21 10:28:15 -04:00			`"logo": logo,`
e 2025-10-01 11:57:49 -04:00			`"id": tvg_id or "Live.Event.us",`
e 2025-09-13 04:42:55 -04:00			`"base": "https://tvpass.org",`
e 2025-10-01 18:34:18 -04:00			`"timestamp": now,`
e 2025-08-30 16:45:19 -04:00			`}`
e 2025-08-19 10:54:50 -04:00
e 2025-11-19 18:58:52 -05:00			`return events`


			`async def scrape(client: httpx.AsyncClient) -> None:`
			`if cached := CACHE_FILE.load():`
			`urls.update(cached)`
			`log.info(f"Loaded {len(urls)} event(s) from cache")`
			`return`

			`log.info(f'Scraping from "{BASE_URL}"')`

			`events = await get_events(client)`

			`urls.update(events)`
e 2025-09-13 04:42:55 -04:00
e 2025-10-01 11:57:49 -04:00			`CACHE_FILE.write(urls)`
e 2025-08-30 16:45:19 -04:00
e 2025-11-19 18:58:52 -05:00			`log.info(f"Collected and cached {len(urls)} new event(s)")`