# yt-dlp/yt_dlp/extractor/telewebion.py

from __future__ import annotations

import functools
import json
import textwrap

from .common import InfoExtractor
from ..utils import ExtractorError, format_field, int_or_none, parse_iso8601
from ..utils.traversal import traverse_obj


def _fmt_url(url):
    """Return a formatter that substitutes a single value into *url*.

    *url* is handed to ``format_field`` as its ``template`` (the callers in
    this module pass templates containing one ``%s`` placeholder), and
    ``default=None`` is forwarded as the fallback value.

    NOTE(review): ``format_field`` is invoked here without an object to
    format, and the result is used as a callable inside ``traverse_obj``
    paths, so this presumably relies on ``format_field`` supporting partial
    application - confirm against its definition in ``..utils``.
    """
    url_formatter = format_field(template=url, default=None)
    return url_formatter


class TelewebionIE(InfoExtractor):
    # Extractor for telewebion.com episode pages. Metadata is fetched from the
    # site's GraphQL endpoint; formats come from an HLS playlist whose URL is
    # built from the channel descriptor and the (hexadecimal) episode ID.
    _WORKING = False
    # The episode ID in the URL may be hexadecimal ("0x...") or plain decimal.
    _VALID_URL = r'https?://(?:www\.)?telewebion\.com/episode/(?P<id>(?:0x[a-fA-F\d]+|\d+))'
    _TESTS = [{
        'url': 'http://www.telewebion.com/episode/0x1b3139c/',
        'info_dict': {
            'id': '0x1b3139c',
            'ext': 'mp4',
            'title': 'قرعه‌کشی لیگ قهرمانان اروپا',
            'series': '+ فوتبال',
            'series_id': '0x1b2505c',
            'channel': 'شبکه 3',
            'channel_id': '0x1b1a761',
            'channel_url': 'https://telewebion.com/live/tv3',
            'timestamp': 1425522414,
            'upload_date': '20150305',
            'release_timestamp': 1425517020,
            'release_date': '20150305',
            'duration': 420,
            'view_count': int,
            'tags': ['ورزشی', 'لیگ اروپا', 'اروپا'],
            'thumbnail': 'https://static.telewebion.com/episodeImages/YjFhM2MxMDBkMDNiZTU0MjE5YjQ3ZDY0Mjk1ZDE0ZmUwZWU3OTE3OWRmMDAyODNhNzNkNjdmMWMzMWIyM2NmMA/default',
        },
        # Download options belong in 'params'; a top-level 'skip_download'
        # key on the test case itself is not picked up by the test harness.
        'params': {'skip_download': 'm3u8'},
    }, {
        # Decimal ID in the URL; the extracted 'id' is its hexadecimal form.
        'url': 'https://telewebion.com/episode/162175536',
        'info_dict': {
            'id': '0x9aa9a30',
            'ext': 'mp4',
            'title': 'کارما یعنی این !',
            'series': 'پاورقی',
            'series_id': '0x29a7426',
            'channel': 'شبکه 2',
            'channel_id': '0x1b1a719',
            'channel_url': 'https://telewebion.com/live/tv2',
            'timestamp': 1699979968,
            'upload_date': '20231114',
            'release_timestamp': 1699991638,
            'release_date': '20231114',
            'duration': 78,
            'view_count': int,
            'tags': ['کلیپ های منتخب', ' کلیپ طنز ', ' کلیپ سیاست ', 'پاورقی', 'ویژه فلسطین'],
            'thumbnail': 'https://static.telewebion.com/episodeImages/871e9455-7567-49a5-9648-34c22c197f5f/default',
        },
        'params': {'skip_download': 'm3u8'},
    }]

    def _call_graphql_api(
        self, operation, video_id, query,
        variables: dict[str, tuple[str, str]] | None = None,
        note='Downloading GraphQL JSON metadata',
    ):
        """POST a GraphQL query to graph.telewebion.com and return its ``data`` member.

        @param operation    Name of the GraphQL operation; sent as ``operationName``
                            and used as the name of the generated ``query``.
        @param video_id     ID forwarded to ``_download_json``.
        @param query        Selection set placed inside the generated query's braces.
        @param variables    Optional mapping of variable name to a
                            ``(GraphQL type, value)`` pair. The types are used
                            to declare the query parameters, the values are
                            sent in the request's ``variables`` object.
        @param note         Note forwarded to ``_download_json``.
        @returns            ``result['data']`` of the decoded JSON response.
        @raises ExtractorError  If the response is empty/falsy or has a
                            non-empty ``errors`` member.
        """
        parameters = ''
        if variables:
            # Declare each variable as "$name: Type" in the operation signature
            parameters = ', '.join(f'${name}: {type_}' for name, (type_, _) in variables.items())
            parameters = f'({parameters})'

        result = self._download_json('https://graph.telewebion.com/graphql', video_id, note, data=json.dumps({
            'operationName': operation,
            'query': f'query {operation}{parameters} @cacheControl(maxAge: 60) {{{query}\n}}\n',
            'variables': {name: value for name, (_, value) in (variables or {}).items()},
        }, separators=(',', ':')).encode(), headers={
            'Content-Type': 'application/json',
            'Accept': 'application/json',
        })
        if not result or traverse_obj(result, 'errors'):
            # Surface every error message the API reported, if there are any
            message = ', '.join(traverse_obj(result, ('errors', ..., 'message', {str})))
            raise ExtractorError(message or 'Unknown GraphQL API error')

        return result['data']

    def _real_extract(self, url):
        """Extract metadata and HLS formats for the episode addressed by *url*.

        Returns the info dict built from the first ``queryEpisode`` result of
        the ``getEpisodeDetail`` query, with ``id`` set to the hexadecimal
        episode ID.
        """
        video_id = self._match_id(url)
        if not video_id.startswith('0x'):
            # Decimal IDs are converted so that the API query, the playlist
            # URL and the reported 'id' all use the "0x..." form
            video_id = hex(int(video_id))

        episode_data = self._call_graphql_api('getEpisodeDetail', video_id, textwrap.dedent('''
            queryEpisode(filter: {EpisodeID: $EpisodeId}, first: 1) {
              title
              program {
                ProgramID
                title
              }
              image
              view_count
              duration
              started_at
              created_at
              channel {
                ChannelID
                name
                descriptor
              }
              tags {
                name
              }
            }
        '''), {'EpisodeId': ('[ID!]', video_id)})

        info_dict = traverse_obj(episode_data, ('queryEpisode', 0, {
            'title': ('title', {str}),
            'view_count': ('view_count', {int_or_none}),
            'duration': ('duration', {int_or_none}),
            'tags': ('tags', ..., 'name', {str}),
            'release_timestamp': ('started_at', {parse_iso8601}),
            'timestamp': ('created_at', {parse_iso8601}),
            'series': ('program', 'title', {str}),
            'series_id': ('program', 'ProgramID', {str}),
            'channel': ('channel', 'name', {str}),
            'channel_id': ('channel', 'ChannelID', {str}),
            'channel_url': ('channel', 'descriptor', {_fmt_url('https://telewebion.com/live/%s')}),
            'thumbnail': ('image', {_fmt_url('https://static.telewebion.com/episodeImages/%s/default')}),
            # The channel descriptor is substituted into the playlist URL,
            # which is then handed to the m3u8 format extractor
            'formats': (
                'channel', 'descriptor', {str},
                {_fmt_url(f'https://cdna.telewebion.com/%s/episode/{video_id}/playlist.m3u8')},
                {functools.partial(self._extract_m3u8_formats, video_id=video_id, ext='mp4', m3u8_id='hls')}),
        }))
        info_dict['id'] = video_id
        return info_dict
Update to ytdl-commit-be008e6 (#8836) - [utils] Make restricted filenames ignore some Unicode categories (by dirkf) - [ie/telewebion] Fix extraction (by Grub4K) - [ie/imgur] Overhaul extractor (by bashonly, Grub4K) - [ie/EpidemicSound] Add extractor (by Grub4K) Authored by: bashonly, dirkf, Grub4K Co-authored-by: bashonly <bashonly@protonmail.com> 2023-12-26 01:40:24 +01:00			`from __future__ import annotations`
[misc] Add `hatch`, `ruff`, `pre-commit` and improve dev docs (#7409) Authored by: bashonly, seproDev, Grub4K Co-authored-by: bashonly <88596187+bashonly@users.noreply.github.com> Co-authored-by: sepro <4618135+seproDev@users.noreply.github.com> 2024-05-26 21:27:21 +02:00
[ie, cleanup] No `from` stdlib imports in extractors (#8978) 2024-04-01 02:01:09 +02:00			`import functools`
Update to ytdl-commit-be008e6 (#8836) - [utils] Make restricted filenames ignore some Unicode categories (by dirkf) - [ie/telewebion] Fix extraction (by Grub4K) - [ie/imgur] Overhaul extractor (by bashonly, Grub4K) - [ie/EpidemicSound] Add extractor (by Grub4K) Authored by: bashonly, dirkf, Grub4K Co-authored-by: bashonly <bashonly@protonmail.com> 2023-12-26 01:40:24 +01:00			`import json`
[ie, cleanup] No `from` stdlib imports in extractors (#8978) 2024-04-01 02:01:09 +02:00			`import textwrap`
Update to ytdl-commit-be008e6 (#8836) - [utils] Make restricted filenames ignore some Unicode categories (by dirkf) - [ie/telewebion] Fix extraction (by Grub4K) - [ie/imgur] Overhaul extractor (by bashonly, Grub4K) - [ie/EpidemicSound] Add extractor (by Grub4K) Authored by: bashonly, dirkf, Grub4K Co-authored-by: bashonly <bashonly@protonmail.com> 2023-12-26 01:40:24 +01:00
[telewebion] Add new extractor (closes #5135) 2016-06-11 12:22:26 +02:00			`from .common import InfoExtractor`
Update to ytdl-commit-be008e6 (#8836) - [utils] Make restricted filenames ignore some Unicode categories (by dirkf) - [ie/telewebion] Fix extraction (by Grub4K) - [ie/imgur] Overhaul extractor (by bashonly, Grub4K) - [ie/EpidemicSound] Add extractor (by Grub4K) Authored by: bashonly, dirkf, Grub4K Co-authored-by: bashonly <bashonly@protonmail.com> 2023-12-26 01:40:24 +01:00			`from ..utils import ExtractorError, format_field, int_or_none, parse_iso8601`
			`from ..utils.traversal import traverse_obj`
[telewebion] Add new extractor (closes #5135) 2016-06-11 12:22:26 +02:00

Update to ytdl-commit-be008e6 (#8836) - [utils] Make restricted filenames ignore some Unicode categories (by dirkf) - [ie/telewebion] Fix extraction (by Grub4K) - [ie/imgur] Overhaul extractor (by bashonly, Grub4K) - [ie/EpidemicSound] Add extractor (by Grub4K) Authored by: bashonly, dirkf, Grub4K Co-authored-by: bashonly <bashonly@protonmail.com> 2023-12-26 01:40:24 +01:00			`def _fmt_url(url):`
[cleanup] Misc (#11347) Closes #11361 Authored by: avagordon01, bashonly, grqz, Grub4K, seproDev Co-authored-by: Ava Gordon <avagordon01@gmail.com> Co-authored-by: bashonly <bashonly@protonmail.com> Co-authored-by: N/Ame <173015200+grqz@users.noreply.github.com> Co-authored-by: Simon Sawicki <contact@grub4k.xyz> 2024-11-04 01:33:21 +01:00			`return format_field(template=url, default=None)`
[telewebion] Add new extractor (closes #5135) 2016-06-11 12:22:26 +02:00
Update to ytdl-commit-be008e6 (#8836) - [utils] Make restricted filenames ignore some Unicode categories (by dirkf) - [ie/telewebion] Fix extraction (by Grub4K) - [ie/imgur] Overhaul extractor (by bashonly, Grub4K) - [ie/EpidemicSound] Add extractor (by Grub4K) Authored by: bashonly, dirkf, Grub4K Co-authored-by: bashonly <bashonly@protonmail.com> 2023-12-26 01:40:24 +01:00
			`class TelewebionIE(InfoExtractor):`
[cleanup] Misc (#11347) Closes #11361 Authored by: avagordon01, bashonly, grqz, Grub4K, seproDev Co-authored-by: Ava Gordon <avagordon01@gmail.com> Co-authored-by: bashonly <bashonly@protonmail.com> Co-authored-by: N/Ame <173015200+grqz@users.noreply.github.com> Co-authored-by: Simon Sawicki <contact@grub4k.xyz> 2024-11-04 01:33:21 +01:00			`_WORKING = False`
Update to ytdl-commit-be008e6 (#8836) - [utils] Make restricted filenames ignore some Unicode categories (by dirkf) - [ie/telewebion] Fix extraction (by Grub4K) - [ie/imgur] Overhaul extractor (by bashonly, Grub4K) - [ie/EpidemicSound] Add extractor (by Grub4K) Authored by: bashonly, dirkf, Grub4K Co-authored-by: bashonly <bashonly@protonmail.com> 2023-12-26 01:40:24 +01:00			`_VALID_URL = r'https?://(?:www\.)?telewebion\.com/episode/(?P<id>(?:0x[a-fA-F\d]+\|\d+))'`
			`_TESTS = [{`
			`'url': 'http://www.telewebion.com/episode/0x1b3139c/',`
[telewebion] Add new extractor (closes #5135) 2016-06-11 12:22:26 +02:00			`'info_dict': {`
Update to ytdl-commit-be008e6 (#8836) - [utils] Make restricted filenames ignore some Unicode categories (by dirkf) - [ie/telewebion] Fix extraction (by Grub4K) - [ie/imgur] Overhaul extractor (by bashonly, Grub4K) - [ie/EpidemicSound] Add extractor (by Grub4K) Authored by: bashonly, dirkf, Grub4K Co-authored-by: bashonly <bashonly@protonmail.com> 2023-12-26 01:40:24 +01:00			`'id': '0x1b3139c',`
[telewebion] Add new extractor (closes #5135) 2016-06-11 12:22:26 +02:00			`'ext': 'mp4',`
Update to ytdl-commit-be008e6 (#8836) - [utils] Make restricted filenames ignore some Unicode categories (by dirkf) - [ie/telewebion] Fix extraction (by Grub4K) - [ie/imgur] Overhaul extractor (by bashonly, Grub4K) - [ie/EpidemicSound] Add extractor (by Grub4K) Authored by: bashonly, dirkf, Grub4K Co-authored-by: bashonly <bashonly@protonmail.com> 2023-12-26 01:40:24 +01:00			`'title': 'قرعه‌کشی لیگ قهرمانان اروپا',`
			`'series': '+ فوتبال',`
			`'series_id': '0x1b2505c',`
			`'channel': 'شبکه 3',`
			`'channel_id': '0x1b1a761',`
			`'channel_url': 'https://telewebion.com/live/tv3',`
			`'timestamp': 1425522414,`
			`'upload_date': '20150305',`
			`'release_timestamp': 1425517020,`
			`'release_date': '20150305',`
			`'duration': 420,`
[telewebion] Add new extractor (closes #5135) 2016-06-11 12:22:26 +02:00			`'view_count': int,`
Update to ytdl-commit-be008e6 (#8836) - [utils] Make restricted filenames ignore some Unicode categories (by dirkf) - [ie/telewebion] Fix extraction (by Grub4K) - [ie/imgur] Overhaul extractor (by bashonly, Grub4K) - [ie/EpidemicSound] Add extractor (by Grub4K) Authored by: bashonly, dirkf, Grub4K Co-authored-by: bashonly <bashonly@protonmail.com> 2023-12-26 01:40:24 +01:00			`'tags': ['ورزشی', 'لیگ اروپا', 'اروپا'],`
			`'thumbnail': 'https://static.telewebion.com/episodeImages/YjFhM2MxMDBkMDNiZTU0MjE5YjQ3ZDY0Mjk1ZDE0ZmUwZWU3OTE3OWRmMDAyODNhNzNkNjdmMWMzMWIyM2NmMA/default',`
[telewebion] Add new extractor (closes #5135) 2016-06-11 12:22:26 +02:00			`},`
Update to ytdl-commit-be008e6 (#8836) - [utils] Make restricted filenames ignore some Unicode categories (by dirkf) - [ie/telewebion] Fix extraction (by Grub4K) - [ie/imgur] Overhaul extractor (by bashonly, Grub4K) - [ie/EpidemicSound] Add extractor (by Grub4K) Authored by: bashonly, dirkf, Grub4K Co-authored-by: bashonly <bashonly@protonmail.com> 2023-12-26 01:40:24 +01:00			`'skip_download': 'm3u8',`
			`}, {`
			`'url': 'https://telewebion.com/episode/162175536',`
			`'info_dict': {`
			`'id': '0x9aa9a30',`
			`'ext': 'mp4',`
			`'title': 'کارما یعنی این !',`
			`'series': 'پاورقی',`
			`'series_id': '0x29a7426',`
			`'channel': 'شبکه 2',`
			`'channel_id': '0x1b1a719',`
			`'channel_url': 'https://telewebion.com/live/tv2',`
			`'timestamp': 1699979968,`
			`'upload_date': '20231114',`
			`'release_timestamp': 1699991638,`
			`'release_date': '20231114',`
			`'duration': 78,`
			`'view_count': int,`
			`'tags': ['کلیپ های منتخب', ' کلیپ طنز ', ' کلیپ سیاست ', 'پاورقی', 'ویژه فلسطین'],`
			`'thumbnail': 'https://static.telewebion.com/episodeImages/871e9455-7567-49a5-9648-34c22c197f5f/default',`
[telewebion] Add new extractor (closes #5135) 2016-06-11 12:22:26 +02:00			`},`
Update to ytdl-commit-be008e6 (#8836) - [utils] Make restricted filenames ignore some Unicode categories (by dirkf) - [ie/telewebion] Fix extraction (by Grub4K) - [ie/imgur] Overhaul extractor (by bashonly, Grub4K) - [ie/EpidemicSound] Add extractor (by Grub4K) Authored by: bashonly, dirkf, Grub4K Co-authored-by: bashonly <bashonly@protonmail.com> 2023-12-26 01:40:24 +01:00			`'skip_download': 'm3u8',`
			`}]`

			`def _call_graphql_api(`
			`self, operation, video_id, query,`
			`variables: dict[str, tuple[str, str]] \| None = None,`
			`note='Downloading GraphQL JSON metadata',`
			`):`
			`parameters = ''`
			`if variables:`
			`parameters = ', '.join(f'${name}: {type_}' for name, (type_, _) in variables.items())`
			`parameters = f'({parameters})'`

			`result = self._download_json('https://graph.telewebion.com/graphql', video_id, note, data=json.dumps({`
			`'operationName': operation,`
			`'query': f'query {operation}{parameters} @cacheControl(maxAge: 60) {{{query}\n}}\n',`
[cleanup] Add more ruff rules (#10149) Authored by: seproDev Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com> Reviewed-by: Simon Sawicki <contact@grub4k.xyz> 2024-06-12 01:09:58 +02:00			`'variables': {name: value for name, (_, value) in (variables or {}).items()},`
Update to ytdl-commit-be008e6 (#8836) - [utils] Make restricted filenames ignore some Unicode categories (by dirkf) - [ie/telewebion] Fix extraction (by Grub4K) - [ie/imgur] Overhaul extractor (by bashonly, Grub4K) - [ie/EpidemicSound] Add extractor (by Grub4K) Authored by: bashonly, dirkf, Grub4K Co-authored-by: bashonly <bashonly@protonmail.com> 2023-12-26 01:40:24 +01:00			`}, separators=(',', ':')).encode(), headers={`
			`'Content-Type': 'application/json',`
			`'Accept': 'application/json',`
			`})`
			`if not result or traverse_obj(result, 'errors'):`
			`message = ', '.join(traverse_obj(result, ('errors', ..., 'message', {str})))`
			`raise ExtractorError(message or 'Unknown GraphQL API error')`

			`return result['data']`
[telewebion] Add new extractor (closes #5135) 2016-06-11 12:22:26 +02:00
			`def _real_extract(self, url):`
			`video_id = self._match_id(url)`
Update to ytdl-commit-be008e6 (#8836) - [utils] Make restricted filenames ignore some Unicode categories (by dirkf) - [ie/telewebion] Fix extraction (by Grub4K) - [ie/imgur] Overhaul extractor (by bashonly, Grub4K) - [ie/EpidemicSound] Add extractor (by Grub4K) Authored by: bashonly, dirkf, Grub4K Co-authored-by: bashonly <bashonly@protonmail.com> 2023-12-26 01:40:24 +01:00			`if not video_id.startswith('0x'):`
			`video_id = hex(int(video_id))`

[ie, cleanup] No `from` stdlib imports in extractors (#8978) 2024-04-01 02:01:09 +02:00			`episode_data = self._call_graphql_api('getEpisodeDetail', video_id, textwrap.dedent('''`
Update to ytdl-commit-be008e6 (#8836) - [utils] Make restricted filenames ignore some Unicode categories (by dirkf) - [ie/telewebion] Fix extraction (by Grub4K) - [ie/imgur] Overhaul extractor (by bashonly, Grub4K) - [ie/EpidemicSound] Add extractor (by Grub4K) Authored by: bashonly, dirkf, Grub4K Co-authored-by: bashonly <bashonly@protonmail.com> 2023-12-26 01:40:24 +01:00			`queryEpisode(filter: {EpisodeID: $EpisodeId}, first: 1) {`
			`title`
			`program {`
			`ProgramID`
			`title`
			`}`
			`image`
			`view_count`
			`duration`
			`started_at`
			`created_at`
			`channel {`
			`ChannelID`
			`name`
			`descriptor`
			`}`
			`tags {`
			`name`
			`}`
			`}`
			`'''), {'EpisodeId': ('[ID!]', video_id)})`
[telewebion] Add new extractor (closes #5135) 2016-06-11 12:22:26 +02:00
Update to ytdl-commit-be008e6 (#8836) - [utils] Make restricted filenames ignore some Unicode categories (by dirkf) - [ie/telewebion] Fix extraction (by Grub4K) - [ie/imgur] Overhaul extractor (by bashonly, Grub4K) - [ie/EpidemicSound] Add extractor (by Grub4K) Authored by: bashonly, dirkf, Grub4K Co-authored-by: bashonly <bashonly@protonmail.com> 2023-12-26 01:40:24 +01:00			`info_dict = traverse_obj(episode_data, ('queryEpisode', 0, {`
			`'title': ('title', {str}),`
			`'view_count': ('view_count', {int_or_none}),`
			`'duration': ('duration', {int_or_none}),`
			`'tags': ('tags', ..., 'name', {str}),`
			`'release_timestamp': ('started_at', {parse_iso8601}),`
			`'timestamp': ('created_at', {parse_iso8601}),`
			`'series': ('program', 'title', {str}),`
			`'series_id': ('program', 'ProgramID', {str}),`
			`'channel': ('channel', 'name', {str}),`
			`'channel_id': ('channel', 'ChannelID', {str}),`
			`'channel_url': ('channel', 'descriptor', {_fmt_url('https://telewebion.com/live/%s')}),`
			`'thumbnail': ('image', {_fmt_url('https://static.telewebion.com/episodeImages/%s/default')}),`
			`'formats': (`
			`'channel', 'descriptor', {str},`
			`{_fmt_url(f'https://cdna.telewebion.com/%s/episode/{video_id}/playlist.m3u8')},`
[ie, cleanup] No `from` stdlib imports in extractors (#8978) 2024-04-01 02:01:09 +02:00			`{functools.partial(self._extract_m3u8_formats, video_id=video_id, ext='mp4', m3u8_id='hls')}),`
Update to ytdl-commit-be008e6 (#8836) - [utils] Make restricted filenames ignore some Unicode categories (by dirkf) - [ie/telewebion] Fix extraction (by Grub4K) - [ie/imgur] Overhaul extractor (by bashonly, Grub4K) - [ie/EpidemicSound] Add extractor (by Grub4K) Authored by: bashonly, dirkf, Grub4K Co-authored-by: bashonly <bashonly@protonmail.com> 2023-12-26 01:40:24 +01:00			`}))`
			`info_dict['id'] = video_id`
			`return info_dict`