From ef5acfe32de4c995625f9800cfe0776237961436 Mon Sep 17 00:00:00 2001 From: remitamine Date: Tue, 1 Sep 2015 23:05:19 +0100 Subject: [PATCH] [limelight] Add new extractor --- youtube_dl/extractor/__init__.py | 5 + youtube_dl/extractor/limelight.py | 176 ++++++++++++++++++++++++++++++ 2 files changed, 181 insertions(+) create mode 100644 youtube_dl/extractor/limelight.py diff --git a/youtube_dl/extractor/__init__.py b/youtube_dl/extractor/__init__.py index 495a18c17..20cc3660c 100644 --- a/youtube_dl/extractor/__init__.py +++ b/youtube_dl/extractor/__init__.py @@ -295,6 +295,11 @@ LifeNewsIE, LifeEmbedIE, ) +from .limelight import ( + LimeLightMediaIE, + LimeLightChannelIE, + LimeLightChannelListIE, +) from .liveleak import LiveLeakIE from .livestream import ( LivestreamIE, diff --git a/youtube_dl/extractor/limelight.py b/youtube_dl/extractor/limelight.py new file mode 100644 index 000000000..dcfc215c7 --- /dev/null +++ b/youtube_dl/extractor/limelight.py @@ -0,0 +1,176 @@ +# coding: utf-8 +from __future__ import unicode_literals + +import re + +from .common import InfoExtractor +from ..utils import ( + int_or_none, + determine_ext, +) + + +class LimeLightBaseIE(InfoExtractor): + + def get_playlist_service(self, id, method): + return self._download_json(self.PLAYLIST_SERVICE_URL % (id, method), id) + + def get_api(self, orgId, id, method): + return self._download_json(self.API_URL % (orgId, id, method), id) + + def process_data(self, mobileUrls, streams, properties): + video_id = properties['media_id'] + formats = [] + + for mobileUrl in mobileUrls: + if '.m3u8' in mobileUrl['mobileUrl']: + formats.extend(self._extract_m3u8_formats(mobileUrl['mobileUrl'], video_id)) + else: + formats.append({'url': mobileUrl['mobileUrl']}) + + for stream in streams: + if '.f4m' in stream['url']: + formats.extend(self._extract_f4m_formats(stream['url'], video_id)) + else: + fmt = { + 'url': stream.get('url'), + 'abr': stream.get('audioBitRate'), + 'vbr': stream.get('videoBitRate'), + 'fps': stream.get('videoFrameRate'), + 'width': stream.get('videoWidthInPixels'), + 'height': stream.get('videoHeightInPixels'), + 'ext': determine_ext(stream.get('url')) + } + rtmp = re.search(r'^(?Prtmp://[^/]+/(?P.+))/(?Pmp4:.+)$', stream['url']) + if rtmp: + fmt.update({ + 'url': rtmp.group('url'), + 'play_path': rtmp.group('playpath'), + 'app': rtmp.group('app'), + }) + formats.append(fmt) + + self._sort_formats(formats) + + title = properties['title'] + description = properties.get('description') + timestamp = properties.get('create_date') + duration = int_or_none(properties.get('duration_in_milliseconds')) + filesize = properties.get('total_storage_in_bytes') + categories = [properties.get('category')] + thumbnails = [{ + 'url': thumbnail.get('url'), + 'width': int_or_none(thumbnail.get('width')), + 'height': int_or_none(thumbnail.get('height')), + } for thumbnail in properties.get('thumbnails')] + subtitles = {caption.get('language_code'): [{'url': caption.get('url')}] for caption in properties.get('captions')} + + return { + 'id': video_id, + 'title': title, + 'description': description, + 'formats': formats, + 'timestamp': timestamp, + 'duration': duration, + 'filesize': filesize, + 'categories': categories, + 'thumbnails': thumbnails, + 'subtitles': subtitles, + } + + +class LimeLightMediaIE(LimeLightBaseIE): + IE_NAME = 'limelight' + _VALID_URL = r'http://link\.videoplatform\.limelight\.com/media/?.*mediaId=(?P[a-z0-9]{32})' + _TEST = { + 'url': 'http://link.videoplatform.limelight.com/media/?mediaId=3ffd040b522b4485b6d84effc750cd86', + 'md5': '3213605088be599705677ef785db6972', + 'info_dict': { + 'id': '3ffd040b522b4485b6d84effc750cd86', + 'ext': 'mp4', + 'title': 'HaP and the HB Prince Trailer', + 'description': 'As Harry Potter begins his 6th year at Hogwarts School of Witchcraft and Wizardry, he discovers an old book marked mysteriously "This book is the property of the Half-Blood Prince" and begins to learn more about Lord Voldemort\'s dark past.', + 'thumbnail': 're:^https?://.*\.jpeg$', + 'duration': 144230, + 'timestamp': 1244136834, + "upload_date": "20090604", + } + } + PLAYLIST_SERVICE_URL = 'http://production-ps.lvp.llnw.net/r/PlaylistService/media/%s/%s' + API_URL = 'http://api.video.limelight.com/rest/organizations/%s/media/%s/%s.json' + + def _real_extract(self, url): + video_id = self._match_id(url) + + mobile_json_data = self.get_playlist_service(video_id, 'getMobilePlaylistByMediaId') + pc_json_data = self.get_playlist_service(video_id, 'getPlaylistByMediaId') + properties = self.get_api(pc_json_data['orgId'], video_id, 'properties') + + return self.process_data(mobile_json_data['mediaList'][0]['mobileUrls'], pc_json_data['playlistItems'][0]['streams'], properties) + + +class LimeLightChannelIE(LimeLightBaseIE): + IE_NAME = 'limelight:channel' + _VALID_URL = r'http://link\.videoplatform\.limelight\.com/media/?.*channelId=(?P[a-z0-9]{32})' + _TEST = { + 'url': 'http://link.videoplatform.limelight.com/media/?channelId=ab6a524c379342f9b23642917020c082', + 'info_dict': { + 'id': 'ab6a524c379342f9b23642917020c082', + 'title': 'Javascript Sample Code', + }, + 'playlist_mincount': 3, + } + PLAYLIST_SERVICE_URL = 'http://production-ps.lvp.llnw.net/r/PlaylistService/channel/%s/%s' + API_URL = 'http://api.video.limelight.com/rest/organizations/%s/channels/%s/%s.json' + + def _real_extract(self, url): + channel_id = self._match_id(url) + + mobile_json_data = self.get_playlist_service(channel_id, 'getMobilePlaylistWithNItemsByChannelId?begin=0&count=-1') + pc_json_data = self.get_playlist_service(channel_id, 'getPlaylistByChannelId') + medias = self.get_api(pc_json_data['orgId'], channel_id, 'media') + + entries = [] + for i in range(len(medias['media_list'])): + entries.append(self.process_data(mobile_json_data['mediaList'][i]['mobileUrls'], pc_json_data['playlistItems'][i]['streams'], medias['media_list'][i])) + + return { + 'id': channel_id, + 'title': pc_json_data['title'], + 'entries': entries, + '_type': 'playlist', + } + + +class LimeLightChannelListIE(LimeLightBaseIE): + IE_NAME = 'limelight:channel_list' + _VALID_URL = r'http://link\.videoplatform\.limelight\.com/media/?.*channelListId=(?P[a-z0-9]{32})' + _TEST = { + 'url': 'http://link.videoplatform.limelight.com/media/?channelListId=301b117890c4465c8179ede21fd92e2b', + 'info_dict': { + 'id': '301b117890c4465c8179ede21fd92e2b', + 'title': 'Website - Hero Player', + }, + 'playlist_mincount': 2, + } + PLAYLIST_SERVICE_URL = 'http://production-ps.lvp.llnw.net/r/PlaylistService/channel_list/%s/%s' + + def _real_extract(self, url): + channel_list_id = self._match_id(url) + + json_data = self.get_playlist_service(channel_list_id, 'getMobileChannelListById') + + entries = [] + for channel in json_data['channelList']: + entries.append({ + 'url': 'http://link.videoplatform.limelight.com/media/?channelId=%s' % channel['id'], + '_type': 'url', + 'ie_key': 'LimeLightChannel', + }) + + return { + 'id': channel_list_id, + 'title': json_data['title'], + 'entries': entries, + '_type': 'playlist', + }