mirror of
https://github.com/yt-dlp/yt-dlp.git
synced 2024-11-05 10:42:37 +01:00
dcddc10a50
From now on, the line from __future__ import unicode_literals should be contained in every single Python file lest we run into any more 2.x/3.x issues. Going forward, we're likely to develop on 3.x only and would likely miss subtle bugs otherwise.
97 lines
3.2 KiB
Python
97 lines
3.2 KiB
Python
from __future__ import unicode_literals
|
|
|
|
import re
|
|
import json
|
|
import itertools
|
|
|
|
from .common import InfoExtractor
|
|
from ..utils import (
|
|
compat_urllib_request,
|
|
)
|
|
|
|
|
|
class BambuserIE(InfoExtractor):
    """Extractor for a single Bambuser broadcast (``bambuser.com/v/<id>``)."""

    IE_NAME = 'bambuser'
    _VALID_URL = r'https?://bambuser\.com/v/(?P<id>\d+)'
    # Sent as the ``api_key`` query parameter of the getVideo.json request.
    _API_KEY = '005f64509e19a868399060af746a00aa'

    _TEST = {
        'url': 'http://bambuser.com/v/4050584',
        # MD5 seems to be flaky, see https://travis-ci.org/rg3/youtube-dl/jobs/14051016#L388
        # 'md5': 'fba8f7693e48fd4e8641b3fd5539a641',
        'info_dict': {
            'id': '4050584',
            'ext': 'flv',
            'title': 'Education engineering days - lightning talks',
            'duration': 3741,
            'uploader': 'pixelversity',
            'uploader_id': '344706',
        },
        'params': {
            # It doesn't respect the 'Range' header, it would download the whole video
            # caused the travis builds to fail: https://travis-ci.org/rg3/youtube-dl/jobs/14493845#L59
            'skip_download': True,
        },
    }

    def _real_extract(self, url):
        """Return the info dict for the broadcast addressed by *url*.

        The numeric id captured by ``_VALID_URL`` is looked up through the
        player API's ``getVideo.json`` endpoint, and the metadata is read
        from the ``result`` object of the JSON response.

        Raises KeyError if ``result`` lacks one of the keys accessed by
        subscript below (``title``, ``url``, ``length``, ``views_total``,
        ``username``, ``uid``); only ``preview`` is treated as optional.
        """
        mobj = re.match(self._VALID_URL, url)
        video_id = mobj.group('id')
        info_url = ('http://player-c.api.bambuser.com/getVideo.json?'
                    '&api_key=%s&vid=%s' % (self._API_KEY, video_id))
        # Fetch and decode in one step with the same helper that
        # BambuserChannelIE uses, instead of _download_webpage + json.loads.
        info = self._download_json(info_url, video_id)['result']

        return {
            'id': video_id,
            'title': info['title'],
            'url': info['url'],
            'thumbnail': info.get('preview'),
            # int() normalises the value whether the API sends a number or a
            # numeric string (the response schema is not visible here).
            'duration': int(info['length']),
            'view_count': int(info['views_total']),
            'uploader': info['username'],
            'uploader_id': info['uid'],
        }
|
|
|
|
|
|
class BambuserChannelIE(InfoExtractor):
    """Extractor that turns a Bambuser channel page into a playlist."""

    IE_NAME = 'bambuser:channel'
    _VALID_URL = r'https?://bambuser\.com/channel/(?P<user>.*?)(?:/|#|\?|$)'
    # Upper bound on the number of broadcasts a single request can return
    _STEP = 50
    _TEST = {
        'url': 'http://bambuser.com/channel/pixelversity',
        'info_dict': {
            'title': 'pixelversity',
        },
        'playlist_mincount': 60,
    }

    def _real_extract(self, url):
        """Collect every broadcast of the channel named in *url*.

        The xhr-api endpoint is queried page by page, ``_STEP`` items at a
        time. Each request passes the ``vid`` of the last item of the
        previous page as ``vid_older_than`` (empty for the first page).
        Paging stops at the first response whose ``result`` is empty.

        Returns a playlist dict titled with the channel user name whose
        entries are ``url_result`` references handled by the 'Bambuser'
        extractor.
        """
        user = re.match(self._VALID_URL, url).group('user')

        page_url_template = (
            'http://bambuser.com/xhr-api/index.php?username={user}'
            '&sort=created&access_mode=0%2C1%2C2&limit={count}'
            '&method=broadcast&format=json&vid_older_than={last}'
        )
        # Without setting this header, we wouldn't get any result
        referer = 'http://bambuser.com/channel/%s' % user

        entries = []
        oldest_vid = ''
        page_num = 0
        while True:
            page_num += 1
            request = compat_urllib_request.Request(page_url_template.format(
                user=user, count=self._STEP, last=oldest_vid))
            request.add_header('Referer', referer)
            page = self._download_json(
                request, user, 'Downloading page %d' % page_num)

            broadcasts = page['result']
            if not broadcasts:
                break

            # Cursor for the next request: the last item of this page.
            oldest_vid = broadcasts[-1]['vid']
            for broadcast in broadcasts:
                entries.append(self.url_result(broadcast['page'], 'Bambuser'))

        return {
            '_type': 'playlist',
            'title': user,
            'entries': entries,
        }
|