1
0
mirror of https://github.com/yt-dlp/yt-dlp.git synced 2024-11-02 17:22:31 +01:00

[dailymotion] Fix user playlist extraction

This commit is contained in:
Sergey M․ 2014-04-23 19:42:34 +07:00
parent 5bec574859
commit 4b10aadffc

View File

@@ -11,8 +11,8 @@
 orderedSet,
 str_to_int,
 int_or_none,
 ExtractorError,
+unescapeHTML,
 )
 class DailymotionBaseInfoExtractor(InfoExtractor):
@@ -188,7 +188,7 @@ def _extract_entries(self, id):
 webpage = self._download_webpage(request,
 id, u'Downloading page %s' % pagenum)
-video_ids.extend(re.findall(r'data-id="(.+?)"', webpage))
+video_ids.extend(re.findall(r'data-xid="(.+?)"', webpage))
 if re.search(self._MORE_PAGES_INDICATOR, webpage) is None:
 break
@@ -217,9 +217,9 @@ def _real_extract(self, url):
 mobj = re.match(self._VALID_URL, url)
 user = mobj.group('user')
 webpage = self._download_webpage(url, user)
-full_user = self._html_search_regex(
-r'<a class="label" href="/%s".*?>(.*?)</' % re.escape(user),
-webpage, u'user', flags=re.DOTALL)
+full_user = unescapeHTML(self._html_search_regex(
+r'<a class="nav-image" title="([^"]+)" href="/%s">' % re.escape(user),
+webpage, u'user', flags=re.DOTALL))
 return {
 '_type': 'playlist',