[youtube:playlist] Work around buggy playlists (fixes #4449)
They show a "Load more" button, but they don't have more videos. The continuation url in the json file was a link to itself, so we ended up in an infinite loop.
This commit is contained in:
parent
caff59499c
commit
4b7df0d30c
1 changed files with 11 additions and 0 deletions
|
@ -1128,6 +1128,13 @@ class YoutubePlaylistIE(YoutubeBaseInfoExtractor):
|
||||||
'info_dict': {
|
'info_dict': {
|
||||||
'title': 'JODA7',
|
'title': 'JODA7',
|
||||||
}
|
}
|
||||||
|
}, {
|
||||||
|
'note': 'Buggy playlist: the webpage has a "Load more" button but it doesn\'t have more videos',
|
||||||
|
'url': 'https://www.youtube.com/playlist?list=UUXw-G3eDE9trcvY2sBMM_aA',
|
||||||
|
'info_dict': {
|
||||||
|
'title': 'Uploads from Interstellar Movie',
|
||||||
|
},
|
||||||
|
'playlist_mincout': 21,
|
||||||
}]
|
}]
|
||||||
|
|
||||||
def _real_initialize(self):
|
def _real_initialize(self):
|
||||||
|
@ -1212,6 +1219,10 @@ class YoutubePlaylistIE(YoutubeBaseInfoExtractor):
|
||||||
'Downloading page #%s' % page_num,
|
'Downloading page #%s' % page_num,
|
||||||
transform_source=uppercase_escape)
|
transform_source=uppercase_escape)
|
||||||
content_html = more['content_html']
|
content_html = more['content_html']
|
||||||
|
if not content_html.strip():
|
||||||
|
# Some webpages show a "Load more" button but they don't
|
||||||
|
# have more videos
|
||||||
|
break
|
||||||
more_widget_html = more['load_more_widget_html']
|
more_widget_html = more['load_more_widget_html']
|
||||||
|
|
||||||
playlist_title = self._html_search_regex(
|
playlist_title = self._html_search_regex(
|
||||||
|
|
Loading…
Reference in a new issue