From: Sergey M. Date: Sun, 31 Jan 2016 11:52:02 +0000 (+0600) Subject: [youtube] Filter duplicates in playlists base extractor X-Git-Url: http://git.cielonegro.org/gitweb.cgi?a=commitdiff_plain;h=9acd33094d36acde60a42837ed775c68ad3a327d;p=youtube-dl.git [youtube] Filter duplicates in playlists base extractor --- diff --git a/youtube_dl/extractor/youtube.py b/youtube_dl/extractor/youtube.py index 2941da467..9a64c1d11 100644 --- a/youtube_dl/extractor/youtube.py +++ b/youtube_dl/extractor/youtube.py @@ -233,7 +233,7 @@ class YoutubePlaylistBaseInfoExtractor(YoutubeEntryListBaseInfoExtractor): class YoutubePlaylistsBaseInfoExtractor(YoutubeEntryListBaseInfoExtractor): def _process_page(self, content): - for playlist_id in re.findall(r'href="/?playlist\?list=(.+?)"', content): + for playlist_id in set(re.findall(r'href="/?playlist\?list=([0-9A-Za-z-_]{10,})"', content)): yield self.url_result( 'https://www.youtube.com/playlist?list=%s' % playlist_id, 'YoutubePlaylist')