[nova] Fix extraction (closes #17241)

[youtube-dl.git] / youtube_dl / extractor / generic.py
diff --git a/youtube_dl/extractor/generic.py b/youtube_dl/extractor/generic.py

index 6c0f772ac63142c83f010d07989e91e389c858cb..83a31f3d3d67cc52cf1c1dbb0457e973c8b68e28 100644 (file)
--- a/youtube_dl/extractor/generic.py
+++ b/youtube_dl/extractor/generic.py
@@ -32,6 +32,7 @@ from ..utils import (
      unified_strdate,
      unsmuggle_url,
      UnsupportedError,
+    url_or_none,
      xpath_text,
  )
  from .commonprotocols import RtmpIE
@@ -111,6 +112,9 @@ from .cloudflarestream import CloudflareStreamIE
  from .peertube import PeerTubeIE
  from .indavideo import IndavideoEmbedIE
  from .apa import APAIE
+from .foxnews import FoxNewsIE
+from .viqeo import ViqeoIE
+from .expressen import ExpressenIE
  
  
  class GenericIE(InfoExtractor):
@@ -1394,17 +1398,6 @@ class GenericIE(InfoExtractor):
                  'skip_download': True,
              },
          },
-        # SVT embed
-        {
-            'url': 'http://www.svt.se/sport/ishockey/jagr-tacklar-giroux-under-intervjun',
-            'info_dict': {
-                'id': '2900353',
-                'ext': 'flv',
-                'title': 'Här trycker Jagr till Giroux (under SVT-intervjun)',
-                'duration': 27,
-                'age_limit': 0,
-            },
-        },
          # Crooks and Liars embed
          {
              'url': 'http://crooksandliars.com/2015/04/fox-friends-says-protecting-atheists',
@@ -2069,6 +2062,15 @@ class GenericIE(InfoExtractor):
              },
              'skip': 'TODO: fix nested playlists processing in tests',
          },
+        {
+            # Viqeo embeds
+            'url': 'https://viqeo.tv/',
+            'info_dict': {
+                'id': 'viqeo',
+                'title': 'All-new video platform',
+            },
+            'playlist_count': 6,
+        },
          # {
          #     # TODO: find another test
          #     # http://schema.org/VideoObject
@@ -3091,6 +3093,11 @@ class GenericIE(InfoExtractor):
              return self.playlist_from_matches(
                  apa_urls, video_id, video_title, ie=APAIE.ie_key())
  
+        foxnews_urls = FoxNewsIE._extract_urls(webpage)
+        if foxnews_urls:
+            return self.playlist_from_matches(
+                foxnews_urls, video_id, video_title, ie=FoxNewsIE.ie_key())
+
          sharevideos_urls = [mobj.group('url') for mobj in re.finditer(
              r'<iframe[^>]+?\bsrc\s*=\s*(["\'])(?P<url>(?:https?:)?//embed\.share-videos\.se/auto/embed/\d+\?.*?\buid=\d+.*?)\1',
              webpage)]
@@ -3098,6 +3105,16 @@ class GenericIE(InfoExtractor):
              return self.playlist_from_matches(
                  sharevideos_urls, video_id, video_title)
  
+        viqeo_urls = ViqeoIE._extract_urls(webpage)
+        if viqeo_urls:
+            return self.playlist_from_matches(
+                viqeo_urls, video_id, video_title, ie=ViqeoIE.ie_key())
+
+        expressen_urls = ExpressenIE._extract_urls(webpage)
+        if expressen_urls:
+            return self.playlist_from_matches(
+                expressen_urls, video_id, video_title, ie=ExpressenIE.ie_key())
+
          # Look for HTML5 media
          entries = self._parse_html5_media_entries(url, webpage, video_id, m3u8_id='hls')
          if entries:
@@ -3135,8 +3152,8 @@ class GenericIE(InfoExtractor):
                  sources = [sources]
              formats = []
              for source in sources:
-                src = source.get('src')
-                if not src or not isinstance(src, compat_str):
+                src = url_or_none(source.get('src'))
+                if not src:
                      continue
                  src = compat_urlparse.urljoin(url, src)
                  src_type = source.get('type')