[YoutubeDL] Remove force_generic_extractor arg from process_ie_result

[youtube-dl.git] / youtube_dl / YoutubeDL.py
diff --git a/youtube_dl/YoutubeDL.py b/youtube_dl/YoutubeDL.py

index 21d247f234cf7d8ed6a73bdc8132e4271d8a907a..a7d3a1c017fb6230639b522c1b36c356cfcaf93e 100755 (executable)
--- a/youtube_dl/YoutubeDL.py
+++ b/youtube_dl/YoutubeDL.py
@@ -49,6 +49,7 @@ from .utils import (
      ExtractorError,
      format_bytes,
      formatSeconds,
+    HEADRequest,
      locked_file,
      make_HTTPS_handler,
      MaxDownloadsReached,
@@ -138,6 +139,7 @@ class YoutubeDL(object):
      outtmpl:           Template for output names.
      restrictfilenames: Do not allow "&" and spaces in file names
      ignoreerrors:      Do not stop on download errors.
+    force_generic_extractor: Force downloader to use the generic extractor
      nooverwrites:      Prevent overwriting files.
      playliststart:     Playlist item to start at.
      playlistend:       Playlist item to end at.
@@ -625,13 +627,16 @@ class YoutubeDL(object):
              info_dict.setdefault(key, value)
  
      def extract_info(self, url, download=True, ie_key=None, extra_info={},
-                     process=True):
+                     process=True, force_generic_extractor=False):
          '''
          Returns a list with a dictionary for each video we find.
          If 'download', also downloads the videos.
          extra_info is a dict containing the extra values to add to each result
          '''
  
+        if not ie_key and force_generic_extractor:
+            ie_key = 'Generic'
+
          if ie_key:
              ies = [self.get_info_extractor(ie_key)]
          else:
@@ -923,8 +928,9 @@ class YoutubeDL(object):
                  if f.get('vcodec') != 'none' and f.get('acodec') != 'none']
              if audiovideo_formats:
                  return audiovideo_formats[format_idx]
-            # for audio only urls, select the best/worst audio format
-            elif all(f.get('acodec') != 'none' for f in available_formats):
+            # for audio only (soundcloud) or video only (imgur) urls, select the best/worst format
+            elif (all(f.get('acodec') != 'none' for f in available_formats) or
+                  all(f.get('vcodec') != 'none' for f in available_formats)):
                  return available_formats[format_idx]
          elif format_spec == 'bestaudio':
              audio_formats = [
@@ -1014,13 +1020,13 @@ class YoutubeDL(object):
              info_dict['display_id'] = info_dict['id']
  
          if info_dict.get('upload_date') is None and info_dict.get('timestamp') is not None:
-            # Working around negative timestamps in Windows
-            # (see http://bugs.python.org/issue1646728)
-            if info_dict['timestamp'] < 0 and os.name == 'nt':
-                info_dict['timestamp'] = 0
-            upload_date = datetime.datetime.utcfromtimestamp(
-                info_dict['timestamp'])
-            info_dict['upload_date'] = upload_date.strftime('%Y%m%d')
+            # Working around out-of-range timestamp values (e.g. negative ones on Windows,
+            # see http://bugs.python.org/issue1646728)
+            try:
+                upload_date = datetime.datetime.utcfromtimestamp(info_dict['timestamp'])
+                info_dict['upload_date'] = upload_date.strftime('%Y%m%d')
+            except (ValueError, OverflowError, OSError):
+                pass
  
          if self.params.get('listsubtitles', False):
              if 'automatic_captions' in info_dict:
@@ -1497,7 +1503,8 @@ class YoutubeDL(object):
          for url in url_list:
              try:
                  # It also downloads the videos
-                res = self.extract_info(url)
+                res = self.extract_info(
+                    url, force_generic_extractor=self.params.get('force_generic_extractor', False))
              except UnavailableVideoError:
                  self.report_error('unable to download video')
              except MaxDownloadsReached:
@@ -1720,7 +1727,8 @@ class YoutubeDL(object):
              if req_is_string:
                  req = url_escaped
              else:
-                req = compat_urllib_request.Request(
+                req_type = HEADRequest if req.get_method() == 'HEAD' else compat_urllib_request.Request
+                req = req_type(
                      url_escaped, data=req.data, headers=req.headers,
                      origin_req_host=req.origin_req_host, unverifiable=req.unverifiable)