[beatenpro] Simplify and improve

[youtube-dl.git] / youtube_dl / extractor / nrk.py
diff --git a/youtube_dl/extractor/nrk.py b/youtube_dl/extractor/nrk.py

index 46f493cfca6d6926d9ba6c8b1cf73aa73fe15476..bff36f9d3f24cad293144d8e216faf5eeefed92c 100644 (file)
--- a/youtube_dl/extractor/nrk.py
+++ b/youtube_dl/extractor/nrk.py
@@ -4,6 +4,7 @@ from __future__ import unicode_literals
  import re
  
  from .common import InfoExtractor
+from ..compat import compat_str
  from ..utils import (
      ExtractorError,
      float_or_none,
@@ -148,9 +149,6 @@ class NRKTVIE(InfoExtractor):
          }
      ]
  
-    def _seconds2str(self, s):
-        return '%02d:%02d:%02d.%03d' % (s / 3600, (s % 3600) / 60, s % 60, (s % 1) * 1000)
-
      def _debug_print(self, txt):
          if self._downloader.params.get('verbose', False):
              self.to_screen('[debug] %s' % txt)
@@ -158,17 +156,18 @@ class NRKTVIE(InfoExtractor):
      def _get_subtitles(self, subtitlesurl, video_id, baseurl):
          url = "%s%s" % (baseurl, subtitlesurl)
          self._debug_print('%s: Subtitle url: %s' % (video_id, url))
-        captions = self._download_xml(url, video_id, 'Downloading subtitles')
+        captions = self._download_xml(
+            url, video_id, 'Downloading subtitles',
+            transform_source=lambda s: s.replace(r'<br />', '\r\n'))
          lang = captions.get('lang', 'no')
          ps = captions.findall('./{0}body/{0}div/{0}p'.format('{http://www.w3.org/ns/ttml}'))
          srt = ''
          for pos, p in enumerate(ps):
              begin = parse_duration(p.get('begin'))
              duration = parse_duration(p.get('dur'))
-            starttime = self._seconds2str(begin)
-            endtime = self._seconds2str(begin + duration)
-            text = '\n'.join(p.itertext())
-            srt += '%s\r\n%s --> %s\r\n%s\r\n\r\n' % (str(pos), starttime, endtime, text)
+            starttime = self._subtitles_timecode(begin)
+            endtime = self._subtitles_timecode(begin + duration)
+            srt += '%s\r\n%s --> %s\r\n%s\r\n\r\n' % (compat_str(pos), starttime, endtime, p.text)
          return {lang: [
              {'ext': 'ttml', 'url': url},
              {'ext': 'srt', 'data': srt},