2 from __future__ import unicode_literals
4 from .common import InfoExtractor
13 class GoshgayIE(InfoExtractor):
14 _VALID_URL = r'https?://(?:www\.)?goshgay\.com/video(?P<id>\d+?)($|/)'
16 'url': 'http://www.goshgay.com/video299069/diesel_sfw_xxx_video',
17 'md5': '4b6db9a0a333142eb9f15913142b0ed1',
21 'title': 'DIESEL SFW XXX Video',
22 'thumbnail': 're:^http://.*\.jpg$',
28 def _real_extract(self, url):
29 video_id = self._match_id(url)
30 webpage = self._download_webpage(url, video_id)
32 title = self._html_search_regex(
33 r'<h2>(.*?)<', webpage, 'title')
34 duration = parse_duration(self._html_search_regex(
35 r'<span class="duration">\s*-?\s*(.*?)</span>',
36 webpage, 'duration', fatal=False))
38 flashvars = compat_parse_qs(self._html_search_regex(
39 r'<embed.+?id="flash-player-embed".+?flashvars="([^"]+)"',
40 webpage, 'flashvars'))
41 thumbnail = flashvars.get('url_bigthumb', [None])[0]
42 video_url = flashvars['flv_url'][0]
48 'thumbnail': thumbnail,