4 from .common
import InfoExtractor
5 from ..compat
import compat_urllib_parse_unquote
6 from ..utils
import ExtractorError
, clean_html
9 class PlayvidIE(InfoExtractor
):
10 _VALID_URL
= r
'https?://(?:www\.)?playvid\.com/watch(\?v=|/)(?P<id>.+?)(?:#|$)'
12 'url': 'http://www.playvid.com/watch/RnmBNgtrrJu',
13 'md5': 'ffa2f6b2119af359f544388d8c01eb6c',
17 'title': 'md5:9256d01c6317e3f703848b5906880dc8',
21 'skip': 'Video removed due to ToS',
23 'url': 'http://www.playvid.com/watch/hwb0GpNkzgH',
24 'md5': '39d49df503ad7b8f23a4432cbf046477',
28 'title': 'Ellen Euro Cutie Blond Takes a Sexy Survey Get Facial in The Park',
30 'thumbnail': r
're:^https?://.*\.jpg$',
34 def _real_extract(self
, url
):
35 video_id
= self
._match
_id
(url
)
36 webpage
= self
._download
_webpage
(url
, video_id
)
39 r
'<div class="block-error">\s*<div class="heading">\s*<div>(?P<msg>.+?)</div>\s*</div>', webpage
)
41 raise ExtractorError(clean_html(m_error
.group('msg')), expected
=True)
45 video_thumbnail
= None
48 # most of the information is stored in the flashvars
49 flashvars
= self
._html
_search
_regex
(
50 r
'flashvars="(.+?)"', webpage
, 'flashvars')
52 infos
= compat_urllib_parse_unquote(flashvars
).split(r
'&')
54 videovars_match
= re
.match(r
'^video_vars\[(.+?)\]=(.+?)$', info
)
56 key
= videovars_match
.group(1)
57 val
= videovars_match
.group(2)
60 video_title
= urllib
.parse
.unquote_plus(val
)
66 if key
== 'big_thumb':
69 videourl_match
= re
.match(
70 r
'^video_urls\]\[(?P<resolution>[0-9]+)p', key
)
72 height
= int(videourl_match
.group('resolution'))
78 # Extract title - should be in the flashvars; if not, look elsewhere
79 if video_title
is None:
80 video_title
= self
._html
_extract
_title
(webpage
)
86 'thumbnail': video_thumbnail
,