1 from .common
import InfoExtractor
11 class AparatIE(InfoExtractor
):
12 _VALID_URL
= r
'https?://(?:www\.)?aparat\.com/(?:v/|video/video/embed/videohash/)(?P<id>[a-zA-Z0-9]+)'
13 _EMBED_REGEX
= [r
'<iframe .*?src="(?P<url>http://www\.aparat\.com/video/[^"]+)"']
16 'url': 'http://www.aparat.com/v/wP8On',
17 'md5': '131aca2e14fe7c4dcb3c4877ba300c89',
21 'title': 'تیم گلکسی 11 - زومیت',
22 'description': 'md5:096bdabcdcc4569f2b8a5e903a3b3028',
24 'timestamp': 1387394859,
25 'upload_date': '20131218',
30 'url': 'https://www.aparat.com/v/8dflw/',
31 'only_matching': True,
34 def _parse_options(self
, webpage
, video_id
, fatal
=True):
35 return self
._parse
_json
(self
._search
_regex
(
36 r
'options\s*=\s*({.+?})\s*;', webpage
, 'options', default
='{}'), video_id
)
38 def _real_extract(self
, url
):
39 video_id
= self
._match
_id
(url
)
41 # If available, provides more metadata
42 webpage
= self
._download
_webpage
(url
, video_id
, fatal
=False)
43 options
= self
._parse
_options
(webpage
, video_id
, fatal
=False)
46 webpage
= self
._download
_webpage
(
47 'http://www.aparat.com/video/video/embed/vt/frame/showvideo/yes/videohash/' + video_id
,
48 video_id
, 'Downloading embed webpage')
49 options
= self
._parse
_options
(webpage
, video_id
)
52 for sources
in (options
.get('multiSRC') or []):
54 if not isinstance(item
, dict):
56 file_url
= url_or_none(item
.get('src'))
59 item_type
= item
.get('type')
60 if item_type
== 'application/vnd.apple.mpegurl':
61 formats
.extend(self
._extract
_m
3u8_formats
(
62 file_url
, video_id
, 'mp4',
63 entry_protocol
='m3u8_native', m3u8_id
='hls',
66 ext
= mimetype2ext(item
.get('type'))
67 label
= item
.get('label')
71 'format_id': 'http-%s' % (label
or ext
),
72 'height': int_or_none(self
._search
_regex
(
73 r
'(\d+)[pP]', label
or '', 'height',
77 info
= self
._search
_json
_ld
(webpage
, video_id
, default
={})
79 if not info
.get('title'):
80 info
['title'] = get_element_by_id('videoTitle', webpage
) or \
81 self
._html
_search
_meta
(['og:title', 'twitter:title', 'DC.Title', 'title'], webpage
, fatal
=True)
83 return merge_dicts(info
, {
85 'thumbnail': url_or_none(options
.get('poster')),
86 'duration': int_or_none(options
.get('duration')),