[atvat] Add new extractor(closes #5325)
parent
610a6d1053
commit
d66d43c554
2 changed files with 74 additions and 0 deletions
@ -0,0 +1,73 @@ |
||||
# coding: utf-8 |
||||
from __future__ import unicode_literals |
||||
|
||||
from .common import InfoExtractor |
||||
from ..utils import ( |
||||
determine_ext, |
||||
int_or_none, |
||||
unescapeHTML, |
||||
) |
||||
|
||||
|
||||
class ATVAtIE(InfoExtractor): |
||||
_VALID_URL = r'https?://(?:www\.)?atv\.at/(?:[^/]+/){2}(?P<id>[dv]\d+)' |
||||
_TESTS = [{ |
||||
'url': 'http://atv.at/aktuell/di-210317-2005-uhr/v1698449/', |
||||
'md5': 'c3b6b975fb3150fc628572939df205f2', |
||||
'info_dict': { |
||||
'id': '1698447', |
||||
'ext': 'mp4', |
||||
'title': 'DI, 21.03.17 | 20:05 Uhr 1/1', |
||||
} |
||||
}, { |
||||
'url': 'http://atv.at/aktuell/meinrad-knapp/d8416/', |
||||
'only_matching': True, |
||||
}] |
||||
|
||||
def _real_extract(self, url): |
||||
display_id = self._match_id(url) |
||||
webpage = self._download_webpage(url, display_id) |
||||
video_data = self._parse_json(unescapeHTML(self._search_regex( |
||||
r'class="[^"]*jsb_video/FlashPlayer[^"]*"[^>]+data-jsb="([^"]+)"', |
||||
webpage, 'player data')), display_id)['config']['initial_video'] |
||||
|
||||
video_id = video_data['id'] |
||||
video_title = video_data['title'] |
||||
|
||||
parts = [] |
||||
for part in video_data.get('parts', []): |
||||
part_id = part['id'] |
||||
part_title = part['title'] |
||||
|
||||
formats = [] |
||||
for source in part.get('sources', []): |
||||
source_url = source.get('src') |
||||
if not source_url: |
||||
continue |
||||
ext = determine_ext(source_url) |
||||
if ext == 'm3u8': |
||||
formats.extend(self._extract_m3u8_formats( |
||||
source_url, part_id, 'mp4', 'm3u8_native', |
||||
m3u8_id='hls', fatal=False)) |
||||
else: |
||||
formats.append({ |
||||
'format_id': source.get('delivery'), |
||||
'url': source_url, |
||||
}) |
||||
self._sort_formats(formats) |
||||
|
||||
parts.append({ |
||||
'id': part_id, |
||||
'title': part_title, |
||||
'thumbnail': part.get('preview_image_url'), |
||||
'duration': int_or_none(part.get('duration')), |
||||
'is_live': part.get('is_livestream'), |
||||
'formats': formats, |
||||
}) |
||||
|
||||
return { |
||||
'_type': 'multi_video', |
||||
'id': video_id, |
||||
'title': video_title, |
||||
'entries': parts, |
||||
} |
Loading…
Reference in new issue