You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
133 lines
4.6 KiB
133 lines
4.6 KiB
# coding: utf-8 |
|
from __future__ import unicode_literals |
|
|
|
from .common import InfoExtractor |
|
from ..compat import compat_str |
|
from ..utils import ( |
|
int_or_none, |
|
parse_iso8601, |
|
try_get, |
|
determine_ext, |
|
) |
|
|
|
|
|
class TV4IE(InfoExtractor): |
|
IE_DESC = 'tv4.se and tv4play.se' |
|
_VALID_URL = r'''(?x)https?://(?:www\.)? |
|
(?: |
|
tv4\.se/(?:[^/]+)/klipp/(?:.*)-| |
|
tv4play\.se/ |
|
(?: |
|
(?:program|barn)/(?:[^/]+/|(?:[^\?]+)\?video_id=)| |
|
iframe/video/| |
|
film/| |
|
sport/| |
|
) |
|
)(?P<id>[0-9]+)''' |
|
_GEO_COUNTRIES = ['SE'] |
|
_TESTS = [ |
|
{ |
|
'url': 'http://www.tv4.se/kalla-fakta/klipp/kalla-fakta-5-english-subtitles-2491650', |
|
'md5': 'cb837212f342d77cec06e6dad190e96d', |
|
'info_dict': { |
|
'id': '2491650', |
|
'ext': 'mp4', |
|
'title': 'Kalla Fakta 5 (english subtitles)', |
|
'thumbnail': r're:^https?://.*\.jpg$', |
|
'timestamp': int, |
|
'upload_date': '20131125', |
|
}, |
|
}, |
|
{ |
|
'url': 'http://www.tv4play.se/iframe/video/3054113', |
|
'md5': 'cb837212f342d77cec06e6dad190e96d', |
|
'info_dict': { |
|
'id': '3054113', |
|
'ext': 'mp4', |
|
'title': 'Så här jobbar ficktjuvarna - se avslöjande bilder', |
|
'thumbnail': r're:^https?://.*\.jpg$', |
|
'description': 'Unika bilder avslöjar hur turisternas fickor vittjas mitt på Stockholms central. Två experter på ficktjuvarna avslöjar knepen du ska se upp för.', |
|
'timestamp': int, |
|
'upload_date': '20150130', |
|
}, |
|
}, |
|
{ |
|
'url': 'http://www.tv4play.se/sport/3060959', |
|
'only_matching': True, |
|
}, |
|
{ |
|
'url': 'http://www.tv4play.se/film/2378136', |
|
'only_matching': True, |
|
}, |
|
{ |
|
'url': 'http://www.tv4play.se/barn/looney-tunes?video_id=3062412', |
|
'only_matching': True, |
|
}, |
|
{ |
|
'url': 'http://www.tv4play.se/program/farang/3922081', |
|
'only_matching': True, |
|
} |
|
] |
|
|
|
def _real_extract(self, url): |
|
video_id = self._match_id(url) |
|
|
|
info = self._download_json( |
|
'http://www.tv4play.se/player/assets/%s.json' % video_id, |
|
video_id, 'Downloading video info JSON') |
|
|
|
title = info['title'] |
|
|
|
subtitles = {} |
|
formats = [] |
|
# http formats are linked with unresolvable host |
|
for kind in ('hls3', ''): |
|
data = self._download_json( |
|
'https://prima.tv4play.se/api/web/asset/%s/play.json' % video_id, |
|
video_id, 'Downloading sources JSON', query={ |
|
'protocol': kind, |
|
'videoFormat': 'MP4+WEBVTT', |
|
}) |
|
items = try_get(data, lambda x: x['playback']['items']['item']) |
|
if not items: |
|
continue |
|
if isinstance(items, dict): |
|
items = [items] |
|
for item in items: |
|
manifest_url = item.get('url') |
|
if not isinstance(manifest_url, compat_str): |
|
continue |
|
ext = determine_ext(manifest_url) |
|
if ext == 'm3u8': |
|
formats.extend(self._extract_m3u8_formats( |
|
manifest_url, video_id, 'mp4', entry_protocol='m3u8_native', |
|
m3u8_id=kind, fatal=False)) |
|
elif ext == 'f4m': |
|
formats.extend(self._extract_akamai_formats( |
|
manifest_url, video_id, { |
|
'hls': 'tv4play-i.akamaihd.net', |
|
})) |
|
elif ext == 'webvtt': |
|
subtitles = self._merge_subtitles( |
|
subtitles, { |
|
'sv': [{ |
|
'url': manifest_url, |
|
'ext': 'vtt', |
|
}]}) |
|
|
|
if not formats and info.get('is_geo_restricted'): |
|
self.raise_geo_restricted(countries=self._GEO_COUNTRIES) |
|
|
|
self._sort_formats(formats) |
|
|
|
return { |
|
'id': video_id, |
|
'title': title, |
|
'formats': formats, |
|
'subtitles': subtitles, |
|
'description': info.get('description'), |
|
'timestamp': parse_iso8601(info.get('broadcast_date_time')), |
|
'duration': int_or_none(info.get('duration')), |
|
'thumbnail': info.get('image'), |
|
'is_live': info.get('is_live') is True, |
|
}
|
|
|