parent
5de538787d
commit
061d1cd948
1 changed files with 59 additions and 33 deletions
@ -1,54 +1,80 @@ |
||||
from __future__ import unicode_literals |
||||
|
||||
import re |
||||
|
||||
from .common import InfoExtractor |
||||
from ..utils import ExtractorError |
||||
|
||||
|
||||
class NhkVodIE(InfoExtractor):
    """Extractor for NHK World on-demand video and audio episode pages.

    The page URL carries a two-letter language code, a media type
    (``video`` or ``audio``) and an episode id; all three are needed to
    build the episode API request in ``_real_extract``.
    """

    _VALID_URL = r'https?://www3\.nhk\.or\.jp/nhkworld/(?P<lang>[a-z]{2})/ondemand/(?P<type>video|audio)/(?P<id>\d{7}|[a-z]+-\d{8}-\d+)'
    # Content available only for a limited period of time. Visit
    # https://www3.nhk.or.jp/nhkworld/en/ondemand/ for working samples.
    _TESTS = [{
        'url': 'https://www3.nhk.or.jp/nhkworld/en/ondemand/video/2015173/',
        'only_matching': True,
    }, {
        'url': 'https://www3.nhk.or.jp/nhkworld/en/ondemand/audio/plugin-20190404-1/',
        'only_matching': True,
    }, {
        'url': 'https://www3.nhk.or.jp/nhkworld/fr/ondemand/audio/plugin-20190404-1/',
        'only_matching': True,
    }]
    # Placeholders, in order: 'v' or 'r' (prefix of "odesdlist"), the
    # episode id, the language code, and an extra path suffix that is
    # '/all' for video and empty for audio.
    _API_URL_TEMPLATE = 'https://api.nhk.or.jp/nhkworld/%sodesdlist/v7/episode/%s/%s/all%s.json'

    def _real_extract(self, url):
        """Build the info dict for a single on-demand episode.

        Video episodes are returned as a ``url_transparent`` result that
        hands the ``vod_id`` over to the Ooyala extractor.  Audio episodes
        get their formats built here: the HLS variants found in the master
        playlist plus one RTMP entry.

        Raises ``KeyError``/``IndexError`` if the API response lacks the
        expected ``data.episodes[0]`` entry or a required field
        (``sub_title``, ``vod_id``, ``audio``).
        """
        # Group order follows _VALID_URL: lang, type, id.
        lang, m_type, episode_id = re.match(self._VALID_URL, url).groups()
        if episode_id.isdigit():
            # Seven-digit ids are sent to the API as NNNN-NNN.
            episode_id = episode_id[:4] + '-' + episode_id[4:]

        is_video = m_type == 'video'
        episode = self._download_json(
            self._API_URL_TEMPLATE % (
                'v' if is_video else 'r',
                episode_id, lang,
                '/all' if is_video else ''),
            episode_id,
            query={'apikey': 'EJfK8jdS57GqlupFgAfAAwr573q01y6k'},
        )['data']['episodes'][0]
        # The sub title is mandatory: fall back to a hard lookup so that a
        # missing value fails loudly instead of yielding a None title.
        title = episode.get('sub_title_clean') or episode['sub_title']

        def get_clean_field(key):
            """Return the '<key>_clean' value if truthy, else the '<key>' value."""
            return episode.get(key + '_clean') or episode.get(key)

        series = get_clean_field('title')

        thumbnails = []
        # (key suffix, width, height) for each image field that is read.
        for s, w, h in [('', 640, 360), ('_l', 1280, 720)]:
            img_path = episode.get('image' + s)
            if not img_path:
                continue
            thumbnails.append({
                'id': '%dp' % h,
                'height': h,
                'width': w,
                'url': 'https://www3.nhk.or.jp' + img_path,
            })

        info = {
            # The language is part of the id, so the same episode fetched
            # in two languages yields two distinct ids.
            'id': episode_id + '-' + lang,
            'title': '%s - %s' % (series, title) if series and title else title,
            'description': get_clean_field('description'),
            'thumbnails': thumbnails,
            'series': series,
            'episode': title,
        }
        if is_video:
            info.update({
                '_type': 'url_transparent',
                'ie_key': 'Ooyala',
                'url': 'ooyala:' + episode['vod_id'],
            })
        else:
            audio = episode['audio']
            audio_path = audio['audio']
            # fatal=False: a failed playlist download should not abort the
            # extraction, since the RTMP entry below is still appended.
            info['formats'] = self._extract_m3u8_formats(
                'https://nhks-vh.akamaihd.net/i%s/master.m3u8' % audio_path,
                episode_id, 'm4a', m3u8_id='hls', fatal=False)
            info['formats'].append({
                'ext': 'flv',
                'format_id': 'flv',
                'url': 'rtmp://flv.nhk.or.jp/ondemand/mp4:flv' + audio_path,
                'vcodec': 'none',
            })
            for f in info['formats']:
                f['language'] = lang
        return info
||||
|
Loading…
Reference in new issue