[abc] Add extractor (closes #3361)
parent
11b85ce62e
commit
64ce58db38
2 changed files with 49 additions and 0 deletions
@ -0,0 +1,48 @@ |
|||||||
|
from __future__ import unicode_literals |
||||||
|
|
||||||
|
import re |
||||||
|
import json |
||||||
|
|
||||||
|
from .common import InfoExtractor |
||||||
|
|
||||||
|
|
||||||
|
class ABCIE(InfoExtractor): |
||||||
|
IE_NAME = 'abc.net.au' |
||||||
|
_VALID_URL = r'http://www\.abc\.net\.au/news/[^/]+/[^/]+/(?P<id>\d+)' |
||||||
|
|
||||||
|
_TEST = { |
||||||
|
'url': 'http://www.abc.net.au/news/2014-07-25/bringing-asylum-seekers-to-australia-would-give/5624716', |
||||||
|
'md5': 'dad6f8ad011a70d9ddf887ce6d5d0742', |
||||||
|
'info_dict': { |
||||||
|
'id': '5624716', |
||||||
|
'ext': 'mp4', |
||||||
|
'title': 'Bringing asylum seekers to Australia would give them right to asylum claims: professor', |
||||||
|
'description': 'md5:ba36fa5e27e5c9251fd929d339aea4af', |
||||||
|
}, |
||||||
|
} |
||||||
|
|
||||||
|
def _real_extract(self, url): |
||||||
|
mobj = re.match(self._VALID_URL, url) |
||||||
|
video_id = mobj.group('id') |
||||||
|
webpage = self._download_webpage(url, video_id) |
||||||
|
|
||||||
|
urls_info_json = self._search_regex( |
||||||
|
r'inlineVideoData\.push\((.*?)\);', webpage, 'video urls', |
||||||
|
flags=re.DOTALL) |
||||||
|
urls_info = json.loads(urls_info_json.replace('\'', '"')) |
||||||
|
formats = [{ |
||||||
|
'url': url_info['url'], |
||||||
|
'width': int(url_info['width']), |
||||||
|
'height': int(url_info['height']), |
||||||
|
'tbr': int(url_info['bitrate']), |
||||||
|
'filesize': int(url_info['filesize']), |
||||||
|
} for url_info in urls_info] |
||||||
|
self._sort_formats(formats) |
||||||
|
|
||||||
|
return { |
||||||
|
'id': video_id, |
||||||
|
'title': self._og_search_title(webpage), |
||||||
|
'formats': formats, |
||||||
|
'description': self._og_search_description(webpage), |
||||||
|
'thumbnail': self._og_search_thumbnail(webpage), |
||||||
|
} |
Loading…
Reference in new issue