[shared] Add extractor (Closes #3312)
parent
4192b51c7c
commit
916c145217
2 changed files with 58 additions and 0 deletions
@ -0,0 +1,57 @@ |
||||
from __future__ import unicode_literals |
||||
|
||||
import re |
||||
import base64 |
||||
|
||||
from .common import InfoExtractor |
||||
from ..utils import ( |
||||
ExtractorError, |
||||
compat_urllib_request, |
||||
compat_urllib_parse, |
||||
int_or_none, |
||||
) |
||||
|
||||
|
||||
class SharedIE(InfoExtractor): |
||||
_VALID_URL = r'http://shared\.sx/(?P<id>[\da-z]{10})' |
||||
|
||||
_TEST = { |
||||
'url': 'http://shared.sx/0060718775', |
||||
'md5': '53e1c58fc3e777ae1dfe9e57ba2f9c72', |
||||
'info_dict': { |
||||
'id': '0060718775', |
||||
'ext': 'mp4', |
||||
'title': 'Big Buck Bunny Trailer', |
||||
}, |
||||
} |
||||
|
||||
def _real_extract(self, url): |
||||
mobj = re.match(self._VALID_URL, url) |
||||
video_id = mobj.group('id') |
||||
|
||||
page = self._download_webpage(url, video_id) |
||||
|
||||
if re.search(r'>File does not exist<', page) is not None: |
||||
raise ExtractorError('Video %s does not exist' % video_id, expected=True) |
||||
|
||||
download_form = dict(re.findall(r'<input type="hidden" name="([^"]+)" value="([^"]*)"', page)) |
||||
|
||||
request = compat_urllib_request.Request(url, compat_urllib_parse.urlencode(download_form)) |
||||
request.add_header('Content-Type', 'application/x-www-form-urlencoded') |
||||
|
||||
video_page = self._download_webpage(request, video_id, 'Downloading video page') |
||||
|
||||
video_url = self._html_search_regex(r'data-url="([^"]+)"', video_page, 'video URL') |
||||
title = base64.b64decode(self._html_search_meta('full:title', page, 'title')).decode('utf-8') |
||||
filesize = int_or_none(self._html_search_meta('full:size', page, 'file size', fatal=False)) |
||||
thumbnail = self._html_search_regex( |
||||
r'data-poster="([^"]+)"', video_page, 'thumbnail', fatal=False, default=None) |
||||
|
||||
return { |
||||
'id': video_id, |
||||
'url': video_url, |
||||
'ext': 'mp4', |
||||
'filesize': filesize, |
||||
'title': title, |
||||
'thumbnail': thumbnail, |
||||
} |
Loading…
Reference in new issue