[vidme] Add extractor (Closes #3404)
parent
4f31d0f2b7
commit
0138968a6a
2 changed files with 69 additions and 0 deletions
@ -0,0 +1,68 @@ |
||||
from __future__ import unicode_literals |
||||
|
||||
import re |
||||
|
||||
from .common import InfoExtractor |
||||
from ..utils import ( |
||||
int_or_none, |
||||
float_or_none, |
||||
str_to_int, |
||||
) |
||||
|
||||
|
||||
class VidmeIE(InfoExtractor): |
||||
_VALID_URL = r'https?://vid\.me/(?:e/)?(?P<id>[\da-zA-Z]+)' |
||||
_TEST = { |
||||
'url': 'https://vid.me/QNB', |
||||
'md5': 'f42d05e7149aeaec5c037b17e5d3dc82', |
||||
'info_dict': { |
||||
'id': 'QNB', |
||||
'ext': 'mp4', |
||||
'title': 'Fishing for piranha - the easy way', |
||||
'description': 'source: https://www.facebook.com/photo.php?v=312276045600871', |
||||
'duration': 119.92, |
||||
'timestamp': 1406313244, |
||||
'upload_date': '20140725', |
||||
'thumbnail': 're:^https?://.*\.jpg', |
||||
}, |
||||
} |
||||
|
||||
def _real_extract(self, url): |
||||
mobj = re.match(self._VALID_URL, url) |
||||
video_id = mobj.group('id') |
||||
|
||||
webpage = self._download_webpage(url, video_id) |
||||
|
||||
video_url = self._html_search_regex(r'<source src="([^"]+)"', webpage, 'video URL') |
||||
|
||||
title = self._og_search_title(webpage) |
||||
description = self._og_search_description(webpage, default='') |
||||
thumbnail = self._og_search_thumbnail(webpage) |
||||
timestamp = int_or_none(self._og_search_property('updated_time', webpage, fatal=False)) |
||||
width = int_or_none(self._og_search_property('video:width', webpage, fatal=False)) |
||||
height = int_or_none(self._og_search_property('video:height', webpage, fatal=False)) |
||||
duration = float_or_none(self._html_search_regex( |
||||
r'data-duration="([^"]+)"', webpage, 'duration', fatal=False)) |
||||
view_count = str_to_int(self._html_search_regex( |
||||
r'<span class="video_views">\s*([\d,\.]+)\s*plays?', webpage, 'view count', fatal=False)) |
||||
like_count = str_to_int(self._html_search_regex( |
||||
r'class="score js-video-vote-score"[^>]+data-score="([\d,\.\s]+)">', |
||||
webpage, 'like count', fatal=False)) |
||||
comment_count = str_to_int(self._html_search_regex( |
||||
r'class="js-comment-count"[^>]+data-count="([\d,\.\s]+)">', |
||||
webpage, 'comment count', fatal=False)) |
||||
|
||||
return { |
||||
'id': video_id, |
||||
'url': video_url, |
||||
'title': title, |
||||
'description': description, |
||||
'thumbnail': thumbnail, |
||||
'timestamp': timestamp, |
||||
'width': width, |
||||
'height': height, |
||||
'duration': duration, |
||||
'view_count': view_count, |
||||
'like_count': like_count, |
||||
'comment_count': comment_count, |
||||
} |
Loading…
Reference in new issue