You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
98 lines
3.2 KiB
98 lines
3.2 KiB
# coding: utf-8 |
|
from __future__ import unicode_literals |
|
|
|
from .common import InfoExtractor |
|
from ..compat import compat_chr |
|
from ..utils import ( |
|
determine_ext, |
|
ExtractorError, |
|
) |
|
|
|
|
|
class OpenloadIE(InfoExtractor):
    """Information extractor for openload.co / openload.io / oload.tv pages.

    The embed page carries a hidden ``<span>`` whose digit-only text encodes
    the stream path; ``_real_extract`` decodes it and builds the final
    ``https://openload.co/stream/...`` URL.
    """

    _VALID_URL = r'https?://(?:openload\.(?:co|io)|oload\.tv)/(?:f|embed)/(?P<id>[a-zA-Z0-9-_]+)'

    _TESTS = [{
        'url': 'https://openload.co/f/kUEfGclsU9o',
        'md5': 'bf1c059b004ebc7a256f89408e65c36e',
        'info_dict': {
            'id': 'kUEfGclsU9o',
            'ext': 'mp4',
            'title': 'skyrim_no-audio_1080.mp4',
            'thumbnail': r're:^https?://.*\.jpg$',
        },
    }, {
        'url': 'https://openload.co/embed/rjC09fkPLYs',
        'info_dict': {
            'id': 'rjC09fkPLYs',
            'ext': 'mp4',
            'title': 'movie.mp4',
            'thumbnail': r're:^https?://.*\.jpg$',
            'subtitles': {
                'en': [{
                    'ext': 'vtt',
                }],
            },
        },
        'params': {
            'skip_download': True,  # test subtitles only
        },
    }, {
        'url': 'https://openload.co/embed/kUEfGclsU9o/skyrim_no-audio_1080.mp4',
        'only_matching': True,
    }, {
        'url': 'https://openload.io/f/ZAn6oz-VZGE/',
        'only_matching': True,
    }, {
        'url': 'https://openload.co/f/_-ztPaZtMhM/',
        'only_matching': True,
    }, {
        # unavailable via https://openload.co/f/Sxz5sADo82g/, different layout
        # for title and ext
        'url': 'https://openload.co/embed/Sxz5sADo82g/',
        'only_matching': True,
    }, {
        'url': 'https://oload.tv/embed/KnG-kKZdcfY/',
        'only_matching': True,
    }]

    @staticmethod
    def _decode_stream_code(ol_id):
        """Decode the digit string found in the embed page into the stream code.

        Layout of ``ol_id`` as consumed here: the first two digits form a
        key; every following group of five digits yields one character,
        computed as ``<3-digit value> - key * <2-digit multiplier>``.

        Raises ValueError when a group is truncated so that a number cannot
        be parsed, or when a computed code point is not a valid character.
        """
        key = int(ol_id[:2])
        return ''.join(
            compat_chr(
                int(ol_id[pos:pos + 3]) - key * int(ol_id[pos + 3:pos + 5]))
            for pos in range(2, len(ol_id), 5))

    def _real_extract(self, url):
        """Return the info dict (id, title, thumbnail, url, ext, subtitles) for *url*.

        Raises ExtractorError when the page reports a missing/deleted file or
        when the encoded stream ID cannot be decoded.
        """
        video_id = self._match_id(url)
        # Always fetch the embed page, whichever URL form was given.
        webpage = self._download_webpage(
            'https://openload.co/embed/%s/' % video_id, video_id)

        if 'File not found' in webpage or 'deleted by the owner' in webpage:
            raise ExtractorError('File not found', expected=True)

        ol_id = self._search_regex(
            r'<span[^>]+id="[a-zA-Z0-9]+x"[^>]*>([0-9]+)</span>',
            webpage, 'openload ID')

        # A malformed ID would otherwise surface as a bare ValueError;
        # report it through the extractor's own error type instead.
        try:
            urlcode = self._decode_stream_code(ol_id)
        except ValueError:
            raise ExtractorError('Unable to decode openload ID')

        video_url = 'https://openload.co/stream/' + urlcode

        # Try progressively less specific sources for the title; the last
        # lookup is fatal so a missing title aborts extraction.
        title = self._og_search_title(webpage, default=None) or self._search_regex(
            r'<span[^>]+class=["\']title["\'][^>]*>([^<]+)', webpage,
            'title', default=None) or self._html_search_meta(
            'description', webpage, 'title', fatal=True)

        # Only the subtitles of the first parsed HTML5 media entry are used.
        entries = self._parse_html5_media_entries(url, webpage, video_id)
        subtitles = entries[0]['subtitles'] if entries else None

        return {
            'id': video_id,
            'title': title,
            'thumbnail': self._og_search_thumbnail(webpage, default=None),
            'url': video_url,
            # Seems all videos have extensions in their titles
            'ext': determine_ext(title),
            'subtitles': subtitles,
        }
|
|
|