You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
128 lines
4.0 KiB
128 lines
4.0 KiB
# coding: utf-8 |
|
from __future__ import unicode_literals |
|
|
|
import re |
|
|
|
from .common import InfoExtractor |
|
from ..compat import compat_chr |
|
from ..utils import ( |
|
determine_ext, |
|
ExtractorError, |
|
) |
|
|
|
|
|
class OpenloadIE(InfoExtractor): |
|
_VALID_URL = r'https?://(?:openload\.(?:co|io)|oload\.tv)/(?:f|embed)/(?P<id>[a-zA-Z0-9-_]+)' |
|
|
|
_TESTS = [{ |
|
'url': 'https://openload.co/f/kUEfGclsU9o', |
|
'md5': 'bf1c059b004ebc7a256f89408e65c36e', |
|
'info_dict': { |
|
'id': 'kUEfGclsU9o', |
|
'ext': 'mp4', |
|
'title': 'skyrim_no-audio_1080.mp4', |
|
'thumbnail': r're:^https?://.*\.jpg$', |
|
}, |
|
}, { |
|
'url': 'https://openload.co/embed/rjC09fkPLYs', |
|
'info_dict': { |
|
'id': 'rjC09fkPLYs', |
|
'ext': 'mp4', |
|
'title': 'movie.mp4', |
|
'thumbnail': r're:^https?://.*\.jpg$', |
|
'subtitles': { |
|
'en': [{ |
|
'ext': 'vtt', |
|
}], |
|
}, |
|
}, |
|
'params': { |
|
'skip_download': True, # test subtitles only |
|
}, |
|
}, { |
|
'url': 'https://openload.co/embed/kUEfGclsU9o/skyrim_no-audio_1080.mp4', |
|
'only_matching': True, |
|
}, { |
|
'url': 'https://openload.io/f/ZAn6oz-VZGE/', |
|
'only_matching': True, |
|
}, { |
|
'url': 'https://openload.co/f/_-ztPaZtMhM/', |
|
'only_matching': True, |
|
}, { |
|
# unavailable via https://openload.co/f/Sxz5sADo82g/, different layout |
|
# for title and ext |
|
'url': 'https://openload.co/embed/Sxz5sADo82g/', |
|
'only_matching': True, |
|
}, { |
|
'url': 'https://oload.tv/embed/KnG-kKZdcfY/', |
|
'only_matching': True, |
|
}] |
|
|
|
@staticmethod |
|
def _extract_urls(webpage): |
|
return re.findall( |
|
r'<iframe[^>]+src=["\']((?:https?://)?(?:openload\.(?:co|io)|oload\.tv)/embed/[a-zA-Z0-9-_]+)', |
|
webpage) |
|
|
|
def _real_extract(self, url): |
|
video_id = self._match_id(url) |
|
webpage = self._download_webpage('https://openload.co/embed/%s/' % video_id, video_id) |
|
|
|
if 'File not found' in webpage or 'deleted by the owner' in webpage: |
|
raise ExtractorError('File not found', expected=True) |
|
|
|
ol_id = self._search_regex( |
|
'<span[^>]+id="[^"]+"[^>]*>([0-9A-Za-z]+)</span>', |
|
webpage, 'openload ID') |
|
|
|
decoded = '' |
|
a = ol_id[0:24] |
|
b = [] |
|
for i in range(0, len(a), 8): |
|
b.append(int(a[i:i + 8] or '0', 16)) |
|
ol_id = ol_id[24:] |
|
j = 0 |
|
k = 0 |
|
while j < len(ol_id): |
|
c = 128 |
|
d = 0 |
|
e = 0 |
|
f = 0 |
|
_more = True |
|
while _more: |
|
if j + 1 >= len(ol_id): |
|
c = 143 |
|
f = int(ol_id[j:j + 2] or '0', 16) |
|
j += 2 |
|
d += (f & 127) << e |
|
e += 7 |
|
_more = f >= c |
|
g = d ^ b[k % 3] |
|
for i in range(4): |
|
char_dec = (g >> 8 * i) & (c + 127) |
|
char = compat_chr(char_dec) |
|
if char != '#': |
|
decoded += char |
|
k += 1 |
|
|
|
video_url = 'https://openload.co/stream/%s?mime=true' |
|
video_url = video_url % decoded |
|
|
|
title = self._og_search_title(webpage, default=None) or self._search_regex( |
|
r'<span[^>]+class=["\']title["\'][^>]*>([^<]+)', webpage, |
|
'title', default=None) or self._html_search_meta( |
|
'description', webpage, 'title', fatal=True) |
|
|
|
entries = self._parse_html5_media_entries(url, webpage, video_id) |
|
subtitles = entries[0]['subtitles'] if entries else None |
|
|
|
info_dict = { |
|
'id': video_id, |
|
'title': title, |
|
'thumbnail': self._og_search_thumbnail(webpage, default=None), |
|
'url': video_url, |
|
# Seems all videos have extensions in their titles |
|
'ext': determine_ext(title, 'mp4'), |
|
'subtitles': subtitles, |
|
} |
|
return info_dict
|
|
|