Skip to content

Commit

Permalink
[vivo] Fix extraction (closes #22328, closes #22279)
Browse files Browse the repository at this point in the history
  • Loading branch information
dstftw authored and pareronia committed Jun 22, 2020
1 parent 6a8ae7a commit a4eaef1
Showing 1 changed file with 19 additions and 8 deletions.
27 changes: 19 additions & 8 deletions youtube_dl/extractor/shared.py
Original file line number Diff line number Diff line change
@@ -1,13 +1,18 @@
from __future__ import unicode_literals

from .common import InfoExtractor
from ..compat import compat_b64decode
from ..compat import (
compat_b64decode,
compat_urllib_parse_unquote_plus,
)
from ..utils import (
determine_ext,
ExtractorError,
int_or_none,
js_to_json,
KNOWN_EXTENSIONS,
parse_filesize,
rot47,
url_or_none,
urlencode_postdata,
)
Expand Down Expand Up @@ -112,16 +117,22 @@ def _extract_filesize(self, webpage):
webpage, 'filesize', fatal=False))

def _extract_video_url(self, webpage, video_id, url):
def decode_url(encoded_url):
def decode_url_old(encoded_url):
return compat_b64decode(encoded_url).decode('utf-8')

stream_url = url_or_none(decode_url(self._search_regex(
stream_url = self._search_regex(
r'data-stream\s*=\s*(["\'])(?P<url>(?:(?!\1).)+)\1', webpage,
'stream url', default=None, group='url')))
'stream url', default=None, group='url')
if stream_url:
stream_url = url_or_none(decode_url_old(stream_url))
if stream_url:
return stream_url
return self._parse_json(

def decode_url(encoded_url):
return rot47(compat_urllib_parse_unquote_plus(encoded_url))

return decode_url(self._parse_json(
self._search_regex(
r'InitializeStream\s*\(\s*(["\'])(?P<url>(?:(?!\1).)+)\1',
webpage, 'stream', group='url'),
video_id, transform_source=decode_url)[0]
r'(?s)InitializeStream\s*\(\s*({.+?})\s*\)\s*;', webpage,
'stream'),
video_id, transform_source=js_to_json)['source'])

0 comments on commit a4eaef1

Please sign in to comment.