[extractor/voot] Fix extractor (#7227)
Closes #6715 Authored by: bashonly
This commit is contained in:
parent
d1795f4a6a
commit
4f7b11cc1c
1 changed files with 119 additions and 58 deletions
|
@ -1,14 +1,86 @@
|
||||||
|
import json
|
||||||
|
import time
|
||||||
|
import urllib.error
|
||||||
|
import uuid
|
||||||
|
|
||||||
from .common import InfoExtractor
|
from .common import InfoExtractor
|
||||||
from ..compat import compat_str
|
from ..compat import compat_str
|
||||||
from ..utils import (
|
from ..utils import (
|
||||||
ExtractorError,
|
ExtractorError,
|
||||||
|
float_or_none,
|
||||||
int_or_none,
|
int_or_none,
|
||||||
|
jwt_decode_hs256,
|
||||||
|
parse_age_limit,
|
||||||
|
traverse_obj,
|
||||||
|
try_call,
|
||||||
try_get,
|
try_get,
|
||||||
unified_timestamp,
|
unified_strdate,
|
||||||
)
|
)
|
||||||
|
|
||||||
|
|
||||||
class VootIE(InfoExtractor):
|
class VootBaseIE(InfoExtractor):
|
||||||
|
_NETRC_MACHINE = 'voot'
|
||||||
|
_GEO_BYPASS = False
|
||||||
|
_LOGIN_HINT = 'Log in with "-u <email_address> -p <password>", or use "-u token -p <auth_token>" to login with auth token.'
|
||||||
|
_TOKEN = None
|
||||||
|
_EXPIRY = 0
|
||||||
|
_API_HEADERS = {'Origin': 'https://www.voot.com', 'Referer': 'https://www.voot.com/'}
|
||||||
|
|
||||||
|
def _perform_login(self, username, password):
|
||||||
|
if self._TOKEN and self._EXPIRY:
|
||||||
|
return
|
||||||
|
|
||||||
|
if username.lower() == 'token' and try_call(lambda: jwt_decode_hs256(password)):
|
||||||
|
VootBaseIE._TOKEN = password
|
||||||
|
VootBaseIE._EXPIRY = jwt_decode_hs256(password)['exp']
|
||||||
|
self.report_login()
|
||||||
|
|
||||||
|
# Mobile number as username is not supported
|
||||||
|
elif not username.isdigit():
|
||||||
|
check_username = self._download_json(
|
||||||
|
'https://userauth.voot.com/usersV3/v3/checkUser', None, data=json.dumps({
|
||||||
|
'type': 'email',
|
||||||
|
'email': username
|
||||||
|
}, separators=(',', ':')).encode(), headers={
|
||||||
|
**self._API_HEADERS,
|
||||||
|
'Content-Type': 'application/json;charset=utf-8',
|
||||||
|
}, note='Checking username', expected_status=403)
|
||||||
|
if not traverse_obj(check_username, ('isExist', {bool})):
|
||||||
|
if traverse_obj(check_username, ('status', 'code', {int})) == 9999:
|
||||||
|
self.raise_geo_restricted(countries=['IN'])
|
||||||
|
raise ExtractorError('Incorrect username', expected=True)
|
||||||
|
auth_token = traverse_obj(self._download_json(
|
||||||
|
'https://userauth.voot.com/usersV3/v3/login', None, data=json.dumps({
|
||||||
|
'type': 'traditional',
|
||||||
|
'deviceId': str(uuid.uuid4()),
|
||||||
|
'deviceBrand': 'PC/MAC',
|
||||||
|
'data': {
|
||||||
|
'email': username,
|
||||||
|
'password': password
|
||||||
|
}
|
||||||
|
}, separators=(',', ':')).encode(), headers={
|
||||||
|
**self._API_HEADERS,
|
||||||
|
'Content-Type': 'application/json;charset=utf-8',
|
||||||
|
}, note='Logging in', expected_status=400), ('data', 'authToken', {dict}))
|
||||||
|
if not auth_token:
|
||||||
|
raise ExtractorError('Incorrect password', expected=True)
|
||||||
|
VootBaseIE._TOKEN = auth_token['accessToken']
|
||||||
|
VootBaseIE._EXPIRY = auth_token['expirationTime']
|
||||||
|
|
||||||
|
else:
|
||||||
|
raise ExtractorError(self._LOGIN_HINT, expected=True)
|
||||||
|
|
||||||
|
def _check_token_expiry(self):
|
||||||
|
if int(time.time()) >= self._EXPIRY:
|
||||||
|
raise ExtractorError('Access token has expired', expected=True)
|
||||||
|
|
||||||
|
def _real_initialize(self):
|
||||||
|
if not self._TOKEN:
|
||||||
|
self.raise_login_required(self._LOGIN_HINT, method=None)
|
||||||
|
self._check_token_expiry()
|
||||||
|
|
||||||
|
|
||||||
|
class VootIE(VootBaseIE):
|
||||||
_VALID_URL = r'''(?x)
|
_VALID_URL = r'''(?x)
|
||||||
(?:
|
(?:
|
||||||
voot:|
|
voot:|
|
||||||
|
@ -20,27 +92,25 @@ class VootIE(InfoExtractor):
|
||||||
)
|
)
|
||||||
(?P<id>\d{3,})
|
(?P<id>\d{3,})
|
||||||
'''
|
'''
|
||||||
_GEO_COUNTRIES = ['IN']
|
|
||||||
_TESTS = [{
|
_TESTS = [{
|
||||||
'url': 'https://www.voot.com/shows/ishq-ka-rang-safed/1/360558/is-this-the-end-of-kamini-/441353',
|
'url': 'https://www.voot.com/shows/ishq-ka-rang-safed/1/360558/is-this-the-end-of-kamini-/441353',
|
||||||
'info_dict': {
|
'info_dict': {
|
||||||
'id': '0_8ledb18o',
|
'id': '441353',
|
||||||
'ext': 'mp4',
|
'ext': 'mp4',
|
||||||
'title': 'Ishq Ka Rang Safed - Season 01 - Episode 340',
|
'title': 'Is this the end of Kamini?',
|
||||||
'description': 'md5:06291fbbbc4dcbe21235c40c262507c1',
|
'description': 'md5:06291fbbbc4dcbe21235c40c262507c1',
|
||||||
'timestamp': 1472162937,
|
'timestamp': 1472103000,
|
||||||
'upload_date': '20160825',
|
'upload_date': '20160825',
|
||||||
'series': 'Ishq Ka Rang Safed',
|
'series': 'Ishq Ka Rang Safed',
|
||||||
'season_number': 1,
|
'season_number': 1,
|
||||||
'episode': 'Is this the end of Kamini?',
|
'episode': 'Is this the end of Kamini?',
|
||||||
'episode_number': 340,
|
'episode_number': 340,
|
||||||
'view_count': int,
|
'release_date': '20160825',
|
||||||
'like_count': int,
|
'season': 'Season 1',
|
||||||
|
'age_limit': 13,
|
||||||
|
'duration': 1146.0,
|
||||||
},
|
},
|
||||||
'params': {
|
'params': {'skip_download': 'm3u8'},
|
||||||
'skip_download': True,
|
|
||||||
},
|
|
||||||
'expected_warnings': ['Failed to download m3u8 information'],
|
|
||||||
}, {
|
}, {
|
||||||
'url': 'https://www.voot.com/kids/characters/mighty-cat-masked-niyander-e-/400478/school-bag-disappears/440925',
|
'url': 'https://www.voot.com/kids/characters/mighty-cat-masked-niyander-e-/400478/school-bag-disappears/440925',
|
||||||
'only_matching': True,
|
'only_matching': True,
|
||||||
|
@ -55,59 +125,50 @@ class VootIE(InfoExtractor):
|
||||||
def _real_extract(self, url):
|
def _real_extract(self, url):
|
||||||
video_id = self._match_id(url)
|
video_id = self._match_id(url)
|
||||||
media_info = self._download_json(
|
media_info = self._download_json(
|
||||||
'https://wapi.voot.com/ws/ott/getMediaInfo.json', video_id,
|
'https://psapi.voot.com/jio/voot/v1/voot-web/content/query/asset-details', video_id,
|
||||||
query={
|
query={'ids': f'include:{video_id}', 'responseType': 'common'}, headers={'accesstoken': self._TOKEN})
|
||||||
'platform': 'Web',
|
|
||||||
'pId': 2,
|
|
||||||
'mediaId': video_id,
|
|
||||||
})
|
|
||||||
|
|
||||||
status_code = try_get(media_info, lambda x: x['status']['code'], int)
|
try:
|
||||||
if status_code != 0:
|
m3u8_url = self._download_json(
|
||||||
raise ExtractorError(media_info['status']['message'], expected=True)
|
'https://vootapi.media.jio.com/playback/v1/playbackrights', video_id,
|
||||||
|
'Downloading playback JSON', data=b'{}', headers={
|
||||||
|
**self.geo_verification_headers(),
|
||||||
|
**self._API_HEADERS,
|
||||||
|
'Content-Type': 'application/json;charset=utf-8',
|
||||||
|
'platform': 'androidwebdesktop',
|
||||||
|
'vootid': video_id,
|
||||||
|
'voottoken': self._TOKEN,
|
||||||
|
})['m3u8']
|
||||||
|
except ExtractorError as e:
|
||||||
|
if isinstance(e.cause, urllib.error.HTTPError) and e.cause.code == 400:
|
||||||
|
self._check_token_expiry()
|
||||||
|
raise
|
||||||
|
|
||||||
media = media_info['assets']
|
formats = self._extract_m3u8_formats(m3u8_url, video_id, 'mp4', m3u8_id='hls')
|
||||||
|
self._remove_duplicate_formats(formats)
|
||||||
|
|
||||||
entry_id = media['EntryId']
|
|
||||||
title = media['MediaName']
|
|
||||||
formats = self._extract_m3u8_formats(
|
|
||||||
'https://cdnapisec.kaltura.com/p/1982551/playManifest/pt/https/f/applehttp/t/web/e/' + entry_id,
|
|
||||||
video_id, 'mp4', m3u8_id='hls')
|
|
||||||
|
|
||||||
description, series, season_number, episode, episode_number = [None] * 5
|
|
||||||
|
|
||||||
for meta in try_get(media, lambda x: x['Metas'], list) or []:
|
|
||||||
key, value = meta.get('Key'), meta.get('Value')
|
|
||||||
if not key or not value:
|
|
||||||
continue
|
|
||||||
if key == 'ContentSynopsis':
|
|
||||||
description = value
|
|
||||||
elif key == 'RefSeriesTitle':
|
|
||||||
series = value
|
|
||||||
elif key == 'RefSeriesSeason':
|
|
||||||
season_number = int_or_none(value)
|
|
||||||
elif key == 'EpisodeMainTitle':
|
|
||||||
episode = value
|
|
||||||
elif key == 'EpisodeNo':
|
|
||||||
episode_number = int_or_none(value)
|
|
||||||
return {
|
return {
|
||||||
'extractor_key': 'Kaltura',
|
'id': video_id,
|
||||||
'id': entry_id,
|
# '/_definst_/smil:vod/' m3u8 manifests claim to have 720p+ formats but max out at 480p
|
||||||
'title': title,
|
'formats': traverse_obj(formats, (
|
||||||
'description': description,
|
lambda _, v: '/_definst_/smil:vod/' not in v['url'] or v['height'] <= 480)),
|
||||||
'series': series,
|
'http_headers': self._API_HEADERS,
|
||||||
'season_number': season_number,
|
**traverse_obj(media_info, ('result', 0, {
|
||||||
'episode': episode,
|
'title': ('fullTitle', {str}),
|
||||||
'episode_number': episode_number,
|
'description': ('fullSynopsis', {str}),
|
||||||
'timestamp': unified_timestamp(media.get('CreationDate')),
|
'series': ('showName', {str}),
|
||||||
'duration': int_or_none(media.get('Duration')),
|
'season_number': ('season', {int_or_none}),
|
||||||
'view_count': int_or_none(media.get('ViewCounter')),
|
'episode': ('fullTitle', {str}),
|
||||||
'like_count': int_or_none(media.get('like_counter')),
|
'episode_number': ('episode', {int_or_none}),
|
||||||
'formats': formats,
|
'timestamp': ('uploadTime', {int_or_none}),
|
||||||
|
'release_date': ('telecastDate', {unified_strdate}),
|
||||||
|
'age_limit': ('ageNemonic', {parse_age_limit}),
|
||||||
|
'duration': ('duration', {float_or_none}),
|
||||||
|
})),
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
||||||
class VootSeriesIE(InfoExtractor):
|
class VootSeriesIE(VootBaseIE):
|
||||||
_VALID_URL = r'https?://(?:www\.)?voot\.com/shows/[^/]+/(?P<id>\d{3,})'
|
_VALID_URL = r'https?://(?:www\.)?voot\.com/shows/[^/]+/(?P<id>\d{3,})'
|
||||||
_TESTS = [{
|
_TESTS = [{
|
||||||
'url': 'https://www.voot.com/shows/chakravartin-ashoka-samrat/100002',
|
'url': 'https://www.voot.com/shows/chakravartin-ashoka-samrat/100002',
|
||||||
|
|
Loading…
Reference in a new issue