[thescene] fix extraction (closes #13061)

This commit is contained in:
Remita Amine 2017-05-12 16:32:38 +01:00
parent 6c52477f59
commit 7ad4362357

View File

@ -3,10 +3,6 @@
from .common import InfoExtractor from .common import InfoExtractor
from ..compat import compat_urlparse from ..compat import compat_urlparse
from ..utils import (
int_or_none,
qualities,
)
class TheSceneIE(InfoExtractor): class TheSceneIE(InfoExtractor):
@ -24,6 +20,9 @@ class TheSceneIE(InfoExtractor):
'season': 'Ready To Wear Spring 2013', 'season': 'Ready To Wear Spring 2013',
'tags': list, 'tags': list,
'categories': list, 'categories': list,
'upload_date': '20120913',
'timestamp': 1347512400,
'uploader': 'vogue',
}, },
} }
@ -37,32 +36,9 @@ def _real_extract(self, url):
self._html_search_regex( self._html_search_regex(
r'id=\'js-player-script\'[^>]+src=\'(.+?)\'', webpage, 'player url')) r'id=\'js-player-script\'[^>]+src=\'(.+?)\'', webpage, 'player url'))
player = self._download_webpage(player_url, display_id)
info = self._parse_json(
self._search_regex(
r'(?m)video\s*:\s*({.+?}),$', player, 'info json'),
display_id)
video_id = info['id']
title = info['title']
qualities_order = qualities(('low', 'high'))
formats = [{
'format_id': '{0}-{1}'.format(f['type'].split('/')[0], f['quality']),
'url': f['src'],
'quality': qualities_order(f['quality']),
} for f in info['sources']]
self._sort_formats(formats)
return { return {
'id': video_id, '_type': 'url_transparent',
'display_id': display_id, 'display_id': display_id,
'title': title, 'url': player_url,
'formats': formats, 'ie_key': 'CondeNast',
'thumbnail': info.get('poster_frame'),
'duration': int_or_none(info.get('duration')),
'series': info.get('series_title'),
'season': info.get('season_title'),
'tags': info.get('tags'),
'categories': info.get('categories'),
} }