from __future__ import unicode_literals

from .common import InfoExtractor
from ..utils import int_or_none


class VimpleIE(InfoExtractor):
    """Information extractor for videos addressed by vimple.ru URLs.

    Both the site URL form (``vimple.ru/<id>``) and the embeddable player
    form (``player.vimple.ru/iframe/<id>``) are accepted; extraction always
    goes through the player iframe page.
    """

    IE_DESC = 'Vimple - one-click video hosting'
    _VALID_URL = r'https?://(?:player\.vimple\.ru/iframe|vimple\.ru)/(?P<id>[\da-f-]{32,36})'
    _TESTS = [
        {
            'url': 'http://vimple.ru/c0f6b1687dcd4000a97ebe70068039cf',
            'md5': '2e750a330ed211d3fd41821c6ad9a279',
            'info_dict': {
                'id': 'c0f6b168-7dcd-4000-a97e-be70068039cf',
                'ext': 'mp4',
                'title': 'Sunset',
                'duration': 20,
                # Raw string: '\.' is not a valid escape sequence in a
                # regular string literal.
                'thumbnail': r're:https?://.*?\.jpg',
            },
        }, {
            'url': 'http://player.vimple.ru/iframe/52e1beec-1314-4a83-aeac-c61562eadbf9',
            'only_matching': True,
        }
    ]

    def _real_extract(self, url):
        """Extract video metadata and formats for a Vimple URL.

        Downloads the player iframe page for the id matched from ``url``,
        parses the JSON object assigned to ``sprutoData`` in that page and
        reads the first entry of its ``playlist`` list.

        Returns a dict with the keys ``id``, ``title``, ``thumbnail``,
        ``duration`` and ``formats``.
        """
        video_id = self._match_id(url)

        webpage = self._download_webpage(
            'http://player.vimple.ru/iframe/%s' % video_id, video_id)

        # The JSON object is expected on a single line terminated by a comma
        # and a line break; accept both CRLF and bare LF line endings.
        playlist = self._parse_json(
            self._search_regex(
                r'sprutoData\s*:\s*({.+?}),\r?\n', webpage, 'spruto data'),
            video_id)['playlist'][0]

        title = playlist['title']
        # Prefer the id reported by the player data over the one from the URL.
        video_id = playlist.get('videoId') or video_id
        thumbnail = playlist.get('posterUrl') or playlist.get('thumbnailUrl')
        duration = int_or_none(playlist.get('duration'))

        # Skip entries without a URL instead of failing with KeyError.
        formats = [{
            'url': f['url'],
        } for f in playlist['video'] if f.get('url')]
        self._sort_formats(formats)

        return {
            'id': video_id,
            'title': title,
            'thumbnail': thumbnail,
            'duration': duration,
            'formats': formats,
        }