mirror of
https://github.com/yt-dlp/yt-dlp.git
synced 2024-12-20 18:27:46 +01:00
86e5f3ed2e
Using https://github.com/asottile/pyupgrade 1. `__future__` imports and `coding: utf-8` were removed 2. Files were rewritten with `pyupgrade --py36-plus --keep-percent-format` 3. f-strings were cherry-picked from `pyupgrade --py36-plus` Extractors are left untouched (except removing header) to avoid unnecessary merge conflicts
46 lines
1.9 KiB
Python
46 lines
1.9 KiB
Python
from .common import InfoExtractor
|
|
from .jwplatform import JWPlatformIE
|
|
|
|
|
|
class BusinessInsiderIE(InfoExtractor):
|
|
_VALID_URL = r'https?://(?:[^/]+\.)?businessinsider\.(?:com|nl)/(?:[^/]+/)*(?P<id>[^/?#&]+)'
|
|
_TESTS = [{
|
|
'url': 'http://uk.businessinsider.com/how-much-radiation-youre-exposed-to-in-everyday-life-2016-6',
|
|
'md5': 'ffed3e1e12a6f950aa2f7d83851b497a',
|
|
'info_dict': {
|
|
'id': 'cjGDb0X9',
|
|
'ext': 'mp4',
|
|
'title': "Bananas give you more radiation exposure than living next to a nuclear power plant",
|
|
'description': 'md5:0175a3baf200dd8fa658f94cade841b3',
|
|
'upload_date': '20160611',
|
|
'timestamp': 1465675620,
|
|
},
|
|
}, {
|
|
'url': 'https://www.businessinsider.nl/5-scientifically-proven-things-make-you-less-attractive-2017-7/',
|
|
'md5': '43f438dbc6da0b89f5ac42f68529d84a',
|
|
'info_dict': {
|
|
'id': '5zJwd4FK',
|
|
'ext': 'mp4',
|
|
'title': 'Deze dingen zorgen ervoor dat je minder snel een date scoort',
|
|
'description': 'md5:2af8975825d38a4fed24717bbe51db49',
|
|
'upload_date': '20170705',
|
|
'timestamp': 1499270528,
|
|
},
|
|
}, {
|
|
'url': 'http://www.businessinsider.com/excel-index-match-vlookup-video-how-to-2015-2?IR=T',
|
|
'only_matching': True,
|
|
}]
|
|
|
|
def _real_extract(self, url):
|
|
video_id = self._match_id(url)
|
|
webpage = self._download_webpage(url, video_id)
|
|
jwplatform_id = self._search_regex(
|
|
(r'data-media-id=["\']([a-zA-Z0-9]{8})',
|
|
r'id=["\']jwplayer_([a-zA-Z0-9]{8})',
|
|
r'id["\']?\s*:\s*["\']?([a-zA-Z0-9]{8})',
|
|
r'(?:jwplatform\.com/players/|jwplayer_)([a-zA-Z0-9]{8})'),
|
|
webpage, 'jwplatform id')
|
|
return self.url_result(
|
|
'jwplatform:%s' % jwplatform_id, ie=JWPlatformIE.ie_key(),
|
|
video_id=video_id)
|