youtube-dl/youtube_dl/extractor/hark.py

# coding: utf-8
from __future__ import unicode_literals

from .common import InfoExtractor


class HarkIE(InfoExtractor):
    # Extractor for hark.com clip pages. The 'id' group lazily captures the
    # text between '/clips/' and a hyphen; the rest of the slug is ignored.
    _VALID_URL = r'https?://(?:www\.)?hark\.com/clips/(?P<id>.+?)-.+'

    # Sample clip with the metadata values expected for it.
    _TEST = {
        'url': 'http://www.hark.com/clips/mmbzyhkgny-obama-beyond-the-afghan-theater-we-only-target-al-qaeda-on-may-23-2013',
        'md5': '6783a58491b47b92c7c1af5a77d4cbee',
        'info_dict': {
            'id': 'mmbzyhkgny',
            'ext': 'mp3',
            'title': 'Obama: \'Beyond The Afghan Theater, We Only Target Al Qaeda\' on May 23, 2013',
            'description': 'President Barack Obama addressed the nation live on May 23, 2013 in a speech aimed at addressing counter-terrorism policies including the use of drone strikes, detainees at Guantanamo Bay prison facility, and American citizens who are terrorists.',
            'duration': 11,
        }
    }

    def _real_extract(self, url):
        """Build the info dict for a clip from its ``.json`` metadata document.

        The clip id is obtained from ``url`` via ``self._match_id``; the
        metadata is then downloaded from ``/clips/<id>.json``. The ``url`` and
        ``name`` entries of that document are required (indexed directly),
        while description, thumbnail and duration are looked up with ``.get``.
        """
        clip_id = self._match_id(url)
        metadata_url = 'http://www.hark.com/clips/%s.json' % clip_id
        clip = self._download_json(metadata_url, clip_id)

        # Mandatory entries first: direct indexing raises if they are absent.
        info = {
            'id': clip_id,
            'url': clip['url'],
            'title': clip['name'],
        }

        # Optional entries, as (info dict key, metadata key) pairs.
        # NOTE(review): presumably .get yields None for a missing key, which
        # assumes the metadata document is a JSON object -- confirm.
        optional_fields = (
            ('description', 'description'),
            ('thumbnail', 'image_original'),
            ('duration', 'duration'),
        )
        for info_key, metadata_key in optional_fields:
            info[info_key] = clip.get(metadata_key)

        return info
Unify coding cookie 2016-10-02 13:39:18 +02:00			`# coding: utf-8`
[hark] Modernize 2014-10-24 22:31:55 +02:00			`from __future__ import unicode_literals`
Added an IE for hark.com 2013-08-11 19:23:05 +02:00
			`from .common import InfoExtractor`
[hark] Modernize 2014-10-24 22:31:55 +02:00
Added an IE for hark.com 2013-08-11 19:23:05 +02:00
			`class HarkIE(InfoExtractor):`
Improve some _VALID_URLs 2016-09-08 13:29:05 +02:00			`_VALID_URL = r'https?://(?:www\.)?hark\.com/clips/(?P<id>.+?)-.+'`
Added an IE for hark.com 2013-08-11 19:23:05 +02:00			`_TEST = {`
[hark] Modernize 2014-10-24 22:31:55 +02:00			`'url': 'http://www.hark.com/clips/mmbzyhkgny-obama-beyond-the-afghan-theater-we-only-target-al-qaeda-on-may-23-2013',`
			`'md5': '6783a58491b47b92c7c1af5a77d4cbee',`
			`'info_dict': {`
			`'id': 'mmbzyhkgny',`
			`'ext': 'mp3',`
			`'title': 'Obama: \'Beyond The Afghan Theater, We Only Target Al Qaeda\' on May 23, 2013',`
			`'description': 'President Barack Obama addressed the nation live on May 23, 2013 in a speech aimed at addressing counter-terrorism policies including the use of drone strikes, detainees at Guantanamo Bay prison facility, and American citizens who are terrorists.',`
			`'duration': 11,`
Added an IE for hark.com 2013-08-11 19:23:05 +02:00			`}`
			`}`

			`def _real_extract(self, url):`
[hark] Modernize 2014-10-24 22:31:55 +02:00			`video_id = self._match_id(url)`
			`data = self._download_json(`
			`'http://www.hark.com/clips/%s.json' % video_id, video_id)`
Added an IE for hark.com 2013-08-11 19:23:05 +02:00
[hark] Modernize 2014-10-24 22:31:55 +02:00			`return {`
			`'id': video_id,`
			`'url': data['url'],`
			`'title': data['name'],`
			`'description': data.get('description'),`
			`'thumbnail': data.get('image_original'),`
			`'duration': data.get('duration'),`
			`}`