youtube-dl/youtube_dl/extractor/howcast.py

from __future__ import unicode_literals

import re

from .common import InfoExtractor


class HowcastIE(InfoExtractor):
    """Extractor for video pages under howcast.com/videos/<numeric id>."""

    # Matches http or https, with or without a "www." prefix. The run of
    # digits after "/videos/" is captured as the named group "id"; whatever
    # follows the digits (such as a title slug) is not part of the pattern.
    _VALID_URL = r'https?://(?:www\.)?howcast\.com/videos/(?P<id>\d+)'

    # Sample URL plus the file checksum and metadata fields expected for it.
    _TEST = {
        'url': 'http://www.howcast.com/videos/390161-How-to-Tie-a-Square-Knot-Properly',
        'md5': '8b743df908c42f60cf6496586c7f12c3',
        'info_dict': {
            'id': '390161',
            'ext': 'mp4',
            'description': 'The square knot, also known as the reef knot, is one of the oldest, most basic knots to tie, and can be used in many different ways. Here\'s the proper way to tie a square knot.',
            'title': 'How to Tie a Square Knot Properly',
        }
    }

    def _real_extract(self, url):
        """Build the info dict for the Howcast video page at *url*.

        The numeric id is taken from *url* via ``_VALID_URL``, the page is
        fetched with ``self._download_webpage``, and the media URL,
        description, title and thumbnail are pulled out of the page text.

        Returns a dict with the keys ``id``, ``url``, ``title``,
        ``description`` and ``thumbnail``.
        """
        video_id = re.match(self._VALID_URL, url).group('id')
        page = self._download_webpage(url, video_id)

        self.report_extraction(video_id)

        # The player config carries a `file: "<url>"` entry (the key may be
        # wrapped in single quotes); only mobile-media .mp4 URLs are accepted.
        media_url = self._search_regex(
            r'\'?file\'?: "(http://mobile-media\.howcast\.com/[0-9]+\.mp4)',
            page, 'video URL')

        # The description <meta> content may be double- or single-quoted, so
        # the pattern has one capture group per quoting style. The lookup is
        # explicitly non-fatal (fatal=False).
        description = self._html_search_regex(
            r'<meta content=(?:"([^"]+)"|\'([^\']+)\') name=\'description\'',
            page, 'description', fatal=False)

        info = {'id': video_id, 'url': media_url}
        info['title'] = self._og_search_title(page)
        info['description'] = description
        info['thumbnail'] = self._og_search_thumbnail(page)
        return info
[howcast] Modernize 2014-02-10 20:45:17 +01:00			`from __future__ import unicode_literals`

[howcast] Move into own file 2013-06-23 22:30:16 +02:00			`import re`

			`from .common import InfoExtractor`


			`class HowcastIE(InfoExtractor):`
[howcast] Modernize 2014-02-10 20:45:17 +01:00			`_VALID_URL = r'https?://(?:www\.)?howcast\.com/videos/(?P<id>\d+)'`
Move tests to the IE definitions 2013-06-27 20:46:46 +02:00			`_TEST = {`
[howcast] Modernize 2014-02-10 20:45:17 +01:00			`'url': 'http://www.howcast.com/videos/390161-How-to-Tie-a-Square-Knot-Properly',`
			`'md5': '8b743df908c42f60cf6496586c7f12c3',`
			`'info_dict': {`
			`'id': '390161',`
			`'ext': 'mp4',`
PEP8 applied 2014-11-23 20:41:03 +01:00			`'description': 'The square knot, also known as the reef knot, is one of the oldest, most basic knots to tie, and can be used in many different ways. Here\'s the proper way to tie a square knot.',`
[howcast] Modernize 2014-02-10 20:45:17 +01:00			`'title': 'How to Tie a Square Knot Properly',`
Move tests to the IE definitions 2013-06-27 20:46:46 +02:00			`}`
			`}`
[howcast] Move into own file 2013-06-23 22:30:16 +02:00
			`def _real_extract(self, url):`
			`mobj = re.match(self._VALID_URL, url)`

			`video_id = mobj.group('id')`
[howcast] Do not download from http://www.howcast.com/videos/{video_id} It takes too much to follow the redirection. 2013-09-11 17:36:23 +02:00			`webpage = self._download_webpage(url, video_id)`
[howcast] Move into own file 2013-06-23 22:30:16 +02:00
			`self.report_extraction(video_id)`

			`video_url = self._search_regex(r'\'?file\'?: "(http://mobile-media\.howcast\.com/[0-9]+\.mp4)',`
PEP8: applied even more rules 2014-11-23 21:39:15 +01:00			`webpage, 'video URL')`
[howcast] Move into own file 2013-06-23 22:30:16 +02:00
			`video_description = self._html_search_regex(r'<meta content=(?:"([^"]+)"|\'([^\']+)\') name=\'description\'',`
PEP8: applied even more rules 2014-11-23 21:39:15 +01:00			`webpage, 'description', fatal=False)`
[howcast] Move into own file 2013-06-23 22:30:16 +02:00
[howcast] Modernize 2014-02-10 20:45:17 +01:00			`return {`
			`'id': video_id,`
			`'url': video_url,`
			`'title': self._og_search_title(webpage),`
[howcast] Move into own file 2013-06-23 22:30:16 +02:00			`'description': video_description,`
[howcast] Modernize 2014-02-10 20:45:17 +01:00			`'thumbnail': self._og_search_thumbnail(webpage),`
			`}`