youtube-dl/youtube_dl/extractor/wimp.py

from __future__ import unicode_literals

from .common import InfoExtractor
from .youtube import YoutubeIE


class WimpIE(InfoExtractor):
    """Extractor for wimp.com pages (see ``_VALID_URL``).

    When the page references a YouTube video, extraction is delegated to
    ``YoutubeIE``; otherwise the result comes from
    ``self._extract_jwplayer_data`` with id, title and description
    overridden from the page itself.
    """

    # The path segment right after the host is captured as the video id.
    _VALID_URL = r'https?://(?:www\.)?wimp\.com/(?P<id>[^/]+)'

    _TESTS = [
        # Expected 'id' is the URL slug.
        {
            'url': 'http://www.wimp.com/maru-is-exhausted/',
            'md5': 'ee21217ffd66d058e8b16be340b74883',
            'info_dict': {
                'id': 'maru-is-exhausted',
                'ext': 'mp4',
                'title': 'Maru is exhausted.',
                'description': 'md5:57e099e857c0a4ea312542b684a869b8',
            },
        },
        # Expected 'id' is an 11-character id and the Youtube extractor is
        # listed as an additional IE.
        {
            'url': 'http://www.wimp.com/clowncar/',
            'md5': '5c31ad862a90dc5b1f023956faec13fe',
            'info_dict': {
                'id': 'cG4CEr2aiSg',
                'ext': 'webm',
                'title': 'Basset hound clown car...incredible!',
                'description': (
                    '5 of my Bassets crawled in this dog loo! '
                    'www.bellinghambassets.com\n\n'
                    'For licensing/usage please contact: '
                    'licensing(at)jukinmediadotcom'),
                'upload_date': '20140303',
                'uploader': 'Gretchen Hoey',
                'uploader_id': 'gretchenandjeff1',
            },
            'add_ie': ['Youtube'],
        },
    ]

    def _real_extract(self, url):
        """Extract the video referenced by a wimp.com ``url``.

        Returns ``self.url_result(...)`` keyed to ``YoutubeIE`` when an
        11-character id is found in the page; otherwise returns the mapping
        produced by ``self._extract_jwplayer_data`` updated with ``id``,
        ``title`` and ``description``.
        """
        page_id = self._match_id(url)
        html = self._download_webpage(url, page_id)

        # Both patterns capture an 11-character id made of [0-9A-Za-z_-]:
        # one from a ``videoId: "..."`` assignment, one from a ``data-id``
        # attribute.
        youtube_id_patterns = (
            r"videoId\s*:\s*[\"']([0-9A-Za-z_-]{11})[\"']",
            r'data-id=["\']([0-9A-Za-z_-]{11})',
        )
        embedded_id = self._search_regex(
            youtube_id_patterns, html, 'video URL', default=None)

        # default=None above makes a missing id a normal, non-fatal outcome.
        if embedded_id:
            return self.url_result(embedded_id, YoutubeIE.ie_key())

        # No YouTube reference found: fall back to the JWPlayer helper.
        # NOTE(review): presumably this parses an embedded JWPlayer setup
        # from the page - confirm against InfoExtractor.
        result = self._extract_jwplayer_data(
            html, page_id, require_title=False)

        # The helper is called with require_title=False, so title (and the
        # other metadata) are supplied here from the og-search helpers.
        result.update({
            'id': page_id,
            'title': self._og_search_title(html),
            'description': self._og_search_description(html),
        })
        return result
[Wimp] Use new URL relay method 2014-01-22 02:01:23 +01:00			`from __future__ import unicode_literals`

[generic] Try parsing JWPlayer embedded videos (closes #12030) 2017-02-16 16:42:36 +01:00			`from .common import InfoExtractor`
[wimp] Detect youtube videos (fixes #2686) 2014-04-03 20:44:51 +02:00			`from .youtube import YoutubeIE`
added an IE for wimp.com 2013-06-26 12:25:53 +02:00

[generic] Try parsing JWPlayer embedded videos (closes #12030) 2017-02-16 16:42:36 +01:00			`class WimpIE(InfoExtractor):`
Add support for https for all extractors as preventive and future-proof measure 2016-03-21 16:36:32 +01:00			`_VALID_URL = r'https?://(?:www\.)?wimp\.com/(?P<id>[^/]+)'`
[wimp] Detect youtube videos (fixes #2686) 2014-04-03 20:44:51 +02:00			`_TESTS = [{`
[wimp] Fix extraction and update _TESTS 2016-06-16 06:27:21 +02:00			`'url': 'http://www.wimp.com/maru-is-exhausted/',`
[wimp] fix tests info 2015-09-07 13:49:59 +02:00			`'md5': 'ee21217ffd66d058e8b16be340b74883',`
[Wimp] Use new URL relay method 2014-01-22 02:01:23 +01:00			`'info_dict': {`
[wimp] Fix extraction and update _TESTS 2016-06-16 06:27:21 +02:00			`'id': 'maru-is-exhausted',`
[wimp] fix tests info 2015-09-07 13:49:59 +02:00			`'ext': 'mp4',`
[wimp] Modernize and replace test 2014-02-21 11:57:19 +01:00			`'title': 'Maru is exhausted.',`
			`'description': 'md5:57e099e857c0a4ea312542b684a869b8',`
Move tests to the IE definitions 2013-06-27 20:46:46 +02:00			`}`
[wimp] Detect youtube videos (fixes #2686) 2014-04-03 20:44:51 +02:00			`}, {`
			`'url': 'http://www.wimp.com/clowncar/',`
[wimp] Fix extraction and update _TESTS 2016-06-16 06:27:21 +02:00			`'md5': '5c31ad862a90dc5b1f023956faec13fe',`
[wimp] Detect youtube videos (fixes #2686) 2014-04-03 20:44:51 +02:00			`'info_dict': {`
[wimp] Fix extraction and update _TESTS 2016-06-16 06:27:21 +02:00			`'id': 'cG4CEr2aiSg',`
update tests related to the change in youtube http format sorting the change was done in 82156fdbf0913c75181484dcc813565713bf78e9 2016-03-05 21:52:24 +01:00			`'ext': 'webm',`
[wimp] Fix extraction and update _TESTS 2016-06-16 06:27:21 +02:00			`'title': 'Basset hound clown car...incredible!',`
			`'description': '5 of my Bassets crawled in this dog loo! www.bellinghambassets.com\n\nFor licensing/usage please contact: licensing(at)jukinmediadotcom',`
			`'upload_date': '20140303',`
			`'uploader': 'Gretchen Hoey',`
			`'uploader_id': 'gretchenandjeff1',`
[wimp] Detect youtube videos (fixes #2686) 2014-04-03 20:44:51 +02:00			`},`
[wimp] Fix extraction and update _TESTS 2016-06-16 06:27:21 +02:00			`'add_ie': ['Youtube'],`
[wimp] Detect youtube videos (fixes #2686) 2014-04-03 20:44:51 +02:00			`}]`
added an IE for wimp.com 2013-06-26 12:25:53 +02:00
			`def _real_extract(self, url):`
[wimp] fix tests info 2015-09-07 13:49:59 +02:00			`video_id = self._match_id(url)`
[wimp] Fix extraction (Closes #7784) 2015-12-07 17:14:45 +01:00
added an IE for wimp.com 2013-06-26 12:25:53 +02:00			`webpage = self._download_webpage(url, video_id)`
[wimp] Fix extraction (Closes #7784) 2015-12-07 17:14:45 +01:00
			`youtube_id = self._search_regex(`
[wimp] Fix Youtube embeds extraction 2018-06-10 21:40:17 +02:00			`(r"videoId\s*:\s*[\"']([0-9A-Za-z_-]{11})[\"']",`
			`r'data-id=["\']([0-9A-Za-z_-]{11})'),`
[wimp] Fix extraction (Closes #7784) 2015-12-07 17:14:45 +01:00			`webpage, 'video URL', default=None)`
			`if youtube_id:`
Refactor code to use url_result 2019-01-01 17:56:05 +01:00			`return self.url_result(youtube_id, YoutubeIE.ie_key())`
changed wimp.py according to the changes suggested by jaime 2013-06-26 14:26:59 +02:00
[wimp] Fix extraction and update _TESTS 2016-06-16 06:27:21 +02:00			`info_dict = self._extract_jwplayer_data(`
			`webpage, video_id, require_title=False)`
[wimp] Fix extraction (Closes #7784) 2015-12-07 17:14:45 +01:00
[wimp] Fix extraction and update _TESTS 2016-06-16 06:27:21 +02:00			`info_dict.update({`
[wimp] simplify 2013-12-08 07:22:19 +01:00			`'id': video_id,`
			`'title': self._og_search_title(webpage),`
			`'description': self._og_search_description(webpage),`
[wimp] Fix extraction and update _TESTS 2016-06-16 06:27:21 +02:00			`})`

			`return info_dict`