[narando] add separate [narando:player] extractor

2025-01-08 14:17:54 +01:00 · 2018-11-21 15:20:41 -05:00 · 2018-11-21 15:20:41 -05:00 · f8a4a38880
commit f8a4a38880
parent 200ad7687a
2 changed files with 35 additions and 36 deletions
--- a/youtube_dl/extractor/extractors.py
+++ b/youtube_dl/extractor/extractors.py
@ -672,7 +672,10 @@ from .myvi import (
    MyviEmbedIE,
 )
 from .myvidster import MyVidsterIE
-from .narando import NarandoIE
+from .narando import (
    NarandoIE,
    NarandoPlayerIE,
 )
 from .nationalgeographic import (
    NationalGeographicVideoIE,
    NationalGeographicIE,
--- a/youtube_dl/extractor/narando.py
+++ b/youtube_dl/extractor/narando.py
@ -4,6 +4,33 @@ from __future__ import unicode_literals
 from .common import InfoExtractor
 class NarandoPlayerIE(InfoExtractor):
    IE_NAME = "narando:player"
    _VALID_URL = r'https://narando.com/widget\?r=(?P<id>\w+)'
    _TEST = {
        'url': 'https://narando.com/widget?r=b2t4t789kxgy9g7ms4rwjvvw',
        'md5': 'd20f671f0395bab8f8285d1f6e8f965e',
        'info_dict': {
            'id': 'b2t4t789kxgy9g7ms4rwjvvw',
            'ext': 'mp3',
            'title': 'An  ihrem  Selbstlob  erkennt  man  sie',
            'url': 'https://static.narando.com/sounds/10492/original.mp3',
        }
    }
    def _real_extract(self, url):
        video_id = self._match_id(url)
        webpage = self._download_webpage('https://narando.com/widget?r=' + video_id, video_id)
        title = self._html_search_regex(r'<title>narando \| (.+?)</title>', webpage, 'title')
        download_url = self._html_search_regex(r'.<div class="stream_url hide">\s*([^?]*)', webpage, 'download_url')
        return {
            'id': video_id,
            'title': title,
            'url': download_url,
        }
 class NarandoIE(InfoExtractor):
    IE_NAME = "narando"
    _VALID_URL = r'https?://(?:www\.)?narando\.com/articles/(?P<id>([a-zA-Z]|-)+)'
@ -22,48 +49,17 @@ class NarandoIE(InfoExtractor):
    def _real_extract(self, url):
        video_id = self._match_id(url)
        webpage = self._download_webpage('https://narando.com/articles/' + video_id, video_id)
        title = self._html_search_regex(r'<h1 class="visible-xs h3">(.+?)</h1>', webpage, 'title')
        player_id = self._html_search_regex(r'[\n\r].*https:\/\/narando.com\/r\/\s*([^"]*)', webpage, 'player_id')
-        player_page = self._download_webpage('https://narando.com/widget?r=' + player_id, player_id)
+        player_url = 'https://narando.com/widget?r=' + player_id
        download_url = self._html_search_regex(r'.<div class="stream_url hide">\s*([^?]*)', player_page, 'url')
 #       download_url = NarandoPlayerIE()._real_extract('https://narando.com/widget?r=' + player_id)['url']
        description = self._html_search_regex(r'<meta content="(.+?)" property="og:description" />', webpage, 'description')
        return {
            'display_id': video_id,
            'id': player_id,
            'title': title,
-            'url': download_url,
+            'url': player_url,
            'description': description,
            '_type': 'url',
        }
 """to be implemented later
 class NarandoPlayerIE(InfoExtractor):
    IE_NAME = "narando:player"
    _VALID_URL = r'https://narando.com/widget\?r=(?P<id>\w+)'
    _TEST = {
        'url': 'https://narando.com/widget?r=b2t4t789kxgy9g7ms4rwjvvw',
        'md5': 'd20f671f0395bab8f8285d1f6e8f965e',
        'info_dict': {
            'id': 'b2t4t789kxgy9g7ms4rwjvvw',
            'ext': 'mp3',
            'title': 'An  ihrem  Selbstlob  erkennt  man  sie',
            'url': 'https://static.narando.com/sounds/10492/original.mp3',
        }
    }
    def _real_extract(self, url):
        video_id = self._match_id(url)
        webpage = self._download_webpage('https://narando.com/widget?r=' + video_id, video_id)
        title = self._html_search_regex(r'<title>narando \| (.+?)</title>', webpage, 'title')
        download_url = self._html_search_regex(r'.<div class="stream_url hide">\s*([^?]*)', webpage, 'download_url')
        return {
            'id': video_id,
            'title': title,
            'url': download_url,
        }
 """