2018-04-20 19:56:26 +02:00
|
|
|
# coding: utf-8
|
|
|
|
from __future__ import unicode_literals
|
|
|
|
|
|
|
|
from .common import InfoExtractor
|
|
|
|
|
2018-05-01 15:42:42 +02:00
|
|
|
from ..utils import (
|
2019-10-12 13:42:56 +02:00
|
|
|
ExtractorError,
|
2019-10-09 21:50:52 +02:00
|
|
|
urljoin,
|
2019-10-12 13:42:56 +02:00
|
|
|
parse_duration,
|
2019-10-12 14:19:26 +02:00
|
|
|
int_or_none,
|
2019-10-12 14:34:21 +02:00
|
|
|
merge_dicts,
|
2018-05-01 15:42:42 +02:00
|
|
|
)
|
2018-04-20 19:56:26 +02:00
|
|
|
|
|
|
|
|
|
|
|
class MakoTVIE(InfoExtractor):
    """Extractor for VOD and clip pages on mako.co.il.

    The page embeds two 40-character identifiers in inline JavaScript
    (``vcmidOfContent`` and ``currentChannelId``).  They are substituted into
    the playlist URL template published in the player's XML configuration;
    the resulting JSON playlist lists the media entries, each of which is
    exchanged for one or more tickets that are appended to the HLS URLs.
    """

    _VALID_URL = r'https?://(?:www\.)?mako\.co\.il/.+?/(?:VOD|Video)-(?P<id>[0-9a-f]{18})\.htm'
    _TESTS = [
        {
            'url': 'https://www.mako.co.il/mako-vod-keshet/parliament-s1/VOD-5df5a86c1966831006.htm',
            'md5': 'd826489500d23d122055a30df0d59cb5',
            'info_dict': {
                'id': '5df5a86c1966831006',
                'ext': 'm3u8',
                'title': '\u05d4\u05e4\u05e8\u05dc\u05de\u05e0\u05d8 | \u05e4\u05e8\u05e7 1 \u05dc\u05e6\u05e4\u05d9\u05d9\u05d4 \u05d9\u05e9\u05d9\u05e8\u05d4 | makoTV ',
                'thumbnail': r're:^https?://img\.mako\.co\.il/\d{4}/\d{2}/\d{2}/.+\.jpg$',
                'description': '\u05e9\u05d0\u05d5\u05dc\u05d9, \u05d0\u05de\u05e6\u05d9\u05d4, \u05d4\u05e7\u05d8\u05d5\u05e8, \u05e7\u05e8\u05e7\u05d5 \u05d5\u05d0\u05d1\u05d9 \u05de\u05e7\u05d1\u05dc\u05d9\u05dd \u05e1\u05d3\u05e8\u05d4 \u05de\u05e9\u05dc\u05d4\u05dd. \u05db\u05dc \u05d4\u05e4\u05e8\u05e7\u05d9\u05dd \u05e9\u05dc \u05d4\u05e4\u05e8\u05dc\u05de\u05e0\u05d8 \u05dc\u05e6\u05e4\u05d9\u05d9\u05d4 \u05d9\u05e9\u05d9\u05e8\u05d4 | makoTV ',
                'upload_date': '20120708',
                'timestamp': 1341751140,
                'duration': 1774.0,
                'episode_number': 1,
                'episode': '\u05e4\u05e8\u05e7 1',
                'season': '\u05e2\u05d5\u05e0\u05d4 1',
            },
        },
        {
            'url': 'https://www.mako.co.il/tv-erez-nehederet/season14-shauli-and-irena/Video-6c53a12777d9c51006.htm',
            'md5': '77b0c836ebfb6237c7e9b909e57a4194',
            'info_dict': {
                'id': '6c53a12777d9c51006',
                'ext': 'm3u8',
                'title': '\u05e9\u05d0\u05d5\u05dc\u05d9 \u05d5\u05d0\u05d9\u05e8\u05e0\u05d4 \u05d1\u05d1\u05d9\u05ea \u05d7\u05d5\u05dc\u05d9\u05dd \u2013 \u05e4\u05e8\u05e7 \u05d4\u05e1\u05d9\u05d5\u05dd',
                'thumbnail': r're:^https?://img\.mako\.co\.il/\d{4}/\d{2}/\d{2}/.+\.jpg$',
                'description': '\u05d4\u05d0\u05dd \u05e9\u05d0\u05d5\u05dc\u05d9 \u05d4\u05d5\u05dc\u05da \u05dc\u05de\u05d5\u05ea?',
                'duration': 669.0,
                'episode': '\u05e9\u05d0\u05d5\u05dc\u05d9 \u05d5\u05d0\u05d9\u05e8\u05e0\u05d4 \u05d1\u05d1\u05d9\u05ea \u05d7\u05d5\u05dc\u05d9\u05dd \u2013 \u05e4\u05e8\u05e7 \u05d4\u05e1\u05d9\u05d5\u05dd',
            },
        },
    ]

    # Player configuration whose PlaylistUrl element is a URL template.
    _CONFIG_URL = 'https://rcs.mako.co.il/flash_swf/players/makoPlayer/configNew.xml'
    # Endpoint that exchanges a media entry for playback tickets.
    _TICKETS_URL = 'https://mass.mako.co.il/ClicksStatistics/entitlementsServicesV2.jsp'
    # Base against which relative ticket URLs are resolved.
    _CDN_BASE_URL = 'https://makostore-hd.ctedgecdn.net'

    def _extract_formats(self, playlist, video_id):
        """Collect the HLS formats for every usable media entry of *playlist*.

        Malformed media entries, failed ticket requests and incomplete
        tickets are skipped so that one bad entry does not abort extraction.
        Returns a (possibly empty) list of format dicts.
        """
        formats = []
        for media in playlist.get('media') or []:
            if not isinstance(media, dict):
                continue
            media_url = media.get('url')
            cdn = media.get('cdn')
            if not media_url or not cdn:
                continue

            tickets = self._download_json(
                self._TICKETS_URL, video_id, fatal=False, query={
                    'et': 'gt',
                    'lp': media_url,
                    'rv': cdn,
                })
            # A non-fatal download does not necessarily yield None on
            # failure (it may be False), so accept only a real JSON object.
            if not isinstance(tickets, dict):
                continue
            if (tickets.get('status') or '').lower() != 'success':
                continue

            for ticket in tickets.get('tickets') or []:
                if not isinstance(ticket, dict):
                    continue
                token = ticket.get('ticket')
                ticket_url = urljoin(self._CDN_BASE_URL, ticket.get('url'))
                if not ticket_url or not token:
                    continue
                formats.extend(self._extract_m3u8_formats(
                    ticket_url + '?' + token, video_id, fatal=False))
        return formats

    def _real_extract(self, url):
        """Return the info dict for the mako.co.il page at *url*.

        Raises ExtractorError when the player configuration carries no
        playlist URL template; the mandatory page identifiers and the
        playlist download keep their default (fatal) behaviour.
        """
        video_id = self._match_id(url)
        webpage = self._download_webpage(url, video_id)

        vcmid = self._search_regex(
            r'var vcmidOfContent\s*?=\s*?\'([0-9A-Za-z]{40})\'',
            webpage, 'vcmid')
        channel_id = self._search_regex(
            r'var currentChannelId\s*?=\s*?\'([0-9A-Za-z]{40})\'',
            webpage, 'channel_id')

        config_new = self._download_xml(self._CONFIG_URL, video_id)
        playlist_url = config_new.findtext('./PlaylistUrl')
        if not playlist_url:
            # findtext() yields None when the element is absent; fail with a
            # meaningful extractor error instead of an AttributeError below.
            raise ExtractorError(
                'Unable to find the playlist URL in the player configuration')
        for placeholder, value in (
                ('$$vcmid$$', vcmid),
                ('$$videoChannelId$$', channel_id),
                ('$$galleryChannelId$$', vcmid)):
            playlist_url = playlist_url.replace(placeholder, value)
        playlist_url = urljoin('https://www.mako.co.il', playlist_url)
        playlist = self._download_json(playlist_url, video_id)

        formats = self._extract_formats(playlist, video_id)
        self._sort_formats(formats)

        info = {
            'id': video_id,
            'formats': formats,
        }

        # `or {}` also covers an explicit JSON null for videoDetails.
        video_details = playlist.get('videoDetails') or {}
        video_info = {
            'url': video_details.get('directLink'),
            'duration': parse_duration(video_details.get('duration')),
            'view_count': int_or_none(video_details.get('numViews')),
            'average_rating': video_details.get('rank'),
            'episode': video_details.get('title'),
            'episode_number': int_or_none(video_details.get('episodeNumber')),
            'season': video_details.get('season'),
        }

        og_info = {
            'url': self._og_search_url(webpage, fatal=False),
            'title': self._og_search_title(webpage, fatal=False),
            'thumbnail': self._og_search_thumbnail(webpage),
            'description': self._og_search_description(webpage),
        }

        try:
            json_ld = self._search_json_ld(webpage, video_id, fatal=False)
        except ExtractorError:
            json_ld = {}

        # Dicts are merged in this order: base info, playlist details,
        # OpenGraph tags, JSON-LD.
        return merge_dicts(info, video_info, og_info, json_ld)
|