1
0
mirror of https://codeberg.org/polarisfm/youtube-dl synced 2024-11-22 16:44:32 +01:00

[Northpoint] Add new extractor

This commit is contained in:
Marek Chowaniok 2018-10-24 15:19:22 -03:00
parent b99b0bcfa0
commit ff2e3e38be
2 changed files with 63 additions and 0 deletions

View File

@ -741,6 +741,7 @@ from .noco import NocoIE
from .nonktube import NonkTubeIE
from .noovo import NoovoIE
from .normalboots import NormalbootsIE
from .northpoint import NorthpointIE
from .nosvideo import NosVideoIE
from .nova import (
NovaEmbedIE,

View File

@ -0,0 +1,62 @@
# coding: utf-8
from __future__ import unicode_literals
from .common import InfoExtractor
from .theplatform import ThePlatformIE
class NorthpointIE(ThePlatformIE):
_VALID_URL = r'(?:http?://)?(?:www\.)?northpoint\.org/messages/[^/]+/(?P<id>[^/]+)'
_TESTS =[ {
'url': 'http://northpoint.org/messages/three-things/what-makes-you-a-wonder/',
'md5': '214af23fa75d0fae44298a5128c35d56',
'info_dict': {
'id': 'rosH7wGAB33s',
'ext': 'mp4',
'title': "Three Things I Learned from a Movie I Didn't Want to See - The Power Of Friendship",
'series': "Three Things I Learned from a Movie I Didn't Want to See",
}
}]
def _real_extract(self, url):
display_id = self._match_id(url)
webpage = self._download_webpage(url, display_id)
playerCode = self._search_regex(r'playerCode\s*=\s*[\'"]([^\'"]+)',webpage, 'player Code')
seriesPermalink = self._search_regex(r'series_permalink\s*:\s*[\'"]([^\'"]+)',webpage, 'series name')
seriesJSON = self._download_json(
'http://northpoint.org/api/mma/details/channel/npcc/permalink/%s' %seriesPermalink,display_id)['messages']
videoIDLink = ''
videoIDLinkTemp = ''
for serie in seriesJSON:
videoIDLinkTemp = serie['hv_msg']['id']
if serie['title'].lower() == display_id.replace('-', ' ').lower():
videoIDLink = serie['hv_msg']['id']
if not videoIDLink:
videoIDLink = videoIDLinkTemp
linkWebpage = self._download_webpage('http://player.theplatform.com/p/IfSiAC/'+playerCode+'/embed/select/'+videoIDLink, display_id)
releaseUrl = self._search_regex(r'tp:releaseUrl\s*=\s*[\'"]([^\'"]+)',linkWebpage, 'release url')
platformMetaData = self._search_regex(r'.*.com\/s\/\s*([^\n\r]*)[ˆ?]',releaseUrl, 'release url')
theplatform_metadata = self._download_theplatform_metadata(platformMetaData, display_id)
# print theplatform_metadata
video_id = theplatform_metadata['pid']
title = theplatform_metadata['title'][19:]
series = theplatform_metadata['pl1$seriesName']
# print title, series
formats, subtitles = self._extract_theplatform_smil(releaseUrl, video_id)
self._sort_formats(formats)
return {
'id': video_id,
'title': title,
'subtitles': subtitles,
'formats': formats,
'series': series,
}