1
0
mirror of https://codeberg.org/polarisfm/youtube-dl synced 2025-01-24 13:37:54 +01:00
youtube-dl/youtube_dl/extractor/picta.py

181 lines
7.6 KiB
Python
Raw Normal View History

2019-02-02 01:07:44 +01:00
# coding: utf-8
from __future__ import unicode_literals
2019-02-02 06:30:27 +01:00
from ..compat import compat_str
2020-05-25 08:42:40 +02:00
from ..utils import int_or_none, unified_timestamp, try_get, ExtractorError
2019-02-02 01:07:44 +01:00
from .common import InfoExtractor
2019-02-02 06:30:27 +01:00
class PictaBaseIE(InfoExtractor):
    """Common base for the Picta extractors: API root and metadata parsing."""

    # Root of the Picta REST API; endpoint paths are appended to this prefix.
    API_BASE_URL = "https://api.picta.cu/api/v2/"

    @staticmethod
    def _extract_video(video, video_id=None, require_title=True):
        """Turn a decoded Picta API response into a partial info dict.

        Only the first element of ``video["results"]`` is inspected.

        :param video: decoded JSON object expected to carry a ``results`` list.
        :param video_id: fallback id used when the result has no string ``id``.
        :param require_title: when true, a result without ``nombre`` raises
            ``KeyError``; when false the title is simply ``None``.
        :return: dict with the keys ``id``, ``title``, ``description``,
            ``thumbnail``, ``uploader``, ``timestamp``, ``category`` and
            ``manifest_url`` (formats are NOT resolved here).
        :raises ExtractorError: if ``results`` is missing, not a list or empty.
        """
        # A payload without a usable ``results`` list (error object, null,
        # empty list) is reported the same way as "no video found" instead
        # of leaking a raw KeyError/TypeError to the caller.
        results = try_get(video, lambda x: x["results"], list)
        if not results:
            raise ExtractorError("Cannot find video!")
        entry = results[0]

        # ``nombre`` is the API's name field and becomes the title.
        title = entry["nombre"] if require_title else entry.get("nombre")

        description = try_get(entry, lambda x: x["descripcion"], compat_str)
        uploader = try_get(entry, lambda x: x["usuario"]["username"], compat_str)
        add_date = try_get(entry, lambda x: x["fecha_creacion"])
        timestamp = int_or_none(unified_timestamp(add_date))
        thumbnail = try_get(entry, lambda x: x["url_imagen"])
        manifest_url = try_get(entry, lambda x: x["url_manifiesto"])
        category = try_get(entry, lambda x: x["canal"]["nombre"], compat_str)

        return {
            # Only a string ``id`` from the API is accepted; anything else
            # falls back to the id supplied by the caller.
            "id": try_get(entry, lambda x: x["id"], compat_str) or video_id,
            "title": title,
            "description": description,
            "thumbnail": thumbnail,
            "uploader": uploader,
            "timestamp": timestamp,
            "category": [category] if category else None,
            "manifest_url": manifest_url,
        }
class PictaIE(PictaBaseIE):
    """Extractor for single Picta videos reached via ``/medias/`` or ``/embed/`` URLs."""

    IE_NAME = "picta"
    IE_DESC = "Picta videos"
    _VALID_URL = r"https?://(?:www\.)?picta\.cu/(?:medias|embed)/(?:\?v=)?(?P<id>[\da-z-]+)"
    _TESTS = [
        {
            "url": "https://www.picta.cu/medias/orishas-everyday-2019-01-16-16-36-42-443003",
            "file": "Orishas - Everyday-orishas-everyday-2019-01-16-16-36-42-443003.webm",
            "md5": "7ffdeb0043500c4bb660c04e74e90f7a",
            "info_dict": {
                "id": "orishas-everyday-2019-01-16-16-36-42-443003",
                "ext": "webm",
                "title": "Orishas - Everyday",
                "thumbnail": r"re:^https?://.*imagen/img.*\.png$",
                "upload_date": "20190116",
                "description": "Orishas - Everyday (Video Oficial)",
                "uploader": "admin",
                "timestamp": 1547656602,
            },
            "params": {"format": "4"},
        },
        {
            "url": "https://www.picta.cu/medias/palmiche-galeno-tercer-lugar-torneo-virtual-robotica-2020-05-21-16-15-31-431895",
            "file": "Palmiche Galeno tercer lugar en torneo virtual de robótica-palmiche-galeno-tercer-lugar-torneo-virtual-robotica-2020-05-21-16-15-31-431895.mp4",
            "md5": "6031b7a3add2eade9c5bef7ecf5d4b02",
            "info_dict": {
                "id": "palmiche-galeno-tercer-lugar-torneo-virtual-robotica-2020-05-21-16-15-31-431895",
                "ext": "mp4",
                "title": "Palmiche Galeno tercer lugar en torneo virtual de robótica",
                "thumbnail": r"re:^https?://.*imagen/img.*\.jpeg$",
                "upload_date": "20200521",
                "description": "En esta emisión:\r\n"
                "Iniciará en La Habana nuevo método para medir el consumo "
                "eléctrico | https://bit.ly/jtlecturacee\r\n"
                "GICAcovid: nueva aplicación web para los centros de "
                "aislamiento | https://bit.ly/jtgicacovid\r\n"
                "Obtuvo Palmiche tercer lugar en la primera competencia "
                "virtual de robótica | https://bit.ly/jtpalmichegaleno\r\n"
                "\r\n"
                "Síguenos en:\r\n"
                "Facebook: http://www.facebook.com/JuventudTecnicaCuba\r\n"
                "Twitter e Instagram: @juventudtecnica\r\n"
                "Telegram: http://t.me/juventudtecnica",
                "uploader": "ernestoguerra21",
                "timestamp": 1590077731,
            },
        },
        {"url": "https://www.picta.cu/embed/?v=818", "only_matching": True},
        {
            "url": "https://www.picta.cu/embed/palmiche-galeno-tercer-lugar-torneo-virtual-robotica-2020-05-21-16-15-31-431895",
            "only_matching": True,
        },
    ]

    def _real_extract(self, url):
        """Fetch the video's JSON by slug and resolve its DASH formats.

        Returns the info dict produced by ``_extract_video`` with a sorted
        ``formats`` list added; raises ``ExtractorError`` when the manifest
        is absent or yields no formats.
        """
        slug = self._match_id(url)
        api_url = "%spublicacion/?format=json&slug_url_raw=%s" % (
            self.API_BASE_URL,
            slug,
        )
        response = self._download_json(api_url, slug, "Downloading video JSON")
        info = self._extract_video(response, slug)

        # The MPD manifest is the only format source consulted here.
        mpd_url = info.get("manifest_url")
        formats = []
        if mpd_url:
            formats += self._extract_mpd_formats(mpd_url, slug)

        if not formats:
            raise ExtractorError("Cannot find video formats")

        self._sort_formats(formats)
        info["formats"] = formats
        return info
2019-02-08 00:38:41 +01:00
class PictaEmbedIE(InfoExtractor):
    """Extractor for Picta ``/embed/`` URLs; extraction is handed over to PictaIE."""

    IE_NAME = "picta:embed"
    IE_DESC = "Picta embedded videos"
    # The id group accepts slugs as well as plain numbers: the second test
    # case below is a slug URL, which a digits-only group could never match.
    # The character class is the same one PictaIE uses for its id.
    _VALID_URL = r"https?://www\.picta\.cu/embed/(?:\?v=)?(?P<id>[\da-z-]+)"

    _TESTS = [
        {
            "url": "https://www.picta.cu/embed/?v=818",
            "file": "Orishas - Everyday-orishas-everyday-2019-01-16-16-36-42-443003.webm",
            "md5": "7ffdeb0043500c4bb660c04e74e90f7a",
            "info_dict": {
                "id": "orishas-everyday-2019-01-16-16-36-42-443003",
                "ext": "webm",
                "title": "Orishas - Everyday",
                "thumbnail": r"re:^https?://.*imagen/img.*\.png$",
                "upload_date": "20190116",
                "description": "Orishas - Everyday (Video Oficial)",
                "uploader": "admin",
                "timestamp": 1547656602,
            },
            "params": {"format": "4"},
        },
        {
            "url": "https://www.picta.cu/embed/palmiche-galeno-tercer-lugar-torneo-virtual-robotica-2020-05-21-16-15-31-431895",
            "file": "Palmiche Galeno tercer lugar en torneo virtual de robótica-palmiche-galeno-tercer-lugar-torneo-virtual-robotica-2020-05-21-16-15-31-431895.mp4",
            "md5": "6031b7a3add2eade9c5bef7ecf5d4b02",
            "info_dict": {
                "id": "palmiche-galeno-tercer-lugar-torneo-virtual-robotica-2020-05-21-16-15-31-431895",
                "ext": "mp4",
                "title": "Palmiche Galeno tercer lugar en torneo virtual de robótica",
                "thumbnail": r"re:^https?://.*imagen/img.*\.jpeg$",
                "upload_date": "20200521",
                "description": "En esta emisión:\r\n"
                "Iniciará en La Habana nuevo método para medir el consumo "
                "eléctrico | https://bit.ly/jtlecturacee\r\n"
                "GICAcovid: nueva aplicación web para los centros de "
                "aislamiento | https://bit.ly/jtgicacovid\r\n"
                "Obtuvo Palmiche tercer lugar en la primera competencia "
                "virtual de robótica | https://bit.ly/jtpalmichegaleno\r\n"
                "\r\n"
                "Síguenos en:\r\n"
                "Facebook: http://www.facebook.com/JuventudTecnicaCuba\r\n"
                "Twitter e Instagram: @juventudtecnica\r\n"
                "Telegram: http://t.me/juventudtecnica",
                "uploader": "ernestoguerra21",
                "timestamp": 1590077731,
            },
        },
    ]

    def _real_extract(self, url):
        """Return a URL result that routes the unchanged ``url`` to PictaIE."""
        return self.url_result(url, PictaIE.ie_key())