# coding: utf-8 from __future__ import unicode_literals from .common import InfoExtractor import re class ChangbaIE(InfoExtractor): _VALID_URL = r'https?://(?:www\.)?changba\.com/s/(?P[0-9A-Za-z-_]+)' _TESTS = [{ 'url': 'https://changba.com/s/0GHVw6vyXv9N2FhaFi2WJg', 'md5': 'ea55d17e939f3e2dabf483e47e8e5693', 'info_dict': { 'id': '1152860688', 'ext': 'mp4', 'title': '对你爱不完【炫酷慢摇】 ', } }, { 'url': 'http://changba.com/s/nZqfbS_vCnieNNjJ7UiEGw?', 'md5': 'e401463ffb03ed8900a0bccc641335e1', 'info_dict': { 'id': '1091968526', 'ext': 'mp3', 'title': '下雪 ', } }, { 'url': 'http://changba.com/s/CPiNWbAa1qy0po0llqIJbg', 'md5': '7adcc9afb85ace8ff854bdd0e8567f50', 'info_dict': { 'id': '136918054', 'ext': 'mp3', 'title': '红豆 ', } }, { 'url': 'http://changba.com/s/-N00JJ30YruunrER5eBcWw', 'md5': 'cd68f8da8d8c69afbb8e4dbbbfa8b277', 'info_dict': { 'id': '172671761', 'ext': 'mp3', 'title': '天与地 ', } }] def _real_extract(self, url): video_id = self._match_id(url) webpage = self._download_webpage(url, video_id) id = self._search_regex(r'workid=([0-9]+)', webpage, 'id') title = self._search_regex(r']+class="title"[^>]*>([^<]+)', webpage, 'title') isvideo = self._search_regex(r'&isvideo=([0-9])', webpage, 'isvideo') ext = 'mp3' if int(isvideo) == 0 else 'mp4' try: url = self._search_regex(r'([a-z]+:\/\/[0-9a-z]+\.changba\.com\/[a-z]+\/[a-z]+\/[0-9]+\/[0-9]+\.mp[3-4])', webpage, 'url') except: url = 'http://lzscuw.changba.com/{}.{}'.format(str(id), ext) return { 'url': url, 'id': id, 'ext': ext, 'title': title, }