Initial import: Music_Server, MusicFree, catalog-sync
This commit is contained in:
@@ -0,0 +1,205 @@
|
||||
'''
|
||||
Function:
|
||||
Implementation of XimalayaMusicClient: https://www.ximalaya.com/
|
||||
Author:
|
||||
Zhenchao Jin
|
||||
WeChat Official Account (微信公众号):
|
||||
Charles的皮卡丘
|
||||
'''
|
||||
import re
|
||||
import time
|
||||
import math
|
||||
import copy
|
||||
import base64
|
||||
import binascii
|
||||
from Crypto.Cipher import AES
|
||||
from rich.progress import Progress
|
||||
from ..sources import BaseMusicClient
|
||||
from urllib.parse import urlencode, urlparse, parse_qs
|
||||
from ..utils import byte2mb, resp2json, seconds2hms, legalizestring, safeextractfromdict, usesearchheaderscookies, SongInfo
|
||||
|
||||
|
||||
'''XimalayaMusicClient'''
|
||||
class XimalayaMusicClient(BaseMusicClient):
|
||||
source = 'XimalayaMusicClient'
|
||||
ALLOWED_SEARCH_TYPES = ['album', 'track']
|
||||
def __init__(self, **kwargs):
|
||||
self.allowed_search_types = list(set(kwargs.pop('allowed_search_types', XimalayaMusicClient.ALLOWED_SEARCH_TYPES)))
|
||||
super(XimalayaMusicClient, self).__init__(**kwargs)
|
||||
self.default_search_headers = {
|
||||
"User-Agent": "Mozilla/5.0 (Linux; Android 10; SM-G981B) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/80.0.3987.162 Mobile Safari/537.36",
|
||||
}
|
||||
self.default_download_headers = {
|
||||
"User-Agent": "Mozilla/5.0 (Linux; Android 10; SM-G981B) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/80.0.3987.162 Mobile Safari/537.36",
|
||||
}
|
||||
self.default_headers = self.default_search_headers
|
||||
self._initsession()
|
||||
'''_constructsearchurls'''
|
||||
def _constructsearchurls(self, keyword: str, rule: dict = None, request_overrides: dict = None):
|
||||
# init
|
||||
rule, request_overrides = rule or {}, request_overrides or {}
|
||||
# search rules
|
||||
default_rule = {
|
||||
'appid': '0', 'condition': 'relation', 'core': 'track', 'device': 'android', 'deviceId': '9a68144e-de5b-3c60-be5e-adce947ab5ff', 'kw': keyword,
|
||||
'live': 'true', 'needSemantic': 'true', 'network': 'wifi', 'operator': '1', 'page': '1', 'paidFilter': 'false', 'plan': 'c', 'recall': 'normal',
|
||||
'rows': self.search_size_per_page, 'search_version': '2.8', 'spellchecker': 'true', 'version': '6.6.48', 'voiceAsinput': 'false',
|
||||
}
|
||||
default_rule.update(rule)
|
||||
# construct search urls based on search rules
|
||||
base_url = 'https://searchwsa.ximalaya.com/front/v1?'
|
||||
search_urls, page_size = [], self.search_size_per_page
|
||||
for search_type in XimalayaMusicClient.ALLOWED_SEARCH_TYPES:
|
||||
if search_type not in self.allowed_search_types: continue
|
||||
default_rule_search_type = copy.deepcopy(default_rule)
|
||||
default_rule_search_type['core'], count = search_type, 0
|
||||
while self.search_size_per_source > count:
|
||||
page_rule = copy.deepcopy(default_rule_search_type)
|
||||
page_rule['rows'] = str(page_size)
|
||||
page_rule['page'] = str(int(count // page_size) + 1)
|
||||
search_urls.append(base_url + urlencode(page_rule))
|
||||
count += page_size
|
||||
# return
|
||||
return search_urls
|
||||
'''_crackplayurl'''
|
||||
def _crackplayurl(self, ciphertext: str):
|
||||
if not ciphertext: return ciphertext
|
||||
key = binascii.unhexlify("aaad3e4fd540b0f79dca95606e72bf93")
|
||||
ciphertext = base64.urlsafe_b64decode(ciphertext + "=" * (4 - len(ciphertext) % 4))
|
||||
cipher = AES.new(key, AES.MODE_ECB)
|
||||
plaintext = cipher.decrypt(ciphertext)
|
||||
plaintext = re.sub(r"[^\x20-\x7E]", "", plaintext.decode("utf-8"))
|
||||
return plaintext
|
||||
'''_parsewithcggapi'''
|
||||
def _parsewithcggapi(self, search_result: dict, request_overrides: dict = None):
|
||||
# init
|
||||
request_overrides, song_id, song_info = request_overrides or {}, search_result.get('id') or search_result.get('trackId'), SongInfo(source=self.source)
|
||||
# parse
|
||||
(resp := self.get(f"https://api-v2.cenguigui.cn/api/music/ximalaya.php?trackId={song_id}", **request_overrides)).raise_for_status()
|
||||
download_result = resp2json(resp=resp)
|
||||
if ('0 MB' in download_result['size']) or (not download_result.get('url')): return song_info
|
||||
download_url = download_result['url']
|
||||
file_size = re.sub(r"^\s*([0-9]*\.?[0-9]+)\s*([A-Za-z]+)\s*$", lambda m: f"{float(m.group(1)):.2f} {m.group(2)}", download_result['size'])
|
||||
m = re.match(r'^\s*([0-9]*\.?[0-9]+)\s*([KMGT]?B)\s*$', download_result['size'])
|
||||
file_size_bytes = int(float(m.group(1)) * {'B': 1, 'KB': 1024, 'MB': 1024**2, 'GB': 1024**3, 'TB': 1024**4}[m.group(2).upper()])
|
||||
song_info = SongInfo(
|
||||
raw_data={'search': search_result, 'download': download_result, 'lyric': {}}, source=self.source, song_name=legalizestring(search_result.get('title')), singers=legalizestring(search_result.get('nickname')),
|
||||
album=legalizestring(search_result.get('album_title') or search_result.get('albumTitle')), ext=download_url.split('?')[0].split('.')[-1], file_size_bytes=file_size_bytes, file_size=file_size, identifier=song_id,
|
||||
duration_s=int(float(search_result.get('duration', 0) or 0)), duration=seconds2hms(search_result.get('duration', 0) or 0), lyric=None, cover_url=safeextractfromdict(search_result, ['cover_path'], None),
|
||||
download_url=download_url, download_url_status=self.audio_link_tester.test(download_url, request_overrides),
|
||||
)
|
||||
song_info.download_url_status['probe_status'] = self.audio_link_tester.probe(song_info.download_url, request_overrides)
|
||||
song_info.file_size = song_info.download_url_status['probe_status']['file_size']
|
||||
song_info.ext = song_info.download_url_status['probe_status']['ext'] if (song_info.download_url_status['probe_status']['ext'] and song_info.download_url_status['probe_status']['ext'] not in ('NULL',)) else song_info.ext
|
||||
return song_info
|
||||
'''_parsewithofficialapiv1'''
|
||||
def _parsewithofficialapiv1(self, search_result: dict, request_overrides: dict = None):
|
||||
# init
|
||||
request_overrides, song_id, song_info = request_overrides or {}, search_result.get('id') or search_result.get('trackId'), SongInfo(source=self.source)
|
||||
# parse
|
||||
params = {"device": "web", "trackId": song_id, "trackQualityLevel": '3'}
|
||||
(resp := self.get(f"https://www.ximalaya.com/mobile-playpage/track/v3/baseInfo/{int(time.time() * 1000)}", params=params, **request_overrides)).raise_for_status()
|
||||
download_result = resp2json(resp=resp)
|
||||
track_info = safeextractfromdict(download_result, ['trackInfo'], {})
|
||||
if not track_info or not isinstance(track_info, dict): return song_info
|
||||
for encrypted_url in sorted(safeextractfromdict(track_info, ['playUrlList'], []), key=lambda x: int(x['fileSize']), reverse=True):
|
||||
if not isinstance(encrypted_url, dict): continue
|
||||
download_url: str = self._crackplayurl(encrypted_url.get('url', ''))
|
||||
if not download_url or not str(download_url).startswith('http'): continue
|
||||
song_info = SongInfo(
|
||||
raw_data={'search': search_result, 'download': download_result, 'lyric': {}}, source=self.source, song_name=legalizestring(search_result.get('title')), singers=legalizestring(search_result.get('nickname')),
|
||||
album=legalizestring(search_result.get('album_title') or search_result.get('albumTitle')), ext=download_url.split('?')[0].split('.')[-1] or 'mp3', file_size_bytes=float(encrypted_url.get('fileSize', 0) or 0),
|
||||
file_size=byte2mb(encrypted_url.get('fileSize', 0)), identifier=song_id, duration_s=int(float(search_result.get('duration', 0) or 0)), duration=seconds2hms(search_result.get('duration', 0) or 0), lyric=None,
|
||||
cover_url=safeextractfromdict(search_result, ['cover_path'], None), download_url=download_url, download_url_status=self.audio_link_tester.test(download_url, request_overrides),
|
||||
)
|
||||
if not song_info.with_valid_download_url: continue
|
||||
song_info.download_url_status['probe_status'] = self.audio_link_tester.probe(song_info.download_url, request_overrides)
|
||||
song_info.file_size = song_info.download_url_status['probe_status']['file_size']
|
||||
song_info.ext = song_info.download_url_status['probe_status']['ext'] if (song_info.download_url_status['probe_status']['ext'] and song_info.download_url_status['probe_status']['ext'] not in ('NULL',)) else song_info.ext
|
||||
if song_info.with_valid_download_url: break
|
||||
# return
|
||||
return song_info
|
||||
'''_parsebytrack'''
|
||||
def _parsebytrack(self, search_results, song_infos: list = [], request_overrides: dict = None, progress: Progress = None):
|
||||
request_overrides = request_overrides or {}
|
||||
for search_result in search_results['response']['docs']:
|
||||
if (not isinstance(search_result, dict)) or ('id' not in search_result): continue
|
||||
song_info = SongInfo(source=self.source)
|
||||
for parser in [self._parsewithcggapi, self._parsewithofficialapiv1]:
|
||||
try: song_info = parser(search_result=search_result, request_overrides=request_overrides)
|
||||
except: continue
|
||||
if song_info.with_valid_download_url: break
|
||||
if not song_info.with_valid_download_url: continue
|
||||
song_infos.append(song_info)
|
||||
if self.strict_limit_search_size_per_page and len(song_infos) >= self.search_size_per_page: break
|
||||
return song_infos
|
||||
'''_parsebyalbum'''
|
||||
def _parsebyalbum(self, search_results, song_infos: list = [], request_overrides: dict = None, progress: Progress = None):
|
||||
request_overrides = request_overrides or {}
|
||||
for search_result in search_results['response']['docs']:
|
||||
if (not isinstance(search_result, dict)) or ('id' not in search_result): continue
|
||||
download_results, page_size, tracks, unique_track_ids = [], 200, [], set()
|
||||
song_info = SongInfo(
|
||||
raw_data={'search': search_result, 'download': download_results, 'lyric': {}}, source=self.source, song_name=legalizestring(search_result.get('title')), singers=legalizestring(search_result.get('nickname')),
|
||||
album=f"{search_result.get('tracks', 0) or 0} Episodes", ext=None, file_size=None, identifier=search_result['id'], duration='-:-:-', lyric=None, cover_url=safeextractfromdict(search_result, ['cover_path'], None),
|
||||
download_url=None, download_url_status={}, episodes=[],
|
||||
)
|
||||
num_pages = math.ceil(int(search_result.get('tracks', 0) or 0) / page_size)
|
||||
download_album_pid = progress.add_task(f"{self.source}._parsebyalbum >>> (0/{num_pages}) pages downloaded in album {search_result['id']}", total=num_pages)
|
||||
for page_num_idx, page_num in enumerate(range(1, num_pages + 1)):
|
||||
if page_num_idx > 0:
|
||||
progress.advance(download_album_pid, 1)
|
||||
progress.update(download_album_pid, description=f"{self.source}._parsebyalbum >>> ({page_num_idx}/{num_pages}) pages downloaded in album {search_result['id']}")
|
||||
try: resp = self.get(f'http://mobile.ximalaya.com/mobile/v1/album/track?albumId={search_result["id"]}&pageId={page_num}&pageSize={page_size}&isAsc=true', **request_overrides)
|
||||
except: continue
|
||||
download_results.append(resp2json(resp=resp))
|
||||
progress.advance(download_album_pid, 1)
|
||||
progress.update(download_album_pid, description=f"{self.source}._parsebyalbum >>> ({page_num_idx+1}/{num_pages}) pages downloaded in album {search_result['id']}")
|
||||
for download_result in download_results:
|
||||
for track in (safeextractfromdict(download_result, ['data', 'list'], []) or []):
|
||||
if not isinstance(track, dict) or not track.get('trackId'): continue
|
||||
if track.get('trackId') in unique_track_ids: continue
|
||||
unique_track_ids.add(track.get('trackId'))
|
||||
tracks.append(track)
|
||||
download_album_pid = progress.add_task(f"{self.source}._parsebyalbum >>> (0/{len(tracks)}) episodes completed in album {search_result['id']}", total=len(tracks))
|
||||
for track_idx, track in enumerate(tracks):
|
||||
if track_idx > 0:
|
||||
progress.advance(download_album_pid, 1)
|
||||
progress.update(download_album_pid, description=f"{self.source}._parsebyalbum >>> ({track_idx}/{len(tracks)}) episodes completed in album {search_result['id']}")
|
||||
eps_info = SongInfo(source=self.source)
|
||||
for parser in [self._parsewithcggapi, self._parsewithofficialapiv1]:
|
||||
try: eps_info = parser(search_result=track, request_overrides=request_overrides)
|
||||
except: continue
|
||||
if eps_info.with_valid_download_url: break
|
||||
if not eps_info.with_valid_download_url: continue
|
||||
song_info.episodes.append(eps_info)
|
||||
progress.advance(download_album_pid, 1)
|
||||
progress.update(download_album_pid, description=f"{self.source}._parsebyalbum >>> ({track_idx+1}/{len(tracks)}) episodes completed in album {search_result['id']}")
|
||||
if not song_info.with_valid_download_url: continue
|
||||
try: song_info.duration_s = sum([eps.duration_s for eps in song_info.episodes]); song_info.duration = seconds2hms(song_info.duration_s)
|
||||
except Exception: pass
|
||||
try: song_info.file_size_bytes = sum([eps.file_size_bytes for eps in song_info.episodes]); song_info.file_size = byte2mb(song_info.file_size_bytes)
|
||||
except Exception: pass
|
||||
song_infos.append(song_info)
|
||||
if self.strict_limit_search_size_per_page and len(song_infos) >= self.search_size_per_page: break
|
||||
return song_infos
|
||||
'''_search'''
|
||||
@usesearchheaderscookies
|
||||
def _search(self, keyword: str = '', search_url: str = '', request_overrides: dict = None, song_infos: list = [], progress: Progress = None, progress_id: int = 0):
|
||||
# init
|
||||
request_overrides = request_overrides or {}
|
||||
# successful
|
||||
try:
|
||||
# --search results
|
||||
(resp := self.get(search_url, **request_overrides)).raise_for_status()
|
||||
search_results = resp2json(resp)
|
||||
# --parse based on search type
|
||||
search_type = parse_qs(urlparse(search_url).query, keep_blank_values=True).get('core')[0]
|
||||
parsers = {'album': self._parsebyalbum, 'track': self._parsebytrack}
|
||||
parsers[search_type](search_results, song_infos=song_infos, request_overrides=request_overrides, progress=progress)
|
||||
# --update progress
|
||||
progress.update(progress_id, description=f"{self.source}.search >>> {search_url} (Success)")
|
||||
# failure
|
||||
except Exception as err:
|
||||
progress.update(progress_id, description=f"{self.source}.search >>> {search_url} (Error: {err})")
|
||||
# return
|
||||
return song_infos
|
||||
Reference in New Issue
Block a user