PyPI - musicdl - Versions diffs - 2.1.11__py3-none-any.whl → 2.7.3__py3-none-any.whl - Mend

musicdl 2.1.11py3-none-any.whl → 2.7.3py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (59) hide show

musicdl/__init__.py +5 -5
musicdl/modules/__init__.py +10 -3
musicdl/modules/common/__init__.py +2 -0
musicdl/modules/common/gdstudio.py +204 -0
musicdl/modules/js/__init__.py +1 -0
musicdl/modules/js/youtube/__init__.py +2 -0
musicdl/modules/js/youtube/botguard.js +1 -0
musicdl/modules/js/youtube/jsinterp.py +902 -0
musicdl/modules/js/youtube/runner.js +2 -0
musicdl/modules/sources/__init__.py +41 -10
musicdl/modules/sources/apple.py +207 -0
musicdl/modules/sources/base.py +256 -28
musicdl/modules/sources/bilibili.py +118 -0
musicdl/modules/sources/buguyy.py +148 -0
musicdl/modules/sources/fangpi.py +153 -0
musicdl/modules/sources/fivesing.py +108 -0
musicdl/modules/sources/gequbao.py +148 -0
musicdl/modules/sources/jamendo.py +108 -0
musicdl/modules/sources/joox.py +104 -68
musicdl/modules/sources/kugou.py +129 -76
musicdl/modules/sources/kuwo.py +188 -68
musicdl/modules/sources/lizhi.py +107 -0
musicdl/modules/sources/migu.py +172 -66
musicdl/modules/sources/mitu.py +140 -0
musicdl/modules/sources/mp3juice.py +264 -0
musicdl/modules/sources/netease.py +163 -115
musicdl/modules/sources/qianqian.py +125 -77
musicdl/modules/sources/qq.py +232 -94
musicdl/modules/sources/tidal.py +342 -0
musicdl/modules/sources/ximalaya.py +256 -0
musicdl/modules/sources/yinyuedao.py +144 -0
musicdl/modules/sources/youtube.py +238 -0
musicdl/modules/utils/__init__.py +12 -4
musicdl/modules/utils/appleutils.py +563 -0
musicdl/modules/utils/data.py +107 -0
musicdl/modules/utils/logger.py +211 -58
musicdl/modules/utils/lyric.py +73 -0
musicdl/modules/utils/misc.py +335 -23
musicdl/modules/utils/modulebuilder.py +75 -0
musicdl/modules/utils/neteaseutils.py +81 -0
musicdl/modules/utils/qqutils.py +184 -0
musicdl/modules/utils/quarkparser.py +105 -0
musicdl/modules/utils/songinfoutils.py +54 -0
musicdl/modules/utils/tidalutils.py +738 -0
musicdl/modules/utils/youtubeutils.py +3606 -0
musicdl/musicdl.py +184 -86
musicdl-2.7.3.dist-info/LICENSE +203 -0
musicdl-2.7.3.dist-info/METADATA +704 -0
musicdl-2.7.3.dist-info/RECORD +53 -0
{musicdl-2.1.11.dist-info → musicdl-2.7.3.dist-info}/WHEEL +5 -5
musicdl-2.7.3.dist-info/entry_points.txt +2 -0
musicdl/modules/sources/baiduFlac.py +0 -69
musicdl/modules/sources/xiami.py +0 -104
musicdl/modules/utils/downloader.py +0 -80
musicdl-2.1.11.dist-info/LICENSE +0 -22
musicdl-2.1.11.dist-info/METADATA +0 -82
musicdl-2.1.11.dist-info/RECORD +0 -24
{musicdl-2.1.11.dist-info → musicdl-2.7.3.dist-info}/top_level.txt +0 -0
{musicdl-2.1.11.dist-info → musicdl-2.7.3.dist-info}/zip-safe +0 -0

musicdl/modules/sources/tidal.py ADDED Viewed

@@ -0,0 +1,342 @@
+'''
+Function:
+    Implementation of TIDALMusicClient: https://tidal.com/
+Author:
+    Zhenchao Jin
+WeChat Official Account (微信公众号):
+    Charles的皮卡丘
+'''
+import os
+import re
+import copy
+import aigpy
+import base64
+import tempfile
+import json_repair
+from xml.etree import ElementTree
+from .base import BaseMusicClient
+from rich.progress import Progress
+from urllib.parse import urlencode, urljoin
+from ..utils import legalizestring, resp2json, seconds2hms, touchdir, replacefile, usesearchheaderscookies, usedownloadheaderscookies, SongInfo, SongInfoUtils
+from ..utils.tidalutils import (
+    TIDALTvSession, SearchResult, StreamRespond, StreamUrl, Manifest, Period, AdaptationSet, Representation, SegmentTemplate, SegmentList, SegmentTimelineEntry, Track,
+    decryptfile, decryptsecuritytoken, pyavready, ffmpegready, remuxflacstream, setmetadata
+)
+'''TIDALMusicClient'''
+class TIDALMusicClient(BaseMusicClient):
+    source = 'TIDALMusicClient'
+    def __init__(self, **kwargs):
+        '''
+        Build the client and make sure an authenticated TIDAL session is available.
+        The cached session is loaded and refreshed first; if either step raises an ordinary
+        exception, auth() is performed instead. The session is then cached, its auth headers
+        are installed and _initsession() is called.
+        '''
+        super(TIDALMusicClient, self).__init__(**kwargs)
+        self.tidal_session = TIDALTvSession(headers={}, cookies=self.default_cookies)
+        try:
+            self.tidal_session.loadfromcache()
+            self.tidal_session.refresh()
+        except Exception:
+            # only ordinary failures fall back to auth(); KeyboardInterrupt / SystemExit propagate
+            self.tidal_session.auth()
+        self.tidal_session.cache()
+        self._setauthheaders()
+        self._initsession()
+    '''_setauthheaders'''
+    def _setauthheaders(self):
+        # point the search and download default headers at the session's current auth headers
+        self.default_search_headers = self.tidal_session.auth_headers
+        self.default_download_headers = self.tidal_session.auth_headers
+        # default_headers refers to the same object as default_search_headers assigned above
+        self.default_headers = self.default_search_headers
+    '''_saferequestget'''
+    def _saferequestget(self, url, **kwargs):
+        '''GET url; on a 401/403 answer refresh the TIDAL session, reinstall the headers and retry once.'''
+        first_resp = self.get(url, **kwargs)
+        if first_resp.status_code not in (401, 403):
+            return first_resp
+        # credentials were rejected: renew them, rebuild the session, then retry the same request
+        self.tidal_session.refresh()
+        self._setauthheaders()
+        self._initsession()
+        return self.get(url, **kwargs)
+    '''_parsedashmanifest'''
+    def _parsedashmanifest(self, xml):
+        '''
+        Parse a DASH MPD document (bytes or any str()-able object) into a Manifest made of
+        Period -> AdaptationSet -> Representation objects.
+        BaseURL values are resolved level by level with urljoin against the inherited base url.
+        '''
+        # resolve the element's own non-empty <BaseURL> child (if any) against the inherited base url
+        def _getbaseurl(element: ElementTree.Element, inherited: str):
+            base_url = inherited
+            base_el = element.find('BaseURL')
+            if base_el is not None and base_el.text:
+                candidate = base_el.text.strip()
+                if candidate:
+                    base_url = urljoin(inherited, candidate)
+            return base_url
+        # build a SegmentTemplate; missing attributes default to startNumber=1, timescale=1, presentationTimeOffset=0
+        def _parsesegmenttemplate(element: ElementTree.Element):
+            template = SegmentTemplate(
+                media=element.get('media'), initialization=element.get('initialization'), start_number=int(element.get('startNumber') or 1),
+                timescale=int(element.get('timescale') or 1), presentation_time_offset=int(element.get('presentationTimeOffset') or 0),
+            )
+            timeline_el = element.find('SegmentTimeline')
+            if timeline_el is not None:
+                # each <S> entry: d = duration (required), r = repeat (default 0), t = start time (optional)
+                for s_el in timeline_el.findall('S'):
+                    duration = int(s_el.get('d'))
+                    repeat = int(s_el.get('r') or 0)
+                    start_time = int(s_el.get('t')) if s_el.get('t') else None
+                    template.timeline.append(SegmentTimelineEntry(start_time=start_time, duration=duration, repeat=repeat))
+            return template
+        # build a SegmentList from the optional <Initialization sourceURL> and every <SegmentURL media>
+        def _parsesegmentlist(element: ElementTree.Element):
+            init_el = element.find('Initialization')
+            initialization = init_el.get('sourceURL') if init_el is not None else None
+            media_segments = []
+            for seg_el in element.findall('SegmentURL'):
+                media = seg_el.get('media')
+                # SegmentURL entries without a media attribute are skipped
+                if media: media_segments.append(media)
+            return SegmentList(initialization=initialization, media_segments=media_segments)
+        # build a Representation with its resolved base url and optional SegmentTemplate / SegmentList
+        def _parserepresentation(element: ElementTree.Element, parent_base: str):
+            base_url = _getbaseurl(element, parent_base)
+            template = element.find('SegmentTemplate')
+            seg_template = _parsesegmenttemplate(template) if template is not None else None
+            seg_list_el = element.find('SegmentList')
+            seg_list = _parsesegmentlist(seg_list_el) if seg_list_el is not None else None
+            return Representation(
+                id=element.get('id'), bandwidth=element.get('bandwidth'), codec=element.get('codecs'), base_url=base_url, segment_template=seg_template,
+                segment_list=seg_list,
+            )
+        # build an AdaptationSet and attach every child Representation
+        def _parseadaptation(element: ElementTree.Element, parent_base: str):
+            base_url = _getbaseurl(element, parent_base)
+            adaptation = AdaptationSet(content_type=element.get('contentType'), base_url=base_url)
+            for rep_el in element.findall('Representation'):
+                adaptation.representations.append(_parserepresentation(rep_el, base_url))
+            return adaptation
+        # build a Period and attach every child AdaptationSet
+        def _parseperiod(element: ElementTree.Element, parent_base: str):
+            base_url = _getbaseurl(element, parent_base)
+            period = Period(base_url=base_url)
+            for adaptation_el in element.findall('AdaptationSet'):
+                period.adaptation_sets.append(_parseadaptation(adaptation_el, base_url))
+            return period
+        # convert to string text (bytes are decoded as utf-8)
+        if isinstance(xml, bytes):
+            xml_text = xml.decode("utf-8")
+        else:
+            xml_text = str(xml)
+        # parse: the first xmlns="..." declaration is removed so the un-prefixed tag names used in find/findall match
+        xml_text = re.sub(r'xmlns="[^"]+"', '', xml_text, count=1)
+        root = ElementTree.fromstring(xml_text)
+        manifest_base = _getbaseurl(root, '')
+        manifest = Manifest(base_url=manifest_base)
+        for period_el in root.findall('Period'):
+            manifest.periods.append(_parseperiod(period_el, manifest_base))
+        # return
+        return manifest
+    '''_parsempd'''
+    def _parsempd(self, xml: bytes):
+        '''Parse an MPD document; return the manifest only if some audio representation has segments, else None.'''
+        parsed = self._parsedashmanifest(xml)
+        audio_sets = (
+            aset for period in parsed.periods for aset in period.adaptation_sets if aset.content_type == 'audio'
+        )
+        # lazily scan representations and stop at the first one that exposes segments
+        has_segments = any(rep.segments for aset in audio_sets for rep in aset.representations)
+        return parsed if has_segments else None
+    '''_parsemanifest'''
+    def _parsemanifest(self, stream_resp: StreamRespond):
+        '''
+        Turn a playback-info response into a StreamUrl.
+        Handles "vnd.tidal.bt" (base64 JSON with direct urls) and "dash+xml" (base64 MPD) manifests;
+        returns None for any other mime type, an unusable MPD or an MPD without audio representations.
+        '''
+        mime_type = stream_resp.manifestMimeType
+        # vnd.tidal.bt
+        if "vnd.tidal.bt" in mime_type:
+            payload = json_repair.loads(base64.b64decode(stream_resp.manifest).decode('utf-8'))
+            result = StreamUrl()
+            result.trackid = stream_resp.trackid
+            result.soundQuality = stream_resp.audioQuality
+            result.codec = payload['codecs']
+            result.encryptionKey = payload['keyId'] if 'keyId' in payload else ""
+            result.url = payload['urls'][0]
+            result.urls = [result.url]
+            return result
+        # anything that is not dash+xml is not handled
+        if "dash+xml" not in mime_type:
+            return None
+        # dash+xml
+        mpd = self._parsempd(base64.b64decode(stream_resp.manifest))
+        if not mpd:
+            return None
+        result = StreamUrl()
+        result.trackid = stream_resp.trackid
+        result.soundQuality = stream_resp.audioQuality
+        audio_reps = [
+            rep for period in mpd.periods for aset in period.adaptation_sets if aset.content_type == 'audio' for rep in aset.representations
+        ]
+        if not audio_reps:
+            return None
+        # prefer the first representation that has segments, otherwise fall back to the first one
+        chosen = next((rep for rep in audio_reps if rep.segments), audio_reps[0])
+        codec_name = (chosen.codec or '').upper()
+        result.codec = 'AAC' if codec_name.startswith('MP4A') else codec_name
+        result.encryptionKey = ""
+        result.urls = chosen.segments
+        if len(result.urls) > 0:
+            result.url = result.urls[0]
+        return result
+    '''_guessextension'''
+    def _guessextension(self, stream_url: StreamUrl):
+        '''Pick the target file extension from the stream url and codec; defaults to .m4a.'''
+        link = (stream_url.url or '').lower()
+        codec_name = (stream_url.codec or '').lower()
+        if '.flac' in link:
+            return '.flac'
+        if '.mp4' not in link:
+            return '.m4a'
+        # mp4 url: ac4 / mha1 codecs keep .mp4, a flac codec maps to .flac, everything else to .m4a
+        if 'ac4' in codec_name or 'mha1' in codec_name:
+            return '.mp4'
+        return '.flac' if 'flac' in codec_name else '.m4a'
+    '''_guessstreamextension'''
+    def _guessstreamextension(self, stream_url: StreamUrl):
+        '''Guess the extension of the downloaded stream from its url suffixes, falling back to the codec.'''
+        known_exts = (".flac", ".mp4", ".m4a", ".m4b", ".mp3", ".ogg", ".aac")
+        links = ([stream_url.url] if stream_url.url else []) + list(stream_url.urls or [])
+        for link in links:
+            if not link:
+                continue
+            # compare against the part before the query string, case-insensitively
+            path_part: str = link.split("?")[0].lower()
+            matched = next((ext for ext in known_exts if path_part.endswith(ext)), None)
+            if matched is not None:
+                return matched
+        # no url carried a known suffix: a flac codec means .flac, anything else .m4a
+        return ".flac" if "flac" in (stream_url.codec or "").lower() else ".m4a"
+    '''_constructsearchurls'''
+    def _constructsearchurls(self, keyword: str, rule: dict = None, request_overrides: dict = None):
+        '''
+        Build the paged TIDAL search urls for keyword.
+        Args:
+            keyword: search query.
+            rule: optional query parameters that override the defaults ('limit' and 'offset' are reset per page).
+            request_overrides: accepted for interface compatibility; not used when building the urls.
+        Returns:
+            One url per page of search_size_per_page items until search_size_per_source is covered.
+        '''
+        # init
+        rule, request_overrides = rule or {}, request_overrides or {}
+        # search rules ('includeContributors' previously carried the typo 'truee')
+        default_rule = {'countryCode': self.tidal_session.storage.country_code, 'limit': 10, 'offset': 0, 'query': keyword, 'includeContributors': 'true'}
+        default_rule.update(rule)
+        # construct search urls based on search rules
+        base_url = 'https://api.tidal.com/v1/search?'
+        search_urls, page_size, count = [], self.search_size_per_page, 0
+        while self.search_size_per_source > count:
+            page_rule = copy.deepcopy(default_rule)
+            page_rule['limit'] = page_size
+            page_rule['offset'] = count
+            search_urls.append(base_url + urlencode(page_rule))
+            count += page_size
+        # return
+        return search_urls
+    '''_download'''
+    @usedownloadheaderscookies
+    def _download(self, song_info: SongInfo, request_overrides: dict = None, downloaded_song_infos: list = None, progress: Progress = None, song_progress_id: int = 0):
+        '''
+        Download one TIDAL track into song_info.save_path.
+        The stream parts are fetched into a temporary directory, decrypted when the stream carries an
+        encryption key, remuxed to FLAC when required and a backend is available, then moved to the
+        final path and tagged.
+        Args:
+            song_info: track description; download_url is expected to hold a StreamUrl.
+            request_overrides: accepted for interface compatibility.
+            downloaded_song_infos: list to append the result to; a new list is created when omitted.
+            progress: rich Progress used for status reporting.
+            song_progress_id: task id inside progress.
+        Returns:
+            downloaded_song_infos, with one entry appended on success. Failures are only reported via progress.
+        '''
+        # init (fresh list per call instead of a shared mutable default)
+        request_overrides = request_overrides or {}
+        if downloaded_song_infos is None: downloaded_song_infos = []
+        # success
+        try:
+            touchdir(song_info.work_dir)
+            # parse basic information
+            stream_url: StreamUrl = song_info.download_url
+            download_ext, final_ext = self._guessstreamextension(stream_url=stream_url), song_info.ext
+            # remux only when .flac is wanted, the download is not already .flac and the codec is flac
+            if (final_ext != ".flac") or (download_ext == ".flac"):
+                remux_required = False
+            else:
+                remux_required = "flac" in (stream_url.codec or "").lower()
+            # without ffmpeg or PyAV the file keeps the extension it was downloaded with
+            if remux_required and (not ffmpegready() and not pyavready()):
+                final_ext, remux_required = download_ext, False
+            chunk_size = 1048576
+            progress.update(song_progress_id, total=1)
+            progress.update(song_progress_id, description=f"{self.source}.download >>> {song_info.song_name} (Downloading)")
+            # download music file
+            with tempfile.TemporaryDirectory(prefix="musicdl-TIDALMusicClient-track-") as tmpdir:
+                download_part = os.path.join(
+                    tmpdir, f"download{download_ext}.part" if download_ext else "download.part"
+                )
+                tool = aigpy.download.DownloadTool(download_part, stream_url.urls)
+                tool.setUserProgress(None)
+                tool.setPartSize(chunk_size)
+                check, err = tool.start(showProgress=False)
+                # explicit raise: keeps the downloader's error message and still works under "python -O"
+                if not check: raise RuntimeError(f"stream download failed: {err}")
+                decrypted_path = os.path.join(
+                    tmpdir, f"decrypted{download_ext}" if download_ext else "decrypted"
+                )
+                if aigpy.string.isNull(stream_url.encryptionKey):
+                    replacefile(download_part, decrypted_path)
+                else:
+                    key, nonce = decryptsecuritytoken(stream_url.encryptionKey)
+                    decryptfile(download_part, decrypted_path, key, nonce)
+                    os.remove(download_part)
+                if remux_required:
+                    remux_target = os.path.join(tmpdir, "remux.flac")
+                    processed_path, _ = remuxflacstream(decrypted_path, remux_target)
+                    if processed_path != decrypted_path:
+                        if os.path.exists(decrypted_path): os.remove(decrypted_path)
+                        decrypted_path = processed_path
+                    else:
+                        # remux returned the input path unchanged: keep the downloaded extension
+                        final_ext = download_ext
+                save_path = song_info.save_path
+                replacefile(decrypted_path, save_path)
+                setmetadata(track=song_info.raw_data['search'], filepath=save_path, stream=stream_url)
+            # update progress
+            progress.update(song_progress_id, total=os.path.getsize(save_path))
+            progress.advance(song_progress_id, os.path.getsize(save_path))
+            progress.update(song_progress_id, description=f"{self.source}.download >>> {song_info.song_name} (Success)")
+            downloaded_song_info = copy.deepcopy(song_info)
+            downloaded_song_info.ext = final_ext
+            downloaded_song_infos.append(SongInfoUtils.fillsongtechinfo(downloaded_song_info, logger_handle=self.logger_handle, disable_print=self.disable_print))
+        # failure
+        except Exception as err:
+            progress.update(song_progress_id, description=f"{self.source}.download >>> {song_info.song_name} (Error: {err})")
+        # return
+        return downloaded_song_infos
+    '''_search'''
+    @usesearchheaderscookies
+    def _search(self, keyword: str = '', search_url: str = '', request_overrides: dict = None, song_infos: list = None, progress: Progress = None, progress_id: int = 0):
+        '''
+        Run one search request and append a SongInfo for every track with a usable stream.
+        For each track the qualities are tried in the listed order (HI_RES_LOSSLESS first, LOW last)
+        until one yields a valid download url; lyrics are then fetched on a best-effort basis.
+        Args:
+            keyword: search keyword (not used directly; search_url already encodes the query).
+            search_url: fully built search url to request.
+            request_overrides: extra keyword arguments forwarded to every request.
+            song_infos: list to append results to; a new list is created when omitted.
+            progress / progress_id: rich Progress task used for status reporting.
+        Returns:
+            song_infos. Failures of the whole request are only reported via progress.
+        '''
+        # init (fresh list per call instead of a shared mutable default)
+        request_overrides = request_overrides or {}
+        if song_infos is None: song_infos = []
+        # successful
+        try:
+            # --search results
+            resp = self._saferequestget(search_url, **request_overrides)
+            resp.raise_for_status()
+            search_results: list[Track] = aigpy.model.dictToModel(resp2json(resp=resp), SearchResult()).tracks.items
+            for search_result in search_results:
+                if search_result.id is None: continue
+                song_info = SongInfo(source=self.source)
+                # --download results
+                qualities = [('hi_res_lossless', 'HI_RES_LOSSLESS'), ('high_lossless', 'LOSSLESS'), ('low_320k', 'HIGH'), ('low_96k', 'LOW')]
+                for quality in qualities:
+                    params = {"playbackmode": "STREAM", "audioquality": quality[1], "assetpresentation": "FULL",}
+                    try:
+                        resp = self._saferequestget(f'https://tidal.com/v1/tracks/{search_result.id}/playbackinfo', params=params, **request_overrides)
+                        resp.raise_for_status()
+                        download_result = aigpy.model.dictToModel(resp2json(resp), StreamRespond())
+                    except Exception:
+                        # this quality is unavailable: try the next one
+                        continue
+                    if ("vnd.tidal.bt" not in download_result.manifestMimeType) and ("dash+xml" not in download_result.manifestMimeType): continue
+                    try: download_url = self._parsemanifest(stream_resp=download_result)
+                    except Exception: continue
+                    if not download_url: continue
+                    song_info = SongInfo(
+                        source=self.source, download_url=download_url, download_url_status=self.audio_link_tester.test(download_url.urls[0], request_overrides),
+                        ext=self._guessextension(stream_url=download_url), duration=seconds2hms(search_result.duration),
+                        raw_data={'search': search_result, 'download': download_result}, file_size='NULL',
+                        song_name=legalizestring(search_result.title, replace_null_string='NULL'),
+                        singers=legalizestring(', '.join([singer.name for singer in search_result.artists]), replace_null_string='NULL'),
+                        album=legalizestring(search_result.album.title, replace_null_string='NULL'),
+                        identifier=search_result.id,
+                    )
+                    if song_info.with_valid_download_url: break
+                if not song_info.with_valid_download_url: continue
+                # --lyric results
+                params = {'countryCode': self.tidal_session.storage.country_code, 'include': 'lyrics'}
+                try:
+                    resp = self._saferequestget(f'https://openapi.tidal.com/v2/tracks/{search_result.id}', params=params, **request_overrides)
+                    resp.raise_for_status()
+                    lyric_result = resp2json(resp)
+                    lyric = lyric_result.get('included', [{}])[0].get('attributes', {}).get('lrcText', 'NULL')
+                except Exception:
+                    # lyrics are optional: any failure leaves the track without them
+                    lyric_result, lyric = {}, 'NULL'
+                song_info.raw_data['lyric'] = lyric_result
+                song_info.lyric = lyric
+                # --append to song_infos
+                song_infos.append(song_info)
+                # --judgement for search_size
+                if self.strict_limit_search_size_per_page and len(song_infos) >= self.search_size_per_page: break
+            # --update progress
+            progress.update(progress_id, description=f"{self.source}.search >>> {search_url} (Success)")
+        # failure
+        except Exception as err:
+            progress.update(progress_id, description=f"{self.source}.search >>> {search_url} (Error: {err})")
+        # return
+        return song_infos

musicdl/modules/sources/ximalaya.py ADDED Viewed

@@ -0,0 +1,256 @@
+'''
+Function:
+    Implementation of XimalayaMusicClient: https://www.ximalaya.com/
+Author:
+    Zhenchao Jin
+WeChat Official Account (微信公众号):
+    Charles的皮卡丘
+'''
+import re
+import time
+import copy
+import base64
+import binascii
+from Crypto.Cipher import AES
+from .base import BaseMusicClient
+from rich.progress import Progress
+from urllib.parse import urlencode, urlparse
+from ..utils import byte2mb, resp2json, seconds2hms, legalizestring, safeextractfromdict, usesearchheaderscookies, SongInfo
+'''XimalayaMusicClient'''
+class XimalayaMusicClient(BaseMusicClient):
+    source = 'XimalayaMusicClient'
+    def __init__(self, **kwargs):
+        '''Set up the client with the same Chrome User-Agent for search and download requests.'''
+        super(XimalayaMusicClient, self).__init__(**kwargs)
+        user_agent = "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/142.0.0.0 Safari/537.36"
+        # two separate dicts so search and download headers can diverge later
+        self.default_search_headers = {"User-Agent": user_agent}
+        self.default_download_headers = {"User-Agent": user_agent}
+        self.default_headers = self.default_search_headers
+        self._initsession()
+    '''_decrypturl'''
+    def _decrypturl(self, ciphertext: str):
+        '''Decrypt a url-safe base64, AES-ECB encrypted url and keep only printable ASCII; falsy input is returned unchanged.'''
+        if not ciphertext:
+            return ciphertext
+        aes_key = binascii.unhexlify("aaad3e4fd540b0f79dca95606e72bf93")
+        padding = "=" * (4 - len(ciphertext) % 4)
+        raw_bytes = base64.urlsafe_b64decode(ciphertext + padding)
+        decrypted = AES.new(aes_key, AES.MODE_ECB).decrypt(raw_bytes)
+        # drop every character outside 0x20-0x7E (presumably the cipher's padding bytes)
+        return re.sub(r"[^\x20-\x7E]", "", decrypted.decode("utf-8"))
+    '''_validategdstudio'''
+    def _validategdstudio(self, request_overrides: dict = None):
+        '''
+        Probe the gdstudio API with a fixed one-result search.
+        Returns:
+            True only when the request succeeds and the decoded body is a list with exactly one item; False otherwise.
+        '''
+        request_overrides = request_overrides or {}
+        try:
+            resp = self.get('https://music-api.gdstudio.xyz/api.php?types=search&source=ximalaya&name=%E4%B8%89%E5%9B%BD&count=1&pages=1', timeout=10, **request_overrides)
+            resp.raise_for_status()
+            result = resp2json(resp=resp)
+        except Exception:
+            return False
+        # explicit check instead of assert, which is stripped under "python -O" and would make this always True
+        return isinstance(result, list) and (len(result) == 1)
+    '''_constructsearchurls'''
+    def _constructsearchurls(self, keyword: str, rule: dict = None, request_overrides: dict = None):
+        # Build the list of search urls for keyword. Three backends are possible:
+        #   1. the official ximalaya.com API when search cookies are configured,
+        #   2. the gdstudio API when _validategdstudio() succeeds,
+        #   3. otherwise the cenguigui API (two hosts are probed; the first that returns data is used).
+        # init
+        rule, request_overrides = rule or {}, request_overrides or {}
+        # if with cookies, use official apis
+        if self.default_search_cookies:
+            # --search rules
+            default_rule = {
+                'kw': keyword, 'page': 1, 'spellchecker': 'true', 'condition': 'relation', 'rows': self.search_size_per_page, 'device': 'iPhone',
+                'core': 'track', 'fq': '', 'paidFilter': 'false',
+            }
+            default_rule.update(rule)
+            # --construct search urls based on search rules (one url per 1-based page)
+            base_url = 'https://www.ximalaya.com/revision/search/main?'
+            search_urls, page_size, count = [], self.search_size_per_page, 0
+            while self.search_size_per_source > count:
+                page_rule = copy.deepcopy(default_rule)
+                page_rule['rows'] = page_size
+                page_rule['page'] = int(count // page_size) + 1
+                search_urls.append(base_url + urlencode(page_rule))
+                count += page_size
+        # if without cookies, use third-party apis
+        else:
+            use_gdstudio = self._validategdstudio(request_overrides=request_overrides)
+            if use_gdstudio:
+                # --search rules
+                default_rule = {'types': 'search', 'source': 'ximalaya', 'name': keyword, 'count': self.search_size_per_page, 'pages': '1'}
+                default_rule.update(rule)
+                # --construct search urls based on search rules (one url per 1-based page)
+                base_url = 'https://music-api.gdstudio.xyz/api.php?'
+                search_urls, page_size, count = [], self.search_size_per_page, 0
+                while self.search_size_per_source > count:
+                    page_rule = copy.deepcopy(default_rule)
+                    page_rule['count'] = page_size
+                    page_rule['pages'] = int(count // page_size) + 1
+                    search_urls.append(base_url + urlencode(page_rule))
+                    count += page_size
+            else:
+                # --search rules
+                default_rule = {'msg': keyword, 'n': '', 'num': self.search_size_per_source, 'type': 'json'}
+                default_rule.update(rule)
+                # --construct search urls based on search rules
+                # a single url requests all results at once, so the page size is raised to the per-source size (this mutates the instance)
+                for base_url in ['https://api-v1.cenguigui.cn/api/music/dg_ximalayamusic.php?', 'https://api.cenguigui.cn/api/music/dg_ximalayamusic.php?']:
+                    page_rule = copy.deepcopy(default_rule)
+                    page_rule['num'] = self.search_size_per_source
+                    search_urls = [base_url + urlencode(page_rule)]
+                    self.search_size_per_page = self.search_size_per_source
+                    # probe the host; keep it when it answers with a non-empty 'data', otherwise try the next one
+                    try:
+                        resp = self.get(search_urls[0], timeout=10, **request_overrides)
+                        resp.raise_for_status()
+                        result = resp2json(resp=resp)
+                        assert isinstance(result, dict) and (len(result['data']) > 0)
+                        break
+                    except:
+                        # if every host fails, search_urls still holds the url of the last host tried
+                        continue
+        # return
+        return search_urls
+    '''_parsecggapi'''
+    def _parsecggapi(self, keyword, search_results, song_infos: list = None, request_overrides: dict = None):
+        '''
+        Convert cenguigui API search results into SongInfo objects.
+        Args:
+            keyword: the original search keyword, sent again when resolving each download url.
+            search_results: decoded search response; its 'data' entries are iterated.
+            song_infos: list to append results to; a new list is created when omitted.
+            request_overrides: extra keyword arguments forwarded to every request.
+        Returns:
+            song_infos with one entry per result that has a valid download url.
+        '''
+        # init (fresh list per call instead of a shared mutable default)
+        request_overrides = request_overrides or {}
+        if song_infos is None: song_infos = []
+        # parse
+        for search_result in search_results['data']:
+            # --download results
+            if (not isinstance(search_result, dict)) or ('trackId' not in search_result) or ('n' not in search_result):
+                continue
+            song_info = SongInfo(source=self.source)
+            params = {'msg': keyword, 'n': search_result['n'], 'num': self.search_size_per_source, 'type': 'json'}
+            try:
+                # the second host is only tried when the first one fails
+                try:
+                    resp = self.get('https://api-v1.cenguigui.cn/api/music/dg_ximalayamusic.php', params=params, timeout=10, **request_overrides)
+                    resp.raise_for_status()
+                except Exception:
+                    resp = self.get('https://api.cenguigui.cn/api/music/dg_ximalayamusic.php', params=params, timeout=10, **request_overrides)
+                    resp.raise_for_status()
+                download_result = resp2json(resp)
+                download_url: str = download_result.get('url', '')
+                if not download_url: continue
+                ext = download_url.split('.')[-1].split('?')[0]
+                song_info = SongInfo(
+                    source=self.source, download_url=download_url, download_url_status=self.audio_link_tester.test(download_url, request_overrides),
+                    raw_data={'search': search_result, 'download': {}, 'lyric': {}}, lyric='NULL', duration='-:-:-', file_size='NULL', ext=ext,
+                    song_name=legalizestring(search_result.get('title', 'NULL'), replace_null_string='NULL'),
+                    singers=legalizestring(search_result.get('nickname', 'NULL'), replace_null_string='NULL'),
+                    album=legalizestring(search_result.get('categoryName', 'NULL'), replace_null_string='NULL'),
+                    identifier=search_result['trackId'],
+                )
+            except Exception:
+                # a failing entry is skipped so the remaining results are still processed
+                continue
+            if not song_info.with_valid_download_url: continue
+            # refine extension and file size from the probe result when it provides them
+            song_info.download_url_status['probe_status'] = self.audio_link_tester.probe(song_info.download_url, request_overrides)
+            ext, file_size = song_info.download_url_status['probe_status']['ext'], song_info.download_url_status['probe_status']['file_size']
+            if file_size and file_size != 'NULL': song_info.file_size = file_size
+            if ext and ext != 'NULL': song_info.ext = ext
+            # --append to song_infos
+            song_infos.append(song_info)
+            # --judgement for search_size
+            if self.strict_limit_search_size_per_page and len(song_infos) >= self.search_size_per_page: break
+        # return
+        return song_infos
+    '''_parsegdstudioapi'''
+    def _parsegdstudioapi(self, search_results, song_infos: list = None, request_overrides: dict = None):
+        '''
+        Convert gdstudio API search results into SongInfo objects.
+        Args:
+            search_results: iterable of result dicts; entries without 'id' or 'raw' are skipped.
+            song_infos: list to append results to; a new list is created when omitted.
+            request_overrides: extra keyword arguments forwarded to the link tester.
+        Returns:
+            song_infos with one entry per result that has a valid download url.
+        '''
+        # init (fresh list per call instead of a shared mutable default)
+        request_overrides = request_overrides or {}
+        if song_infos is None: song_infos = []
+        # parse
+        for search_result in search_results:
+            # --download results
+            if (not isinstance(search_result, dict)) or ('id' not in search_result) or ('raw' not in search_result):
+                continue
+            song_info = SongInfo(source=self.source)
+            # the play paths are tried in this order; the first one with a valid link wins
+            for quality in ['play_path_64', 'play_path_aacv164', 'play_path_32', 'play_path_aacv224']:
+                download_url: str = search_result['raw'].get(quality, '')
+                if not download_url: continue
+                song_info = SongInfo(
+                    source=self.source, download_url=download_url, download_url_status=self.audio_link_tester.test(download_url, request_overrides),
+                    raw_data={'search': search_result, 'download': {}, 'lyric': {}}, lyric='NULL', duration_s=search_result['raw'].get('duration', 0),
+                    duration=seconds2hms(search_result['raw'].get('duration', 0)), file_size='NULL', ext=download_url.split('.')[-1].split('?')[0],
+                    song_name=legalizestring(search_result['raw'].get('title', 'NULL'), replace_null_string='NULL'),
+                    singers=legalizestring(search_result['raw'].get('nickname', 'NULL'), replace_null_string='NULL'),
+                    album=legalizestring(search_result['raw'].get('album_title', 'NULL'), replace_null_string='NULL'),
+                    identifier=search_result['id'],
+                )
+                if song_info.with_valid_download_url: break
+            if not song_info.with_valid_download_url: continue
+            # refine extension and file size from the probe result when it provides them
+            song_info.download_url_status['probe_status'] = self.audio_link_tester.probe(song_info.download_url, request_overrides)
+            ext, file_size = song_info.download_url_status['probe_status']['ext'], song_info.download_url_status['probe_status']['file_size']
+            if file_size and file_size != 'NULL': song_info.file_size = file_size
+            if ext and ext != 'NULL': song_info.ext = ext
+            # --append to song_infos
+            song_infos.append(song_info)
+            # --judgement for search_size
+            if self.strict_limit_search_size_per_page and len(song_infos) >= self.search_size_per_page: break
+        # return
+        return song_infos
+    '''_parseofficialapi'''
+    def _parseofficialapi(self, search_results, song_infos: list = None, request_overrides: dict = None):
+        '''Turn official ximalaya search results into SongInfo objects and append them to song_infos.
+
+        The track id is the last path segment of each result's 'trackUrl'. For that id the
+        baseInfo endpoint is requested with trackQualityLevel 2, 1, 0 (in this order); the
+        entries of 'playUrlList' are tried from the largest 'fileSize' to the smallest and the
+        first decrypted url whose SongInfo reports ``with_valid_download_url`` is kept.
+
+        Args:
+            search_results: decoded search response; the items are read from
+                ``search_results['data']['track']['docs']`` (a missing key propagates to the caller).
+            song_infos: list the accepted songs are appended to (mutated in place). A new list
+                is created when it is omitted.
+            request_overrides: extra keyword arguments for ``self.get``; also passed through to
+                ``self.audio_link_tester.test`` / ``.probe``.
+
+        Returns:
+            The ``song_infos`` list.
+        '''
+        # init
+        request_overrides = request_overrides or {}
+        # a fresh list per call: a literal `[]` default is created once and shared between calls
+        song_infos = [] if song_infos is None else song_infos
+        # sort key for playUrlList entries; a missing / non-numeric fileSize sorts last instead of raising
+        def _filesize(play_url: dict) -> int:
+            try:
+                return int(play_url.get('fileSize', 0))
+            except (TypeError, ValueError):
+                return 0
+        # parse
+        for search_result in search_results['data']['track']['docs']:
+            # --download results
+            if (not isinstance(search_result, dict)) or ('trackUrl' not in search_result):
+                continue
+            # str(... or '') keeps a None / non-string trackUrl from raising on .strip
+            track_id = str(search_result.get('trackUrl') or '').strip('/').split('/')[-1]
+            if not track_id: continue
+            song_info = SongInfo(source=self.source)
+            for quality in [2, 1, 0]:
+                params = {"device": "web", "trackId": track_id, "trackQualityLevel": quality}
+                try:
+                    resp = self.get(f"https://www.ximalaya.com/mobile-playpage/track/v3/baseInfo/{int(time.time() * 1000)}", params=params, **request_overrides)
+                    resp.raise_for_status()
+                    download_result = resp2json(resp=resp)
+                    track_info = safeextractfromdict(download_result, ['trackInfo'], {})
+                except Exception:
+                    # best effort: a failed request for this quality level just moves on to the next one
+                    continue
+                if (not isinstance(track_info, dict)) or (not track_info): continue
+                # drop malformed entries BEFORE sorting, so a single bad item cannot abort the whole parse
+                play_urls = [item for item in (safeextractfromdict(track_info, ['playUrlList'], []) or []) if isinstance(item, dict)]
+                for encrypted_url in sorted(play_urls, key=_filesize, reverse=True):
+                    download_url = self._decrypturl(encrypted_url.get('url', ''))
+                    if not download_url: continue
+                    song_info = SongInfo(
+                        source=self.source, download_url=download_url, download_url_status=self.audio_link_tester.test(download_url, request_overrides),
+                        raw_data={'search': search_result, 'download': download_result, 'lyric': {}}, lyric='NULL', duration_s=track_info.get('duration', 0),
+                        duration=seconds2hms(track_info.get('duration', 0)), file_size_bytes=encrypted_url.get('fileSize', 0), file_size=byte2mb(encrypted_url.get('fileSize', 0)),
+                        ext=download_url.split('.')[-1].split('?')[0], identifier=track_id, song_name=legalizestring(search_result.get('title', 'NULL'), replace_null_string='NULL'),
+                        singers=legalizestring(search_result.get('nickname', 'NULL'), replace_null_string='NULL'),
+                        album=legalizestring(safeextractfromdict(search_result, ['albumInfo', 'title'], ''), replace_null_string='NULL'),
+                    )
+                    if song_info.with_valid_download_url: break
+                if song_info.with_valid_download_url: break
+            if not song_info.with_valid_download_url: continue
+            # --probe the accepted url; its ext / file_size replace the earlier values when present
+            probe_status = self.audio_link_tester.probe(song_info.download_url, request_overrides)
+            song_info.download_url_status['probe_status'] = probe_status
+            ext, file_size = probe_status['ext'], probe_status['file_size']
+            if file_size and file_size != 'NULL': song_info.file_size = file_size
+            if ext and ext != 'NULL': song_info.ext = ext
+            # --append to song_infos
+            song_infos.append(song_info)
+            # --judgement for search_size
+            if self.strict_limit_search_size_per_page and len(song_infos) >= self.search_size_per_page: break
+        # return (same contract as _parsegdstudioapi)
+        return song_infos
+    '''_search'''
+    @usesearchheaderscookies
+    def _search(self, keyword: str = '', search_url: str = '', request_overrides: dict = None, song_infos: list = None, progress: Progress = None, progress_id: int = 0):
+        '''Fetch search_url and parse the response with the parser that matches its hostname.
+
+        Hostname 'music-api.gdstudio.xyz' is handled by ``_parsegdstudioapi``,
+        'api-v1.cenguigui.cn' / 'api.cenguigui.cn' by ``_parsecggapi``, everything else by
+        ``_parseofficialapi``. Any exception raised while requesting or parsing is caught and
+        only reported through ``progress``.
+
+        Args:
+            keyword: search keyword; only forwarded to ``_parsecggapi``.
+            search_url: url that is requested with ``self.get``.
+            request_overrides: extra keyword arguments for ``self.get``; also forwarded to the parsers.
+            song_infos: list the parsers append to (mutated in place). A new list is created when omitted.
+            progress: object whose ``update(progress_id, description=...)`` receives the outcome; may be None.
+            progress_id: id passed to ``progress.update``.
+
+        Returns:
+            The ``song_infos`` list (possibly partially filled when an error occurred).
+        '''
+        # init
+        request_overrides = request_overrides or {}
+        # a fresh list per call: a literal `[]` default is created once and shared between calls
+        song_infos = [] if song_infos is None else song_infos
+        # successful
+        try:
+            # --search results
+            resp = self.get(search_url, **request_overrides)
+            resp.raise_for_status()
+            search_results = resp2json(resp)
+            # --parse based on selected API
+            parsed_search_url = urlparse(search_url)
+            if parsed_search_url.hostname in ['music-api.gdstudio.xyz']:
+                self._parsegdstudioapi(search_results, song_infos=song_infos, request_overrides=request_overrides)
+            elif parsed_search_url.hostname in ['api-v1.cenguigui.cn', 'api.cenguigui.cn']:
+                self._parsecggapi(keyword, search_results, song_infos=song_infos, request_overrides=request_overrides)
+            else:
+                self._parseofficialapi(search_results, song_infos=song_infos, request_overrides=request_overrides)
+            # --update progress (progress defaults to None, so it must be checked before use)
+            if progress is not None:
+                progress.update(progress_id, description=f"{self.source}.search >>> {search_url} (Success)")
+        # failure
+        except Exception as err:
+            # without the None check a missing progress object would raise again from inside this handler
+            if progress is not None:
+                progress.update(progress_id, description=f"{self.source}.search >>> {search_url} (Error: {err})")
+        # return
+        return song_infos

musicdl 2.1.11__py3-none-any.whl → 2.7.3__py3-none-any.whl

musicdl 2.1.11py3-none-any.whl → 2.7.3py3-none-any.whl