Skip to content

Commit 1722c55

Browse files
doe1080eason1478
andauthored
[ie/hypergryph] Improve metadata extraction (#13415)
Closes #13384 Authored by: doe1080, eason1478 Co-authored-by: eason1478 <[email protected]>
1 parent e6bd4a3 commit 1722c55

File tree

1 file changed

+45
-11
lines changed

1 file changed

+45
-11
lines changed

yt_dlp/extractor/hypergryph.py

Lines changed: 45 additions & 11 deletions
Original file line numberDiff line numberDiff line change
@@ -1,32 +1,66 @@
11
from .common import InfoExtractor
2-
from ..utils import js_to_json, traverse_obj
2+
from ..utils import (
3+
ExtractorError,
4+
clean_html,
5+
url_or_none,
6+
)
7+
from ..utils.traversal import subs_list_to_dict, traverse_obj
38

49

510
class MonsterSirenHypergryphMusicIE(InfoExtractor):
11+
IE_NAME = 'monstersiren'
12+
IE_DESC = '塞壬唱片'
13+
_API_BASE = 'https://monster-siren.hypergryph.com/api'
614
_VALID_URL = r'https?://monster-siren\.hypergryph\.com/music/(?P<id>\d+)'
715
_TESTS = [{
816
'url': 'https://monster-siren.hypergryph.com/music/514562',
917
'info_dict': {
1018
'id': '514562',
1119
'ext': 'wav',
12-
'artists': ['塞壬唱片-MSR'],
13-
'album': 'Flame Shadow',
1420
'title': 'Flame Shadow',
21+
'album': 'Flame Shadow',
22+
'artists': ['塞壬唱片-MSR'],
23+
'description': 'md5:19e2acfcd1b65b41b29e8079ab948053',
24+
'thumbnail': r're:https?://web\.hycdn\.cn/siren/pic/.+\.jpg',
25+
},
26+
}, {
27+
'url': 'https://monster-siren.hypergryph.com/music/514518',
28+
'info_dict': {
29+
'id': '514518',
30+
'ext': 'wav',
31+
'title': 'Heavenly Me (Instrumental)',
32+
'album': 'Heavenly Me',
33+
'artists': ['塞壬唱片-MSR', 'AIYUE blessed : 理名'],
34+
'description': 'md5:ce790b41c932d1ad72eb791d1d8ae598',
35+
'thumbnail': r're:https?://web\.hycdn\.cn/siren/pic/.+\.jpg',
1536
},
1637
}]
1738

1839
def _real_extract(self, url):
1940
audio_id = self._match_id(url)
20-
webpage = self._download_webpage(url, audio_id)
21-
json_data = self._search_json(
22-
r'window\.g_initialProps\s*=', webpage, 'data', audio_id, transform_source=js_to_json)
41+
song = self._download_json(f'{self._API_BASE}/song/{audio_id}', audio_id)
42+
if traverse_obj(song, 'code') != 0:
43+
msg = traverse_obj(song, ('msg', {str}, filter))
44+
raise ExtractorError(
45+
msg or 'API returned an error response', expected=bool(msg))
46+
47+
album = None
48+
if album_id := traverse_obj(song, ('data', 'albumCid', {str})):
49+
album = self._download_json(
50+
f'{self._API_BASE}/album/{album_id}/detail', album_id, fatal=False)
2351

2452
return {
2553
'id': audio_id,
26-
'title': traverse_obj(json_data, ('player', 'songDetail', 'name')),
27-
'url': traverse_obj(json_data, ('player', 'songDetail', 'sourceUrl')),
28-
'ext': 'wav',
2954
'vcodec': 'none',
30-
'artists': traverse_obj(json_data, ('player', 'songDetail', 'artists', ...)),
31-
'album': traverse_obj(json_data, ('musicPlay', 'albumDetail', 'name')),
55+
**traverse_obj(song, ('data', {
56+
'title': ('name', {str}),
57+
'artists': ('artists', ..., {str}),
58+
'subtitles': ({'url': 'lyricUrl'}, all, {subs_list_to_dict(lang='en')}),
59+
'url': ('sourceUrl', {url_or_none}),
60+
})),
61+
**traverse_obj(album, ('data', {
62+
'album': ('name', {str}),
63+
'description': ('intro', {clean_html}),
64+
'thumbnail': ('coverUrl', {url_or_none}),
65+
})),
3266
}

0 commit comments

Comments
 (0)