Merge pull request #6966 from remitamine/kuwo

[kuwo] fix title extraction and update test
2025-01-23 17:26:38 +00:00 · 2015-09-26 19:28:16 +08:00 · 2015-09-26 19:28:16 +08:00 · fe6ad195ae
parent a82ba8d0ce 7193650641
commit fe6ad195ae
1 changed file with 4 additions and 1 deletion
--- a/youtube_dl/extractor/kuwo.py
+++ b/youtube_dl/extractor/kuwo.py
@@ -57,6 +57,7 @@ class KuwoIE(KuwoBaseIE):
            'upload_date': '20080122',
            'description': 'md5:ed13f58e3c3bf3f7fd9fbc4e5a7aa75c'
        },
        'skip': 'this song has been offline because of copyright issues',
    }, {
        'url': 'http://www.kuwo.cn/yinyue/6446136/',
        'info_dict': {
@@ -76,9 +77,11 @@ def _real_extract(self, url):
        webpage = self._download_webpage(
            url, song_id, note='Download song detail info',
            errnote='Unable to get song detail info')
        if '对不起，该歌曲由于版权问题已被下线，将返回网站首页' in webpage:
            raise ExtractorError('this song has been offline because of copyright issues', expected=True)
        song_name = self._html_search_regex(
-            r'<h1[^>]+title="([^"]+)">', webpage, 'song name')
+            r'(?s)class="(?:[^"\s]+\s+)*title(?:\s+[^"\s]+)*".*?<h1[^>]+title="([^"]+)"', webpage, 'song name')
        singer_name = self._html_search_regex(
            r'<div[^>]+class="s_img">\s*<a[^>]+title="([^>]+)"',
            webpage, 'singer name', fatal=False)