Merge pull request #6966 from remitamine/kuwo

author Yen Chi Hsuan <yan12125@gmail.com>

Sat, 26 Sep 2015 11:28:16 +0000 (19:28 +0800)

committer Yen Chi Hsuan <yan12125@gmail.com>

Sat, 26 Sep 2015 11:28:16 +0000 (19:28 +0800)
author Yen Chi Hsuan <yan12125@gmail.com>
Sat, 26 Sep 2015 11:28:16 +0000 (19:28 +0800)
committer Yen Chi Hsuan <yan12125@gmail.com>
Sat, 26 Sep 2015 11:28:16 +0000 (19:28 +0800)
diff --git a/youtube_dl/extractor/kuwo.py b/youtube_dl/extractor/kuwo.py

index fa233377d67ee83bf71db61f14d0e934111174a3..0c8ed5d07258d463375c2848d2f93c79885bdaae 100644 (file)
--- a/youtube_dl/extractor/kuwo.py
+++ b/youtube_dl/extractor/kuwo.py
@@ -57,6 +57,7 @@ class KuwoIE(KuwoBaseIE):
              'upload_date': '20080122',
              'description': 'md5:ed13f58e3c3bf3f7fd9fbc4e5a7aa75c'
          },
+        'skip': 'this song has been offline because of copyright issues',
      }, {
          'url': 'http://www.kuwo.cn/yinyue/6446136/',
          'info_dict': {
@@ -76,9 +77,11 @@ class KuwoIE(KuwoBaseIE):
          webpage = self._download_webpage(
              url, song_id, note='Download song detail info',
              errnote='Unable to get song detail info')
+        if '对不起，该歌曲由于版权问题已被下线，将返回网站首页' in webpage:
+            raise ExtractorError('this song has been offline because of copyright issues', expected=True)
  
          song_name = self._html_search_regex(
-            r'<h1[^>]+title="([^"]+)">', webpage, 'song name')
+            r'(?s)class="(?:[^"\s]+\s+)*title(?:\s+[^"\s]+)*".*?<h1[^>]+title="([^"]+)"', webpage, 'song name')
          singer_name = self._html_search_regex(
              r'<div[^>]+class="s_img">\s*<a[^>]+title="([^>]+)"',
              webpage, 'singer name', fatal=False)
author	Yen Chi Hsuan <yan12125@gmail.com>
	Sat, 26 Sep 2015 11:28:16 +0000 (19:28 +0800)
committer	Yen Chi Hsuan <yan12125@gmail.com>
	Sat, 26 Sep 2015 11:28:16 +0000 (19:28 +0800)