[svtplay:series] Add extractor

author Mattias Wadman <mattias.wadman@gmail.com>

Fri, 30 Mar 2018 18:02:09 +0000 (20:02 +0200)

committer Sergey M․ <dstftw@gmail.com>

Wed, 4 Apr 2018 17:28:58 +0000 (00:28 +0700)
author Mattias Wadman <mattias.wadman@gmail.com>
Fri, 30 Mar 2018 18:02:09 +0000 (20:02 +0200)
committer Sergey M․ <dstftw@gmail.com>
Wed, 4 Apr 2018 17:28:58 +0000 (00:28 +0700)
diff --git a/youtube_dl/extractor/extractors.py b/youtube_dl/extractor/extractors.py

index bded6e144cc86acf063850d05acb17a22059d61f..b46a304acdae8e139d60591b71716b27cad2f6a3 100644 (file)
--- a/youtube_dl/extractor/extractors.py
+++ b/youtube_dl/extractor/extractors.py
@@ -1031,6 +1031,7 @@ from .sunporno import SunPornoIE
  from .svt import (
      SVTIE,
      SVTPlayIE,
+    SVTPlaylistIE,
  )
  from .swrmediathek import SWRMediathekIE
  from .syfy import SyfyIE
diff --git a/youtube_dl/extractor/svt.py b/youtube_dl/extractor/svt.py

index 48bc4529e6ae8a265a672c066ac59b388ea3a5d5..d02fd945081c80cebad517c46849ed5e831a3887 100644 (file)
--- a/youtube_dl/extractor/svt.py
+++ b/youtube_dl/extractor/svt.py
@@ -9,6 +9,8 @@ from ..utils import (
      dict_get,
      int_or_none,
      try_get,
+    urljoin,
+    compat_str,
  )
  
  
@@ -189,3 +191,58 @@ class SVTPlayIE(SVTBaseIE):
                      r'\s*\|\s*.+?$', '',
                      info_dict.get('episode') or self._og_search_title(webpage))
              return info_dict
+
+
+class SVTPlaylistIE(InfoExtractor):
+    IE_DESC = 'SVT Play serie'
+    _VALID_URL = r'https?://(?:www\.)?svtplay\.se/(?P<id>[^/?&#]+)'
+    IE_NAME = 'svtplay:serie'
+    _TESTS = [{
+        'url': 'https://www.svtplay.se/rederiet',
+        'info_dict': {
+            'id': 'rederiet',
+            'title': 'Rederiet',
+            'description': 'md5:505d491a58f4fcf6eb418ecab947e69e',
+        },
+        'playlist_mincount': 318,
+    }]
+
+    @classmethod
+    def suitable(cls, url):
+        return False if SVTIE.suitable(url) or SVTPlayIE.suitable(url) else super(SVTPlaylistIE, cls).suitable(url)
+
+    def _real_extract(self, url):
+        video_id = self._match_id(url)
+
+        page = self._download_webpage(
+            url, video_id,
+            note='Downloading serie page',
+            errnote='unable to fetch serie page')
+
+        root_json = self._search_regex(
+            r'root\[\'__svtplay\'\]\s*=(.+);\n',
+            page, 'root')
+        root = self._parse_json(root_json, video_id)
+
+        metadata = root.get('metaData', {})
+        related_videos_accordion = root['relatedVideoContent']['relatedVideosAccordion']
+
+        entries = []
+        for season in related_videos_accordion:
+            videos = season.get('videos')
+            if not isinstance(videos, list):
+                continue
+
+            for video in videos:
+                content_url = video.get('contentUrl')
+                if not isinstance(content_url, compat_str):
+                    continue
+                entries.append(
+                    self.url_result(
+                        urljoin(url, content_url),
+                        ie=SVTPlayIE.ie_key(),
+                        video_title=video.get('title')
+                    ))
+
+        return self.playlist_result(
+            entries, video_id, metadata.get('title'), metadata.get('description'))
author	Mattias Wadman <mattias.wadman@gmail.com>
	Fri, 30 Mar 2018 18:02:09 +0000 (20:02 +0200)
committer	Sergey M․ <dstftw@gmail.com>
	Wed, 4 Apr 2018 17:28:58 +0000 (00:28 +0700)
youtube_dl/extractor/extractors.py		patch \| blob \| history
youtube_dl/extractor/svt.py		patch \| blob \| history