[mangomolo] fix video format extraction and add support for player URLs

author Remita Amine <remitamine@gmail.com>

Thu, 17 Oct 2019 12:21:44 +0000 (13:21 +0100)

committer Remita Amine <remitamine@gmail.com>

Thu, 17 Oct 2019 12:21:44 +0000 (13:21 +0100)
author Remita Amine <remitamine@gmail.com>
Thu, 17 Oct 2019 12:21:44 +0000 (13:21 +0100)
committer Remita Amine <remitamine@gmail.com>
Thu, 17 Oct 2019 12:21:44 +0000 (13:21 +0100)
diff --git a/youtube_dl/extractor/generic.py b/youtube_dl/extractor/generic.py

index ec43c5ae4086a769300ce9e550244cd9c13d6c00..5ed952b295a3e288304626c173a2eb22c6483f27 100644 (file)
--- a/youtube_dl/extractor/generic.py
+++ b/youtube_dl/extractor/generic.py
@@ -2962,10 +2962,14 @@ class GenericIE(InfoExtractor):
  
          # Look for Mangomolo embeds
          mobj = re.search(
-            r'''(?x)<iframe[^>]+src=(["\'])(?P<url>(?:https?:)?//(?:www\.)?admin\.mangomolo\.com/analytics/index\.php/customers/embed/
+            r'''(?x)<iframe[^>]+src=(["\'])(?P<url>(?:https?:)?//
+                (?:
+                    admin\.mangomolo\.com/analytics/index\.php/customers/embed|
+                    player\.mangomolo\.com/v1
+                )/
                  (?:
                      video\?.*?\bid=(?P<video_id>\d+)|
-                    index\?.*?\bchannelid=(?P<channel_id>(?:[A-Za-z0-9+/=]|%2B|%2F|%3D)+)
+                    (?:index|live)\?.*?\bchannelid=(?P<channel_id>(?:[A-Za-z0-9+/=]|%2B|%2F|%3D)+)
                  ).+?)\1''', webpage)
          if mobj is not None:
              info = {
diff --git a/youtube_dl/extractor/mangomolo.py b/youtube_dl/extractor/mangomolo.py

index 482175a3412db859e32cb79893df1c830afa17e7..acee370e931602bd3972eb631109e71c74c97ce8 100644 (file)
--- a/youtube_dl/extractor/mangomolo.py
+++ b/youtube_dl/extractor/mangomolo.py
@@ -10,18 +10,21 @@ from ..utils import int_or_none
  
  
  class MangomoloBaseIE(InfoExtractor):
+    _BASE_REGEX = r'https?://(?:admin\.mangomolo\.com/analytics/index\.php/customers/embed/|player\.mangomolo\.com/v1/)'
+
      def _get_real_id(self, page_id):
          return page_id
  
      def _real_extract(self, url):
          page_id = self._get_real_id(self._match_id(url))
-        webpage = self._download_webpage(url, page_id)
+        webpage = self._download_webpage(
+            'https://player.mangomolo.com/v1/%s?%s' % (self._TYPE, url.split('?')[1]), page_id)
          hidden_inputs = self._hidden_inputs(webpage)
          m3u8_entry_protocol = 'm3u8' if self._IS_LIVE else 'm3u8_native'
  
          format_url = self._html_search_regex(
              [
-                r'file\s*:\s*"(https?://[^"]+?/playlist\.m3u8)',
+                r'(?:file|src)\s*:\s*"(https?://[^"]+?/playlist\.m3u8)',
                  r'<a[^>]+href="(rtsp://[^"]+)"'
              ], webpage, 'format url')
          formats = self._extract_wowza_formats(
@@ -39,14 +42,16 @@ class MangomoloBaseIE(InfoExtractor):
  
  
  class MangomoloVideoIE(MangomoloBaseIE):
-    IE_NAME = 'mangomolo:video'
-    _VALID_URL = r'https?://admin\.mangomolo\.com/analytics/index\.php/customers/embed/video\?.*?\bid=(?P<id>\d+)'
+    _TYPE = 'video'
+    IE_NAME = 'mangomolo:' + _TYPE
+    _VALID_URL = MangomoloBaseIE._BASE_REGEX + r'video\?.*?\bid=(?P<id>\d+)'
      _IS_LIVE = False
  
  
  class MangomoloLiveIE(MangomoloBaseIE):
-    IE_NAME = 'mangomolo:live'
-    _VALID_URL = r'https?://admin\.mangomolo\.com/analytics/index\.php/customers/embed/index\?.*?\bchannelid=(?P<id>(?:[A-Za-z0-9+/=]|%2B|%2F|%3D)+)'
+    _TYPE = 'live'
+    IE_NAME = 'mangomolo:' + _TYPE
+    _VALID_URL = MangomoloBaseIE._BASE_REGEX + r'(live|index)\?.*?\bchannelid=(?P<id>(?:[A-Za-z0-9+/=]|%2B|%2F|%3D)+)'
      _IS_LIVE = True
  
      def _get_real_id(self, page_id):
author	Remita Amine <remitamine@gmail.com>
	Thu, 17 Oct 2019 12:21:44 +0000 (13:21 +0100)
committer	Remita Amine <remitamine@gmail.com>
	Thu, 17 Oct 2019 12:21:44 +0000 (13:21 +0100)
youtube_dl/extractor/generic.py		patch \| blob \| history
youtube_dl/extractor/mangomolo.py		patch \| blob \| history