[SouthParkStudiosIE] Also detect URLs without http:// or www

[youtube-dl] / youtube_dl / extractor / southparkstudios.py
diff --git a/youtube_dl/extractor/southparkstudios.py b/youtube_dl/extractor/southparkstudios.py

index 1a611d3bb628643740b999e85f7bdd321a7e3de8..bb0c4b393f85012cffaeaed3de60ce7797dd0ba8 100644 (file)
--- a/youtube_dl/extractor/southparkstudios.py
+++ b/youtube_dl/extractor/southparkstudios.py
@@ -5,7 +5,7 @@ from .mtv import MTVIE, _media_xml_tag
  
  class SouthParkStudiosIE(MTVIE):
      IE_NAME = u'southparkstudios.com'
-    _VALID_URL = r'https?://www\.southparkstudios\.com/(clips|full-episodes)/(?P<id>.+?)(\?|#|$)'
+    _VALID_URL = r'(https?://)?(www\.)?(?P<url>southparkstudios\.com/(clips|full-episodes)/(?P<id>.+?)(\?|#|$))'
  
      _FEED_URL = 'http://www.southparkstudios.com/feeds/video-player/mrss'
  
@@ -14,7 +14,7 @@ class SouthParkStudiosIE(MTVIE):
          u'file': u'a7bff6c2-ed00-11e0-aca6-0026b9414f30.mp4',
          u'info_dict': {
              u'title': u'Bat Daded',
-            u'description': u'Randy finally gets the chance to fight Bat Dad and gets the boys disqualified from the season championships.',
+            u'description': u'Randy disqualifies South Park by getting into a fight with Bat Dad.',
          },
      }
  
@@ -31,8 +31,9 @@ class SouthParkStudiosIE(MTVIE):
  
      def _real_extract(self, url):
          mobj = re.match(self._VALID_URL, url)
+        url = u'http://www.' + mobj.group(u'url')
          video_id = mobj.group('id')
          webpage = self._download_webpage(url, video_id)
-        mgid = self._search_regex(r'data-mgid="(mgid:.*?)"',
+        mgid = self._search_regex(r'swfobject.embedSWF\(".*?(mgid:.*?)"',
                                    webpage, u'mgid')
          return self._get_videos_info(mgid)