[nowtv] Fix extraction (Closes #6169)

[youtube-dl] / youtube_dl / extractor / snagfilms.py
diff --git a/youtube_dl/extractor/snagfilms.py b/youtube_dl/extractor/snagfilms.py

index f04ca60369410b1435eee232c382ef22ecf96a1c..cf495f31066b6d26a30662742cd95a6cfada24c9 100644 (file)
--- a/youtube_dl/extractor/snagfilms.py
+++ b/youtube_dl/extractor/snagfilms.py
@@ -4,6 +4,7 @@ import re
  
  from .common import InfoExtractor
  from ..utils import (
+    ExtractorError,
      clean_html,
      determine_ext,
      int_or_none,
@@ -30,7 +31,8 @@ class SnagFilmsEmbedIE(InfoExtractor):
      @staticmethod
      def _extract_url(webpage):
          mobj = re.search(
-            r'<iframe[^>]+?src=(["\'])(?P<url>(?:https?:)?//(?:embed\.)?snagfilms\.com/embed/player.+?)\1', webpage)
+            r'<iframe[^>]+?src=(["\'])(?P<url>(?:https?:)?//(?:embed\.)?snagfilms\.com/embed/player.+?)\1',
+            webpage)
          if mobj:
              return mobj.group('url')
  
@@ -39,6 +41,10 @@ class SnagFilmsEmbedIE(InfoExtractor):
  
          webpage = self._download_webpage(url, video_id)
  
+        if '>This film is not playable in your area.<' in webpage:
+            raise ExtractorError(
+                'Film %s is not playable in your area.' % video_id, expected=True)
+
          formats = []
          for source in self._parse_json(js_to_json(self._search_regex(
                  r'(?s)sources:\s*(\[.+?\]),', webpage, 'json')), video_id):
@@ -103,6 +109,14 @@ class SnagFilmsIE(InfoExtractor):
              'duration': 979,
              'categories': ['Documentary', 'Sports', 'Politics']
          }
+    }, {
+        # Film is not playable in your area.
+        'url': 'http://www.snagfilms.com/films/title/inside_mecca',
+        'only_matching': True,
+    }, {
+        # Film is not available.
+        'url': 'http://www.snagfilms.com/show/augie_alone/flirting',
+        'only_matching': True,
      }]
  
      def _real_extract(self, url):
@@ -110,6 +124,10 @@ class SnagFilmsIE(InfoExtractor):
  
          webpage = self._download_webpage(url, display_id)
  
+        if ">Sorry, the Film you're looking for is not available.<" in webpage:
+            raise ExtractorError(
+                'Film %s is not available.' % display_id, expected=True)
+
          film_id = self._search_regex(r'filmId=([\da-f-]{36})"', webpage, 'film id')
  
          snag = self._parse_json(