Merge pull request #1620 from jaimeMF/console_script

[youtube-dl] / youtube_dl / extractor / common.py
diff --git a/youtube_dl/extractor/common.py b/youtube_dl/extractor/common.py

index 69cdcdc1b5b75d1cac5733b34565f087c9dcddec..aaa5c24c8565fffb85295188daf7bbd52f5aae89 100644 (file)
--- a/youtube_dl/extractor/common.py
+++ b/youtube_dl/extractor/common.py
@@ -14,6 +14,7 @@ from ..utils import (
      clean_html,
      compiled_regex_type,
      ExtractorError,
+    RegexNotFoundError,
      unescapeHTML,
  )
  
@@ -54,15 +55,19 @@ class InfoExtractor(object):
      view_count:     How many users have watched the video on the platform.
      urlhandle:      [internal] The urlHandle to be used to download the file,
                      like returned by urllib.request.urlopen
+    age_limit:      Age restriction for the video, as an integer (years)
      formats:        A list of dictionaries for each format available, it must
                      be ordered from worst to best quality. Potential fields:
                      * url       Mandatory. The URL of the video file
                      * ext       Will be calculated from url if missing
                      * format    A human-readable description of the format
                                  ("mp4 container with h264/opus").
-                                Calculated from width and height if missing.
+                                Calculated from the format_id, width, height 
+                                and format_note fields if missing.
                      * format_id A short description of the format
                                  ("mp4_h264_opus" or "19")
+                    * format_note Additional info about the format
+                                ("3D" or "DASH video")
                      * width     Width of the video, if known
                      * height    Height of the video, if known
  
@@ -227,7 +232,7 @@ class InfoExtractor(object):
          Perform a regex search on the given string, using a single or a list of
          patterns returning the first matching group.
          In case of failure return a default value or raise a WARNING or a
-        ExtractorError, depending on fatal, specifying the field name.
+        RegexNotFoundError, depending on fatal, specifying the field name.
          """
          if isinstance(pattern, (str, compat_str, compiled_regex_type)):
              mobj = re.search(pattern, string, flags)
@@ -247,7 +252,7 @@ class InfoExtractor(object):
          elif default is not None:
              return default
          elif fatal:
-            raise ExtractorError(u'Unable to extract %s' % _name)
+            raise RegexNotFoundError(u'Unable to extract %s' % _name)
          else:
              self._downloader.report_warning(u'unable to extract %s; '
                  u'please report this issue on http://yt-dl.org/bug' % _name)
@@ -318,6 +323,15 @@ class InfoExtractor(object):
                                          self._og_regex('video')],
                                         html, name, **kargs)
  
+    def _rta_search(self, html):
+        # See http://www.rtalabel.org/index.php?content=howtofaq#single
+        if re.search(r'(?ix)<meta\s+name="rating"\s+'
+                     r'     content="RTA-5042-1996-1400-1577-RTA"',
+                     html):
+            return 18
+        return 0
+
+
  class SearchInfoExtractor(InfoExtractor):
      """
      Base class for paged search queries extractors.
@@ -355,7 +369,7 @@ class SearchInfoExtractor(InfoExtractor):
  
      def _get_n_results(self, query, n):
          """Get a specified number of results for a query"""
-        raise NotImplementedError("This method must be implemented by sublclasses")
+        raise NotImplementedError("This method must be implemented by subclasses")
  
      @property
      def SEARCH_KEY(self):