Merge remote-tracking branch 'origin/master'
author Philipp Hagemeister <phihag@phihag.de>
Mon, 28 Oct 2013 09:44:13 +0000 (10:44 +0100)
committer Philipp Hagemeister <phihag@phihag.de>
Mon, 28 Oct 2013 09:44:13 +0000 (10:44 +0100)
1  2 
youtube_dl/extractor/common.py

index 458635f1e99392cd05895d6f66b89ef1a5379ba8,8b067b48d7d81d5fb2ab102ea745695183c2be30..ce349fe207af21690c95b86dd7a293220ac7025e
@@@ -15,7 -15,6 +15,7 @@@ from ..utils import 
      compiled_regex_type,
      ExtractorError,
      RegexNotFoundError,
 +    sanitize_filename,
      unescapeHTML,
  )
  
@@@ -183,17 -182,6 +183,17 @@@ class InfoExtractor(object)
              self.to_screen(u'Dumping request to ' + url)
              dump = base64.b64encode(webpage_bytes).decode('ascii')
              self._downloader.to_screen(dump)
 +        if self._downloader.params.get('write_pages', False):
 +            try:
 +                url = url_or_request.get_full_url()
 +            except AttributeError:
 +                url = url_or_request
 +            raw_filename = ('%s_%s.dump' % (video_id, url))
 +            filename = sanitize_filename(raw_filename, restricted=True)
 +            self.to_screen(u'Saving request to ' + filename)
 +            with open(filename, 'wb') as outf:
 +                outf.write(webpage_bytes)
 +
          content = webpage_bytes.decode(encoding, 'replace')
          return (content, urlh)
  
      def _og_search_title(self, html, **kargs):
          return self._og_search_property('title', html, **kargs)
  
-     def _og_search_video_url(self, html, name='video url', **kargs):
-         return self._html_search_regex([self._og_regex('video:secure_url'),
-                                         self._og_regex('video')],
-                                        html, name, **kargs)
+     def _og_search_video_url(self, html, name='video url', secure=True, **kargs):
+         regexes = [self._og_regex('video')]
+         if secure: regexes.insert(0, self._og_regex('video:secure_url'))
+         return self._html_search_regex(regexes, html, name, **kargs)
  
      def _rta_search(self, html):
          # See http://www.rtalabel.org/index.php?content=howtofaq#single