From: Philipp Hagemeister <phihag@phihag.de>
Date: Wed, 4 Dec 2013 18:56:05 +0000 (+0100)
Subject: Merge remote-tracking branch 'dstftw/correct-valid-urls'
X-Git-Url: http://git.bitcoin.ninja/index.cgi?a=commitdiff_plain;h=29030c0a4c2f4dded5a310add940aae0791f9d73;hp=-c;p=youtube-dl

Merge remote-tracking branch 'dstftw/correct-valid-urls'
---

29030c0a4c2f4dded5a310add940aae0791f9d73
diff --combined youtube_dl/extractor/appletrailers.py
index 4befff394,5b522552a..a527f10de
--- a/youtube_dl/extractor/appletrailers.py
+++ b/youtube_dl/extractor/appletrailers.py
@@@ -10,7 -10,7 +10,7 @@@ from ..utils import 
  
  
  class AppleTrailersIE(InfoExtractor):
-     _VALID_URL = r'https?://(?:www\.)?trailers.apple.com/trailers/(?P<company>[^/]+)/(?P<movie>[^/]+)'
+     _VALID_URL = r'https?://(?:www\.)?trailers\.apple\.com/trailers/(?P<company>[^/]+)/(?P<movie>[^/]+)'
      _TEST = {
          u"url": u"http://trailers.apple.com/trailers/wb/manofsteel/",
          u"playlist": [
@@@ -113,7 -113,7 +113,7 @@@
                  })
              formats = sorted(formats, key=lambda f: (f['height'], f['width']))
  
 -            info = {
 +            playlist.append({
                  '_type': 'video',
                  'id': video_id,
                  'title': title,
@@@ -124,7 -124,12 +124,7 @@@
                  'upload_date': upload_date,
                  'uploader_id': uploader_id,
                  'user_agent': 'QuickTime compatible (youtube-dl)',
 -            }
 -            # TODO: Remove when #980 has been merged
 -            info['url'] = formats[-1]['url']
 -            info['ext'] = formats[-1]['ext']
 -
 -            playlist.append(info)
 +            })
  
          return {
              '_type': 'playlist',
diff --combined youtube_dl/extractor/archiveorg.py
index 3ae0aebb1,a8394bfb0..8bb546410
--- a/youtube_dl/extractor/archiveorg.py
+++ b/youtube_dl/extractor/archiveorg.py
@@@ -11,7 -11,7 +11,7 @@@ from ..utils import 
  class ArchiveOrgIE(InfoExtractor):
      IE_NAME = 'archive.org'
      IE_DESC = 'archive.org videos'
-     _VALID_URL = r'(?:https?://)?(?:www\.)?archive.org/details/(?P<id>[^?/]+)(?:[?].*)?$'
+     _VALID_URL = r'(?:https?://)?(?:www\.)?archive\.org/details/(?P<id>[^?/]+)(?:[?].*)?$'
      _TEST = {
          u"url": u"http://archive.org/details/XD300-23_68HighlightsAResearchCntAugHumanIntellect",
          u'file': u'XD300-23_68HighlightsAResearchCntAugHumanIntellect.ogv',
@@@ -49,7 -49,7 +49,7 @@@
          for f in formats:
              f['ext'] = determine_ext(f['url'])
  
 -        info = {
 +        return {
              '_type': 'video',
              'id': video_id,
              'title': title,
@@@ -57,5 -57,12 +57,5 @@@
              'description': description,
              'uploader': uploader,
              'upload_date': upload_date,
 +            'thumbnail': data.get('misc', {}).get('image'),
          }
 -        thumbnail = data.get('misc', {}).get('image')
 -        if thumbnail:
 -            info['thumbnail'] = thumbnail
 -
 -        # TODO: Remove when #980 has been merged
 -        info.update(formats[-1])
 -
 -        return info
diff --combined youtube_dl/extractor/comedycentral.py
index 53579aa27,caea446ea..a54ce3ee7
--- a/youtube_dl/extractor/comedycentral.py
+++ b/youtube_dl/extractor/comedycentral.py
@@@ -1,7 -1,7 +1,7 @@@
  import re
  
  from .common import InfoExtractor
 -from .mtv import MTVIE, _media_xml_tag
 +from .mtv import MTVServicesInfoExtractor
  from ..utils import (
      compat_str,
      compat_urllib_parse,
@@@ -11,8 -11,8 +11,8 @@@
  )
  
  
 -class ComedyCentralIE(MTVIE):
 -    _VALID_URL = r'https?://(?:www\.)?comedycentral\.com/(video-clips|episodes|cc-studios)/(?P<title>.*)'
 +class ComedyCentralIE(MTVServicesInfoExtractor):
-     _VALID_URL = r'http://www.comedycentral.com/(video-clips|episodes|cc-studios)/(?P<title>.*)'
++    _VALID_URL = r'https?://(?:www.)?comedycentral.com/(video-clips|episodes|cc-studios)/(?P<title>.*)'
      _FEED_URL = u'http://comedycentral.com/feeds/mrss/'
  
      _TEST = {
@@@ -25,6 -25,12 +25,6 @@@
              u'description': u'After a certain point, breastfeeding becomes c**kblocking.',
          },
      }
 -    # Overwrite MTVIE properties we don't want
 -    _TESTS = []
 -
 -    def _get_thumbnail_url(self, uri, itemdoc):
 -        search_path = '%s/%s' % (_media_xml_tag('group'), _media_xml_tag('thumbnail'))
 -        return itemdoc.find(search_path).attrib['url']
  
      def _real_extract(self, url):
          mobj = re.match(self._VALID_URL, url)
@@@ -191,7 -197,7 +191,7 @@@ class ComedyCentralShowsIE(InfoExtracto
                  })
  
              effTitle = showId + u'-' + epTitle + u' part ' + compat_str(partNum+1)
 -            info = {
 +            results.append({
                  'id': shortMediaId,
                  'formats': formats,
                  'uploader': showId,
@@@ -199,6 -205,11 +199,6 @@@
                  'title': effTitle,
                  'thumbnail': None,
                  'description': compat_str(officialTitle),
 -            }
 -
 -            # TODO: Remove when #980 has been merged
 -            info.update(info['formats'][-1])
 -
 -            results.append(info)
 +            })
  
          return results
diff --combined youtube_dl/extractor/dreisat.py
index 24ce79425,008c99699..cb7226f82
--- a/youtube_dl/extractor/dreisat.py
+++ b/youtube_dl/extractor/dreisat.py
@@@ -11,7 -11,7 +11,7 @@@ from ..utils import 
  
  class DreiSatIE(InfoExtractor):
      IE_NAME = '3sat'
-     _VALID_URL = r'(?:http://)?(?:www\.)?3sat.de/mediathek/index.php\?(?:(?:mode|display)=[^&]+&)*obj=(?P<id>[0-9]+)$'
+     _VALID_URL = r'(?:http://)?(?:www\.)?3sat\.de/mediathek/index\.php\?(?:(?:mode|display)=[^&]+&)*obj=(?P<id>[0-9]+)$'
      _TEST = {
          u"url": u"http://www.3sat.de/mediathek/index.php?obj=36983",
          u'file': u'36983.webm',
@@@ -65,7 -65,7 +65,7 @@@
              return (qidx, prefer_http, format['video_bitrate'])
          formats.sort(key=_sortkey)
  
 -        info = {
 +        return {
              '_type': 'video',
              'id': video_id,
              'title': video_title,
@@@ -76,3 -76,8 +76,3 @@@
              'uploader': video_uploader,
              'upload_date': upload_date,
          }
 -
 -        # TODO: Remove when #980 has been merged
 -        info.update(formats[-1])
 -
 -        return info
diff --combined youtube_dl/extractor/faz.py
index d0dfde694,615674baf..c6ab6952e
--- a/youtube_dl/extractor/faz.py
+++ b/youtube_dl/extractor/faz.py
@@@ -9,7 -9,7 +9,7 @@@ from ..utils import 
  
  class FazIE(InfoExtractor):
      IE_NAME = u'faz.net'
-     _VALID_URL = r'https?://www\.faz\.net/multimedia/videos/.*?-(?P<id>\d+).html'
+     _VALID_URL = r'https?://www\.faz\.net/multimedia/videos/.*?-(?P<id>\d+)\.html'
  
      _TEST = {
          u'url': u'http://www.faz.net/multimedia/videos/stockholm-chemie-nobelpreis-fuer-drei-amerikanische-forscher-12610585.html',
@@@ -44,10 -44,13 +44,10 @@@
              })
  
          descr = self._html_search_regex(r'<p class="Content Copy">(.*?)</p>', webpage, u'description')
 -        info = {
 +        return {
              'id': video_id,
              'title': self._og_search_title(webpage),
              'formats': formats,
              'description': descr,
              'thumbnail': config.find('STILL/STILL_BIG').text,
          }
 -        # TODO: Remove when #980 has been merged
 -        info.update(formats[-1])
 -        return info
diff --combined youtube_dl/extractor/gametrailers.py
index 3a8bef250,88f656031..d82a5d4b2
--- a/youtube_dl/extractor/gametrailers.py
+++ b/youtube_dl/extractor/gametrailers.py
@@@ -1,11 -1,13 +1,10 @@@
  import re
  
 -from .mtv import MTVIE, _media_xml_tag
 +from .mtv import MTVServicesInfoExtractor
  
 -class GametrailersIE(MTVIE):
 -    """
 -    Gametrailers use the same videos system as MTVIE, it just changes the feed
 -    url, where the uri is and the method to get the thumbnails.
 -    """
 +
 +class GametrailersIE(MTVServicesInfoExtractor):
-     _VALID_URL = r'http://www.gametrailers.com/(?P<type>videos|reviews|full-episodes)/(?P<id>.*?)/(?P<title>.*)'
- 
+     _VALID_URL = r'http://www\.gametrailers\.com/(?P<type>videos|reviews|full-episodes)/(?P<id>.*?)/(?P<title>.*)'
      _TEST = {
          u'url': u'http://www.gametrailers.com/videos/zbvr8i/mirror-s-edge-2-e3-2013--debut-trailer',
          u'file': u'70e9a5d7-cf25-4a10-9104-6f3e7342ae0d.mp4',
@@@ -15,9 -17,15 +14,9 @@@
              u'description': u'Faith is back!  Check out the World Premiere trailer for Mirror\'s Edge 2 straight from the EA Press Conference at E3 2013!',
          },
      }
 -    # Overwrite MTVIE properties we don't want
 -    _TESTS = []
  
      _FEED_URL = 'http://www.gametrailers.com/feeds/mrss'
  
 -    def _get_thumbnail_url(self, uri, itemdoc):
 -        search_path = '%s/%s' % (_media_xml_tag('group'), _media_xml_tag('thumbnail'))
 -        return itemdoc.find(search_path).attrib['url']
 -
      def _real_extract(self, url):
          mobj = re.match(self._VALID_URL, url)
          video_id = mobj.group('id')
diff --combined youtube_dl/extractor/viddler.py
index 75335dfb8,36d1bde08..138a35b2a
--- a/youtube_dl/extractor/viddler.py
+++ b/youtube_dl/extractor/viddler.py
@@@ -8,7 -8,7 +8,7 @@@ from ..utils import 
  
  
  class ViddlerIE(InfoExtractor):
-     _VALID_URL = r'(?P<domain>https?://(?:www\.)?viddler.com)/(?:v|embed|player)/(?P<id>[a-z0-9]+)'
+     _VALID_URL = r'(?P<domain>https?://(?:www\.)?viddler\.com)/(?:v|embed|player)/(?P<id>[a-z0-9]+)'
      _TEST = {
          u"url": u"http://www.viddler.com/v/43903784",
          u'file': u'43903784.mp4',
@@@ -47,7 -47,7 +47,7 @@@
              r"thumbnail\s*:\s*'([^']*)'",
              webpage, u'thumbnail', fatal=False)
  
 -        info = {
 +        return {
              '_type': 'video',
              'id': video_id,
              'title': title,
@@@ -56,3 -56,9 +56,3 @@@
              'duration': duration,
              'formats': formats,
          }
 -
 -        # TODO: Remove when #980 has been merged
 -        info['formats'][-1]['ext'] = determine_ext(info['formats'][-1]['url'])
 -        info.update(info['formats'][-1])
 -
 -        return info