Merge pull request #2944 from pulpe/SWRMediathek

author Sergey M. <dstftw@gmail.com>

Thu, 22 May 2014 12:30:09 +0000 (19:30 +0700)

committer Sergey M. <dstftw@gmail.com>

Thu, 22 May 2014 12:30:09 +0000 (19:30 +0700)
author Sergey M. <dstftw@gmail.com>
Thu, 22 May 2014 12:30:09 +0000 (19:30 +0700)
committer Sergey M. <dstftw@gmail.com>
Thu, 22 May 2014 12:30:09 +0000 (19:30 +0700)
diff --git a/CHANGELOG b/CHANGELOG

deleted file mode 100644 (file)

index 3fa1167..0000000
--- a/CHANGELOG
+++ /dev/null
@@ -1,14 +0,0 @@
-2013.01.02  Codename: GIULIA
-
-    * Add support for ComedyCentral clips <nto>
-    * Corrected Vimeo description fetching <Nick Daniels>
-    * Added the --no-post-overwrites argument <Barbu Paul - Gheorghe>
-    * --verbose offers more environment info
-    * New info_dict field: uploader_id
-    * New updates system, with signature checking
-    * New IEs: NBA, JustinTV, FunnyOrDie, TweetReel, Steam, Ustream
-    * Fixed IEs: BlipTv
-    * Fixed for Python 3 IEs: Xvideo, Youku, XNXX, Dailymotion, Vimeo, InfoQ
-    * Simplified IEs and test code
-    * Various (Python 3 and other) fixes
-    * Revamped and expanded tests
diff --git a/youtube_dl/__init__.py b/youtube_dl/__init__.py

index 4e657e297d1a5ddb2aac4a448a8a94a0ac4cf180..cbb053e13f50f865a0cb3fe15891203b4d685ccc 100644 (file)
--- a/youtube_dl/__init__.py
+++ b/youtube_dl/__init__.py
@@ -56,6 +56,7 @@ __authors__  = (
      'Nicolas Évrard',
      'Jason Normore',
      'Hoje Lee',
+    'Adam Thalhammer',
  )
  
  __license__ = 'Public Domain'
diff --git a/youtube_dl/extractor/aftonbladet.py b/youtube_dl/extractor/aftonbladet.py

index 6a8cd14c90635f4e42ccc526de138f996853f5c9..cfc7370ae43da592eaca49245200bd922d75a019 100644 (file)
--- a/youtube_dl/extractor/aftonbladet.py
+++ b/youtube_dl/extractor/aftonbladet.py
@@ -1,7 +1,6 @@
  # encoding: utf-8
  from __future__ import unicode_literals
  
-import datetime
  import re
  
  from .common import InfoExtractor
@@ -16,6 +15,7 @@ class AftonbladetIE(InfoExtractor):
              'ext': 'mp4',
              'title': 'Vulkanutbrott i rymden - nu släpper NASA bilderna',
              'description': 'Jupiters måne mest aktiv av alla himlakroppar',
+            'timestamp': 1394142732,
              'upload_date': '20140306',
          },
      }
@@ -27,17 +27,17 @@ class AftonbladetIE(InfoExtractor):
          webpage = self._download_webpage(url, video_id)
  
          # find internal video meta data
-        META_URL = 'http://aftonbladet-play.drlib.aptoma.no/video/%s.json'
+        meta_url = 'http://aftonbladet-play.drlib.aptoma.no/video/%s.json'
          internal_meta_id = self._html_search_regex(
              r'data-aptomaId="([\w\d]+)"', webpage, 'internal_meta_id')
-        internal_meta_url = META_URL % internal_meta_id
+        internal_meta_url = meta_url % internal_meta_id
          internal_meta_json = self._download_json(
              internal_meta_url, video_id, 'Downloading video meta data')
  
          # find internal video formats
-        FORMATS_URL = 'http://aftonbladet-play.videodata.drvideo.aptoma.no/actions/video/?id=%s'
+        format_url = 'http://aftonbladet-play.videodata.drvideo.aptoma.no/actions/video/?id=%s'
          internal_video_id = internal_meta_json['videoId']
-        internal_formats_url = FORMATS_URL % internal_video_id
+        internal_formats_url = format_url % internal_video_id
          internal_formats_json = self._download_json(
              internal_formats_url, video_id, 'Downloading video formats')
  
@@ -54,16 +54,13 @@ class AftonbladetIE(InfoExtractor):
              })
          self._sort_formats(formats)
  
-        timestamp = datetime.datetime.fromtimestamp(internal_meta_json['timePublished'])
-        upload_date = timestamp.strftime('%Y%m%d')
-
          return {
              'id': video_id,
              'title': internal_meta_json['title'],
              'formats': formats,
              'thumbnail': internal_meta_json['imageUrl'],
              'description': internal_meta_json['shortPreamble'],
-            'upload_date': upload_date,
+            'timestamp': internal_meta_json['timePublished'],
              'duration': internal_meta_json['duration'],
              'view_count': internal_meta_json['views'],
          }
diff --git a/youtube_dl/extractor/bandcamp.py b/youtube_dl/extractor/bandcamp.py

index 929aafdff3e848af3295eacf1520ec0ec0334966..dcbbdef4346c36c789e49531df1dc602bc35255b 100644 (file)
--- a/youtube_dl/extractor/bandcamp.py
+++ b/youtube_dl/extractor/bandcamp.py
@@ -19,7 +19,7 @@ class BandcampIE(InfoExtractor):
          'md5': 'c557841d5e50261777a6585648adf439',
          'info_dict': {
              "title": "youtube-dl  \"'/\\\u00e4\u21ad - youtube-dl test song \"'/\\\u00e4\u21ad",
-            "duration": 10,
+            "duration": 9.8485,
          },
          '_skip': 'There is a limit of 200 free downloads / month for the test song'
      }]
@@ -28,36 +28,32 @@ class BandcampIE(InfoExtractor):
          mobj = re.match(self._VALID_URL, url)
          title = mobj.group('title')
          webpage = self._download_webpage(url, title)
-        # We get the link to the free download page
          m_download = re.search(r'freeDownloadPage: "(.*?)"', webpage)
-        if m_download is None:
+        if not m_download:
              m_trackinfo = re.search(r'trackinfo: (.+),\s*?\n', webpage)
              if m_trackinfo:
                  json_code = m_trackinfo.group(1)
-                data = json.loads(json_code)
-                d = data[0]
+                data = json.loads(json_code)[0]
  
-                duration = int(round(d['duration']))
                  formats = []
-                for format_id, format_url in d['file'].items():
-                    ext, _, abr_str = format_id.partition('-')
-
+                for format_id, format_url in data['file'].items():
+                    ext, abr_str = format_id.split('-', 1)
                      formats.append({
                          'format_id': format_id,
                          'url': format_url,
-                        'ext': format_id.partition('-')[0],
+                        'ext': ext,
                          'vcodec': 'none',
-                        'acodec': format_id.partition('-')[0],
-                        'abr': int(format_id.partition('-')[2]),
+                        'acodec': ext,
+                        'abr': int(abr_str),
                      })
  
                  self._sort_formats(formats)
  
                  return {
-                    'id': compat_str(d['id']),
-                    'title': d['title'],
+                    'id': compat_str(data['id']),
+                    'title': data['title'],
                      'formats': formats,
-                    'duration': duration,
+                    'duration': float(data['duration']),
                  }
              else:
                  raise ExtractorError('No free songs found')
@@ -67,11 +63,9 @@ class BandcampIE(InfoExtractor):
              r'var TralbumData = {(.*?)id: (?P<id>\d*?)$',
              webpage, re.MULTILINE | re.DOTALL).group('id')
  
-        download_webpage = self._download_webpage(download_link, video_id,
-                                                  'Downloading free downloads page')
-        # We get the dictionary of the track from some javascrip code
-        info = re.search(r'items: (.*?),$',
-                         download_webpage, re.MULTILINE).group(1)
+        download_webpage = self._download_webpage(download_link, video_id, 'Downloading free downloads page')
+        # We get the dictionary of the track from some javascript code
+        info = re.search(r'items: (.*?),$', download_webpage, re.MULTILINE).group(1)
          info = json.loads(info)[0]
          # We pick mp3-320 for now, until format selection can be easily implemented.
          mp3_info = info['downloads']['mp3-320']
@@ -100,7 +94,7 @@ class BandcampIE(InfoExtractor):
  
  class BandcampAlbumIE(InfoExtractor):
      IE_NAME = 'Bandcamp:album'
-    _VALID_URL = r'https?://(?:(?P<subdomain>[^.]+)\.)?bandcamp\.com(?:/album/(?P<title>[^?#]+))?'
+    _VALID_URL = r'https?://(?:(?P<subdomain>[^.]+)\.)?bandcamp\.com(?:/album/(?P<title>[^?#]+))'
  
      _TEST = {
          'url': 'http://blazo.bandcamp.com/album/jazz-format-mixtape-vol-1',
@@ -123,7 +117,7 @@ class BandcampAlbumIE(InfoExtractor):
          'params': {
              'playlistend': 2
          },
-        'skip': 'Bancamp imposes download limits. See test_playlists:test_bandcamp_album for the playlist test'
+        'skip': 'Bandcamp imposes download limits. See test_playlists:test_bandcamp_album for the playlist test'
      }
  
      def _real_extract(self, url):
diff --git a/youtube_dl/extractor/blinkx.py b/youtube_dl/extractor/blinkx.py

index 96408e4e093ba6b27b4da54248d436d162d3c40c..38ccd957f3eb61a761950bb9a70cdbbeec6bea6d 100644 (file)
--- a/youtube_dl/extractor/blinkx.py
+++ b/youtube_dl/extractor/blinkx.py
@@ -1,6 +1,5 @@
  from __future__ import unicode_literals
  
-import datetime
  import json
  import re
  
@@ -19,15 +18,16 @@ class BlinkxIE(InfoExtractor):
          'file': '8aQUy7GV.mp4',
          'md5': '2e9a07364af40163a908edbf10bb2492',
          'info_dict': {
-            "title": "Police Car Rolls Away",
-            "uploader": "stupidvideos.com",
-            "upload_date": "20131215",
-            "description": "A police car gently rolls away from a fight. Maybe it felt weird being around a confrontation and just had to get out of there!",
-            "duration": 14.886,
-            "thumbnails": [{
-                "width": 100,
-                "height": 76,
-                "url": "http://cdn.blinkx.com/stream/b/41/StupidVideos/20131215/1873969261/1873969261_tn_0.jpg",
+            'title': 'Police Car Rolls Away',
+            'uploader': 'stupidvideos.com',
+            'upload_date': '20131215',
+            'timestamp': 1387068000,
+            'description': 'A police car gently rolls away from a fight. Maybe it felt weird being around a confrontation and just had to get out of there!',
+            'duration': 14.886,
+            'thumbnails': [{
+                'width': 100,
+                'height': 76,
+                'url': 'http://cdn.blinkx.com/stream/b/41/StupidVideos/20131215/1873969261/1873969261_tn_0.jpg',
              }],
          },
      }
@@ -41,9 +41,6 @@ class BlinkxIE(InfoExtractor):
                     'video=%s' % video_id)
          data_json = self._download_webpage(api_url, display_id)
          data = json.loads(data_json)['api']['results'][0]
-        dt = datetime.datetime.fromtimestamp(data['pubdate_epoch'])
-        pload_date = dt.strftime('%Y%m%d')
-
          duration = None
          thumbnails = []
          formats = []
@@ -64,10 +61,7 @@ class BlinkxIE(InfoExtractor):
                  vcodec = remove_start(m['vcodec'], 'ff')
                  acodec = remove_start(m['acodec'], 'ff')
                  tbr = (int(m['vbr']) + int(m['abr'])) // 1000
-                format_id = (u'%s-%sk-%s' %
-                             (vcodec,
-                              tbr,
-                              m['w']))
+                format_id = u'%s-%sk-%s' % (vcodec, tbr, m['w'])
                  formats.append({
                      'format_id': format_id,
                      'url': m['link'],
@@ -88,7 +82,7 @@ class BlinkxIE(InfoExtractor):
              'title': data['title'],
              'formats': formats,
              'uploader': data['channel_name'],
-            'upload_date': pload_date,
+            'timestamp': data['pubdate_epoch'],
              'description': data.get('description'),
              'thumbnails': thumbnails,
              'duration': duration,
diff --git a/youtube_dl/extractor/gamekings.py b/youtube_dl/extractor/gamekings.py

index 2333989665520b8e35728705255b246ea93decac..11fee3d31e88833b8074a1b59cff885eeffa46d3 100644 (file)
--- a/youtube_dl/extractor/gamekings.py
+++ b/youtube_dl/extractor/gamekings.py
@@ -15,7 +15,7 @@ class GamekingsIE(InfoExtractor):
              'id': '20130811',
              'ext': 'mp4',
              'title': 'Phoenix Wright: Ace Attorney \u2013 Dual Destinies Review',
-            'description': 'md5:632e61a9f97d700e83f43d77ddafb6a4',
+            'description': 'md5:36fd701e57e8c15ac8682a2374c99731',
          }
      }
  
diff --git a/youtube_dl/extractor/generic.py b/youtube_dl/extractor/generic.py

index 0e5cf0efbd0867e0daeb06992e561eefc5262326..38a357d3b0406906144e25cbbc45fbe74d2f6c2c 100644 (file)
--- a/youtube_dl/extractor/generic.py
+++ b/youtube_dl/extractor/generic.py
@@ -363,8 +363,13 @@ class GenericIE(InfoExtractor):
                      return self.url_result('http://' + url)
                  else:
                      if default_search == 'auto_warning':
-                        self._downloader.report_warning(
-                            'Falling back to youtube search for  %s . Set --default-search to "auto" to suppress this warning.' % url)
+                        if re.match(r'^(?:url|URL)$', url):
+                            raise ExtractorError(
+                                'Invalid URL:  %r . Call youtube-dl like this:  youtube-dl -v "https://www.youtube.com/watch?v=BaW_jenozKc"  ' % url,
+                                expected=True)
+                        else:
+                            self._downloader.report_warning(
+                                'Falling back to youtube search for  %s . Set --default-search to "auto" to suppress this warning.' % url)
                      return self.url_result('ytsearch:' + url)
              else:
                  assert ':' in default_search
diff --git a/youtube_dl/extractor/mailru.py b/youtube_dl/extractor/mailru.py

index f819c09b348550c878616151ace346ac1a7ab3a4..5016989cc9504ef1071b4816514e0924242f1602 100644 (file)
--- a/youtube_dl/extractor/mailru.py
+++ b/youtube_dl/extractor/mailru.py
@@ -2,7 +2,6 @@
  from __future__ import unicode_literals
  
  import re
-import datetime
  
  from .common import InfoExtractor
  
@@ -19,6 +18,7 @@ class MailRuIE(InfoExtractor):
              'id': '46301138',
              'ext': 'mp4',
              'title': 'Новый Человек-Паук. Высокое напряжение. Восстание Электро',
+            'timestamp': 1393232740,
              'upload_date': '20140224',
              'uploader': 'sonypicturesrus',
              'uploader_id': 'sonypicturesrus@mail.ru',
@@ -43,7 +43,6 @@ class MailRuIE(InfoExtractor):
          thumbnail = movie['poster']
          duration = movie['duration']
  
-        upload_date = datetime.datetime.fromtimestamp(video_data['timestamp']).strftime('%Y%m%d')
          view_count = video_data['views_count']
  
          formats = [
@@ -57,7 +56,7 @@ class MailRuIE(InfoExtractor):
              'id': content_id,
              'title': title,
              'thumbnail': thumbnail,
-            'upload_date': upload_date,
+            'timestamp': video_data['timestamp'],
              'uploader': uploader,
              'uploader_id': uploader_id,
              'duration': duration,
diff --git a/youtube_dl/extractor/nowness.py b/youtube_dl/extractor/nowness.py

index b1bcb7e54cf3f01989eb17c51160acce680eed2c..1c5e9401f36c72a73a701bdffc89529979a1eaaf 100644 (file)
--- a/youtube_dl/extractor/nowness.py
+++ b/youtube_dl/extractor/nowness.py
@@ -4,9 +4,7 @@ import re
  
  from .brightcove import BrightcoveIE
  from .common import InfoExtractor
-from ..utils import (
-    ExtractorError,
-)
+from ..utils import ExtractorError
  
  
  class NownessIE(InfoExtractor):
@@ -14,9 +12,10 @@ class NownessIE(InfoExtractor):
  
      _TEST = {
          'url': 'http://www.nowness.com/day/2013/6/27/3131/candor--the-art-of-gesticulation',
-        'file': '2520295746001.mp4',
-        'md5': '0ece2f70a7bd252c7b00f3070182d418',
+        'md5': '068bc0202558c2e391924cb8cc470676',
          'info_dict': {
+            'id': '2520295746001',
+            'ext': 'mp4',
              'description': 'Candor: The Art of Gesticulation',
              'uploader': 'Nowness',
              'title': 'Candor: The Art of Gesticulation',
diff --git a/youtube_dl/version.py b/youtube_dl/version.py

index 3193fd152cc7dda04ae2f4bfc20732f0cc2513e9..638ff8af5ae995a5ebe7a5d4171a7c02ab0feec4 100644 (file)
--- a/youtube_dl/version.py
+++ b/youtube_dl/version.py
@@ -1,2 +1,2 @@
  
-__version__ = '2014.05.17'
+__version__ = '2014.05.19'
author	Sergey M. <dstftw@gmail.com>
	Thu, 22 May 2014 12:30:09 +0000 (19:30 +0700)
committer	Sergey M. <dstftw@gmail.com>
	Thu, 22 May 2014 12:30:09 +0000 (19:30 +0700)
CHANGELOG	[deleted file]	patch | blob | history
youtube_dl/__init__.py		patch | blob | history
youtube_dl/extractor/aftonbladet.py		patch | blob | history
youtube_dl/extractor/bandcamp.py		patch | blob | history
youtube_dl/extractor/blinkx.py		patch | blob | history
youtube_dl/extractor/gamekings.py		patch | blob | history
youtube_dl/extractor/generic.py		patch | blob | history
youtube_dl/extractor/mailru.py		patch | blob | history
youtube_dl/extractor/nowness.py		patch | blob | history
youtube_dl/version.py		patch | blob | history