Merge remote-tracking branch 'dstftw/smotri.com-broadcast'
author Philipp Hagemeister <phihag@phihag.de>
Mon, 9 Dec 2013 03:42:35 +0000 (04:42 +0100)
committer Philipp Hagemeister <phihag@phihag.de>
Mon, 9 Dec 2013 03:42:35 +0000 (04:42 +0100)
Conflicts:
youtube_dl/FileDownloader.py
youtube_dl/extractor/smotri.py

1  2 
youtube_dl/FileDownloader.py
youtube_dl/extractor/__init__.py
youtube_dl/extractor/smotri.py

index 8f95775125e7e09566c4747a65c9cc0d47576216,de1dc66bb4cdd8d43cfb3feecaf1d3e04f4b313f..47124932fc7e9ff3c40ec29d003757cdb20cf967
@@@ -204,27 -204,11 +204,27 @@@ class FileDownloader(object)
          """Report destination filename."""
          self.to_screen(u'[download] Destination: ' + filename)
  
 +    def _report_progress_status(self, msg, is_last_line=False):
 +        fullmsg = u'[download] ' + msg
 +        if self.params.get('progress_with_newline', False):
 +            self.to_screen(fullmsg)
 +        else:
 +            if os.name == 'nt':
 +                prev_len = getattr(self, '_report_progress_prev_line_length',
 +                                   0)
 +                if prev_len > len(fullmsg):
 +                    fullmsg += u' ' * (prev_len - len(fullmsg))
 +                self._report_progress_prev_line_length = len(fullmsg)
 +                clear_line = u'\r'
 +            else:
 +                clear_line = (u'\r\x1b[K' if sys.stderr.isatty() else u'\r')
 +            self.to_screen(clear_line + fullmsg, skip_eol=not is_last_line)
 +        self.to_console_title(u'youtube-dl ' + msg)
 +
      def report_progress(self, percent, data_len_str, speed, eta):
          """Report download progress."""
          if self.params.get('noprogress', False):
              return
 -        clear_line = (u'\x1b[K' if sys.stderr.isatty() and os.name != 'nt' else u'')
          if eta is not None:
              eta_str = self.format_eta(eta)
          else:
          else:
              percent_str = 'Unknown %'
          speed_str = self.format_speed(speed)
 -        if self.params.get('progress_with_newline', False):
 -            self.to_screen(u'[download] %s of %s at %s ETA %s' %
 -                (percent_str, data_len_str, speed_str, eta_str))
 -        else:
 -            self.to_screen(u'\r%s[download] %s of %s at %s ETA %s' %
 -                (clear_line, percent_str, data_len_str, speed_str, eta_str), skip_eol=True)
 -        self.to_console_title(u'youtube-dl - %s of %s at %s ETA %s' %
 -                (percent_str.strip(), data_len_str.strip(), speed_str.strip(), eta_str.strip()))
 -        
 +
 +        msg = (u'%s of %s at %s ETA %s' %
 +               (percent_str, data_len_str, speed_str, eta_str))
 +        self._report_progress_status(msg)
 +
+     def report_progress_live_stream(self, downloaded_data_len, speed, elapsed):
+         if self.params.get('noprogress', False):
+             return
 -        clear_line = (u'\x1b[K' if sys.stderr.isatty() and os.name != 'nt' else u'')
+         downloaded_str = format_bytes(downloaded_data_len)
+         speed_str = self.format_speed(speed)
+         elapsed_str = FileDownloader.format_seconds(elapsed)
 -        if self.params.get('progress_with_newline', False):
 -            self.to_screen(u'[download] %s at %s' %
 -                (downloaded_str, speed_str))
++        msg = u'%s at %s (%s)' % (downloaded_str, speed_str, elapsed_str)
++        self._report_progress_status(msg)
++
 +    def report_finish(self, data_len_str, tot_time):
 +        """Report download finished."""
 +        if self.params.get('noprogress', False):
 +            self.to_screen(u'[download] Download completed')
          else:
 -            self.to_screen(u'\r%s[download] %s at %s ET %s' %
 -                (clear_line, downloaded_str, speed_str, elapsed_str), skip_eol=True)
 -        self.to_console_title(u'youtube-dl - %s at %s ET %s' %
 -                (downloaded_str.strip(), speed_str.strip(), elapsed_str.strip())) 
 +            self._report_progress_status(
 +                (u'100%% of %s in %s' %
 +                 (data_len_str, self.format_seconds(tot_time))),
 +                is_last_line=True)
  
      def report_resuming_byte(self, resume_len):
          """Report attempt to resume at given byte."""
          """Report it was impossible to resume download."""
          self.to_screen(u'[download] Unable to resume')
  
-     def _download_with_rtmpdump(self, filename, url, player_url, page_url, play_path, tc_url, live):
 -    def report_finish(self, data_len_str, tot_time):
 -        """Report download finished."""
 -        if self.params.get('noprogress', False):
 -            self.to_screen(u'[download] Download completed')
 -        else:
 -            clear_line = (u'\x1b[K' if sys.stderr.isatty() and os.name != 'nt' else u'')
 -            self.to_screen(u'\r%s[download] 100%% of %s in %s' %
 -                (clear_line, data_len_str, self.format_seconds(tot_time)))
 -
+     def _download_with_rtmpdump(self, filename, url, player_url, page_url, play_path, tc_url, live, conn):
          def run_rtmpdump(args):
              start = time.time()
              resume_percent = None
                          'eta': eta,
                          'speed': speed,
                      })
-                 elif self.params.get('verbose', False):
-                     if not cursor_in_new_line:
-                         self.to_screen(u'')
-                     cursor_in_new_line = True
-                     self.to_screen(u'[rtmpdump] '+line)
+                 else:
+                     # no percent for live streams
+                     mobj = re.search(r'([0-9]+\.[0-9]{3}) kB / [0-9]+\.[0-9]{2} sec', line)
+                     if mobj:
+                         downloaded_data_len = int(float(mobj.group(1))*1024)
+                         time_now = time.time()
+                         speed = self.calc_speed(start, time_now, downloaded_data_len)
+                         self.report_progress_live_stream(downloaded_data_len, speed, time_now - start)
+                         cursor_in_new_line = False
+                         self._hook_progress({
+                             'downloaded_bytes': downloaded_data_len,
+                             'tmpfilename': tmpfilename,
+                             'filename': filename,
+                             'status': 'downloading',
+                             'speed': speed,
+                         })
+                     elif self.params.get('verbose', False):
+                         if not cursor_in_new_line:
+                             self.to_screen(u'')
+                         cursor_in_new_line = True
+                         self.to_screen(u'[rtmpdump] '+line)
              proc.wait()
              if not cursor_in_new_line:
                  self.to_screen(u'')
              basic_args += ['--stop', '1']
          if live:
              basic_args += ['--live']
+         if conn:
+             basic_args += ['--conn', conn]
          args = basic_args + [[], ['--resume', '--skip', '1']][self.params.get('continuedl', False)]
  
          if sys.platform == 'win32' and sys.version_info < (3, 0):
                                                  info_dict.get('page_url', None),
                                                  info_dict.get('play_path', None),
                                                  info_dict.get('tc_url', None),
-                                                 info_dict.get('rtmp_live', False))
+                                                 info_dict.get('rtmp_live', False),
+                                                 info_dict.get('rtmp_conn', None))
  
          # Attempt to download using mplayer
          if url.startswith('mms') or url.startswith('rtsp'):
index 7ecafb10470d4cdc99623f98853c885566b4f8c6,60e2d6ebde32127fdb52c89d5f8a5f9d7be84f66..2b78cc84dc09e5d67f609d9c29ccf48d71be3e5b
@@@ -8,7 -8,6 +8,7 @@@ from .arte import 
      ArteTVPlus7IE,
      ArteTVCreativeIE,
      ArteTVFutureIE,
 +    ArteTVDDCIE,
  )
  from .auengine import AUEngineIE
  from .bambuser import BambuserIE, BambuserChannelIE
@@@ -57,7 -56,7 +57,7 @@@ from .flickr import FlickrI
  from .francetv import (
      PluzzIE,
      FranceTvInfoIE,
 -    France2IE,
 +    FranceTVIE,
      GenerationQuoiIE
  )
  from .freesound import FreesoundIE
@@@ -103,7 -102,6 +103,7 @@@ from .nbc import NBCNewsI
  from .newgrounds import NewgroundsIE
  from .nhl import NHLIE, NHLVideocenterIE
  from .niconico import NiconicoIE
 +from .ninegag import NineGagIE
  from .nowvideo import NowVideoIE
  from .ooyala import OoyalaIE
  from .orf import ORFIE
@@@ -112,7 -110,6 +112,7 @@@ from .photobucket import PhotobucketI
  from .podomatic import PodomaticIE
  from .pornhub import PornHubIE
  from .pornotube import PornotubeIE
 +from .pyvideo import PyvideoIE
  from .rbmaradio import RBMARadioIE
  from .redtube import RedTubeIE
  from .ringtv import RingTVIE
@@@ -128,6 -125,7 +128,7 @@@ from .smotri import 
      SmotriIE,
      SmotriCommunityIE,
      SmotriUserIE,
+     SmotriBroadcastIE,
  )
  from .sohu import SohuIE
  from .soundcloud import SoundcloudIE, SoundcloudSetIE, SoundcloudUserIE
@@@ -147,7 -145,6 +148,7 @@@ from .teamcoco import TeamcocoI
  from .techtalks import TechTalksIE
  from .ted import TEDIE
  from .tf1 import TF1IE
 +from .theplatform import ThePlatformIE
  from .thisav import ThisAVIE
  from .toutv import TouTvIE
  from .traileraddict import TrailerAddictIE
@@@ -172,8 -169,6 +173,8 @@@ from .vimeo import 
      VimeoIE,
      VimeoChannelIE,
      VimeoUserIE,
 +    VimeoAlbumIE,
 +    VimeoGroupsIE,
  )
  from .vine import VineIE
  from .viki import VikiIE
@@@ -182,7 -177,6 +183,7 @@@ from .wat import WatI
  from .websurg import WeBSurgIE
  from .weibo import WeiboIE
  from .wimp import WimpIE
 +from .wistia import WistiaIE
  from .worldstarhiphop import WorldStarHipHopIE
  from .xhamster import XHamsterIE
  from .xnxx import XNXXIE
index 5a28bc82084228c42d0e9982ce82dfad68f6dec2,ff539ea0cbcb332c8a7e107174e7847abe60bca7..4ea89bf85e7c27cd159af8b6a927a92476b70b0d
@@@ -3,10 -3,13 +3,13 @@@
  import re
  import json
  import hashlib
+ import uuid
  
  from .common import InfoExtractor
  from ..utils import (
-     ExtractorError
+     compat_urllib_parse,
+     compat_urllib_request,
 -    ExtractorError
++    ExtractorError,
  )
  
  
@@@ -249,3 -252,105 +252,105 @@@ class SmotriUserIE(InfoExtractor)
              u'user nickname')
  
          return self.playlist_result(entries, user_id, user_nickname)
 -        }
+ class SmotriBroadcastIE(InfoExtractor):
+     IE_DESC = u'Smotri.com broadcasts'
+     IE_NAME = u'smotri:broadcast'
+     _VALID_URL = r'^https?://(?:www\.)?(?P<url>smotri\.com/live/(?P<broadcastid>[^/]+))/?.*'
+     def _real_extract(self, url):
+         mobj = re.match(self._VALID_URL, url)
+         broadcast_id = mobj.group('broadcastid')
+         broadcast_url = 'http://' + mobj.group('url')
+         broadcast_page = self._download_webpage(broadcast_url, broadcast_id, u'Downloading broadcast page')
+         if re.search(u'>Режиссер с логином <br/>"%s"<br/> <span>не существует<' % broadcast_id, broadcast_page) is not None:
+             raise ExtractorError(u'Broadcast %s does not exist' % broadcast_id, expected=True)
+         # Adult content
+         if re.search(u'EroConfirmText">', broadcast_page) is not None:
+             (username, password) = self._get_login_info()
+             if username is None:
+                 raise ExtractorError(u'Erotic broadcasts allowed only for registered users, '
+                     u'use --username and --password options to provide account credentials.', expected=True)
+             # Log in
+             login_form_strs = {
+                 u'login-hint53': '1',
+                 u'confirm_erotic': '1',
+                 u'login': username,
+                 u'password': password,
+             }
+             # Convert to UTF-8 *before* urlencode because Python 2.x's urlencode
+             # chokes on unicode
+             login_form = dict((k.encode('utf-8'), v.encode('utf-8')) for k,v in login_form_strs.items())
+             login_data = compat_urllib_parse.urlencode(login_form).encode('utf-8')
+             login_url = broadcast_url + '/?no_redirect=1'
+             request = compat_urllib_request.Request(login_url, login_data)
+             request.add_header('Content-Type', 'application/x-www-form-urlencoded')
+             broadcast_page = self._download_webpage(
+                 request, broadcast_id, note=u'Logging in and confirming age')
+             if re.search(u'>Неверный логин или пароль<', broadcast_page) is not None:
+                 raise ExtractorError(u'Unable to log in: bad username or password', expected=True)
+             adult_content = True
+         else:
+             adult_content = False
+         ticket = self._html_search_regex(
+             u'window\.broadcast_control\.addFlashVar\\(\'file\', \'([^\']+)\'\\);',
+             broadcast_page, u'broadcast ticket')
+         url = 'http://smotri.com/broadcast/view/url/?ticket=%s' % ticket
+         broadcast_password = self._downloader.params.get('videopassword', None)
+         if broadcast_password:
+             url += '&pass=%s' % hashlib.md5(broadcast_password.encode('utf-8')).hexdigest()
+         broadcast_json_page = self._download_webpage(url, broadcast_id, u'Downloading broadcast JSON')
+         try:
+             broadcast_json = json.loads(broadcast_json_page)
+             protected_broadcast = broadcast_json['_pass_protected'] == 1
+             if protected_broadcast and not broadcast_password:
+                 raise ExtractorError(u'This broadcast is protected by a password, use the --video-password option', expected=True)
+             broadcast_offline = broadcast_json['is_play'] == 0
+             if broadcast_offline:
+                 raise ExtractorError(u'Broadcast %s is offline' % broadcast_id, expected=True)
+             rtmp_url = broadcast_json['_server']
+             if not rtmp_url.startswith('rtmp://'):
+                 raise ExtractorError(u'Unexpected broadcast rtmp URL')
+             broadcast_playpath = broadcast_json['_streamName']
+             broadcast_thumbnail = broadcast_json['_imgURL']
+             broadcast_title = broadcast_json['title']
+             broadcast_description = broadcast_json['description']
+             broadcaster_nick = broadcast_json['nick']
+             broadcaster_login = broadcast_json['login']
+             rtmp_conn = 'S:%s' % uuid.uuid4().hex
+         except KeyError:
+             if protected_broadcast:
+                 raise ExtractorError(u'Bad broadcast password', expected=True)
+             raise ExtractorError(u'Unexpected broadcast JSON')
+         return {
+             'id': broadcast_id,
+             'url': rtmp_url,
+             'title': broadcast_title,
+             'thumbnail': broadcast_thumbnail,
+             'description': broadcast_description,
+             'uploader': broadcaster_nick,
+             'uploader_id': broadcaster_login,
+             'age_limit': 18 if adult_content else 0,
+             'ext': 'flv',
+             'play_path': broadcast_playpath,
+             'rtmp_live': True,
+             'rtmp_conn': rtmp_conn
++        }