X-Git-Url: http://git.bitcoin.ninja/index.cgi?a=blobdiff_plain;f=youtube_dl%2Futils.py;h=658fd2686b8534e834c34872883fd26d3d820cde;hb=92b91c18780938283c505f5662c458e049bf3567;hp=922e17eccfac611a1d90bf83e913383c9afce30d;hpb=b0d4f9589973396eea1731e4a5ed3d8015365018;p=youtube-dl diff --git a/youtube_dl/utils.py b/youtube_dl/utils.py index 922e17ecc..658fd2686 100644 --- a/youtube_dl/utils.py +++ b/youtube_dl/utils.py @@ -19,13 +19,18 @@ except ImportError: import StringIO std_headers = { - 'User-Agent': 'Mozilla/5.0 (X11; Linux x86_64; rv:5.0.1) Gecko/20100101 Firefox/5.0.1', + 'User-Agent': 'Mozilla/5.0 (X11; Linux x86_64; rv:10.0) Gecko/20100101 Firefox/10.0', 'Accept-Charset': 'ISO-8859-1,utf-8;q=0.7,*;q=0.7', 'Accept': 'text/html,application/xhtml+xml,application/xml;q=0.9,*/*;q=0.8', 'Accept-Encoding': 'gzip, deflate', 'Accept-Language': 'en-us,en;q=0.5', } +try: + compat_str = unicode # Python 2 +except NameError: + compat_str = str + def preferredencoding(): """Get preferred encoding. @@ -83,7 +88,6 @@ class IDParser(HTMLParser.HTMLParser): HTMLParser.HTMLParser.__init__(self) def error(self, message): - print >> sys.stderr, self.getpos() if self.error_count > 10 or self.started: raise HTMLParser.HTMLParseError(message, self.getpos()) self.rawdata = '\n'.join(self.html.split('\n')[self.getpos()[0]:]) # skip one line @@ -194,10 +198,20 @@ def timeconvert(timestr): def sanitize_filename(s): """Sanitizes a string so it could be used as part of a filename.""" def replace_insane(char): - if char in u' .\\/|?*<>:"' or ord(char) < 32: - return '_' + if char == '?' or ord(char) < 32 or ord(char) == 127: + return '' + elif char == '"': + return '\'' + elif char == ':': + return ' -' + elif char in '\\/|*<>': + return '-' return char - return u''.join(map(replace_insane, s)).strip('_') + + result = u''.join(map(replace_insane, s)) + while '--' in result: + result = result.replace('--', '-') + return result.strip('-') def orderedSet(iterable): """ Remove all duplicates from the input iterable """