[grooveshark] Fix extraction

[youtube-dl] / youtube_dl / utils.py
diff --git a/youtube_dl/utils.py b/youtube_dl/utils.py

index 0f49d602eab1296dced15449a949c26dc4408d66..472d4df41fda2cb1ffd0392cc4da0f4bdcc2a48a 100644 (file)
--- a/youtube_dl/utils.py
+++ b/youtube_dl/utils.py
@@ -252,15 +252,12 @@ def sanitize_open(filename, open_mode):
              raise
  
          # In case of error, try to remove win32 forbidden chars
-        alt_filename = os.path.join(
-            re.sub('[/<>:"\\|\\\\?\\*]', '#', path_part)
-            for path_part in os.path.split(filename)
-        )
+        alt_filename = sanitize_path(filename)
          if alt_filename == filename:
              raise
          else:
              # An exception here should be caught in the caller
-            stream = open(encodeFilename(filename), open_mode)
+            stream = open(encodeFilename(alt_filename), open_mode)
              return (stream, alt_filename)
  
  
@@ -322,13 +319,20 @@ def sanitize_path(s):
      if unc_or_drive:
          norm_path.pop(0)
      sanitized_path = [
-        re.sub('[/<>:"\\|\\\\?\\*]', '#', path_part)
+        path_part if path_part in ['.', '..'] else re.sub('(?:[/<>:"\\|\\\\?\\*]|\.$)', '#', path_part)
          for path_part in norm_path]
      if unc_or_drive:
          sanitized_path.insert(0, unc_or_drive + os.path.sep)
      return os.path.join(*sanitized_path)
  
  
+def sanitize_url_path_consecutive_slashes(url):
+    """Return url with each run of two or more slashes in its path collapsed to a single slash"""
+    parsed_url = list(compat_urlparse.urlparse(url))  # list, so the path item can be reassigned below
+    parsed_url[2] = re.sub(r'/{2,}', '/', parsed_url[2])  # only item 2 (the path) is rewritten
+    return compat_urlparse.urlunparse(parsed_url)
+
+
  def orderedSet(iterable):
      """ Remove all duplicates from the input iterable """
      res = []