[break] adapt to new paths
authorPhilipp Hagemeister <phihag@phihag.de>
Sun, 23 Jun 2013 20:59:51 +0000 (22:59 +0200)
committerPhilipp Hagemeister <phihag@phihag.de>
Sun, 23 Jun 2013 20:59:51 +0000 (22:59 +0200)
test/tests.json
youtube_dl/extractor/__init__.py
youtube_dl/extractor/breakcom.py [new file with mode: 0644]

index 86dc48570ae61ed01e753c287d01806ef4824ead..01367b0fb44c60917db9c50a4ab05a7ddb1a6cdd 100644 (file)
         "uploader_id": "videoseconds",
         "title": "Instagram photo by @videoseconds (Videos)"
     }
+  },
+  {
+    "name": "Break",
+    "url": "http://www.break.com/video/when-girls-act-like-guys-2468056",
+    "file": "2468056.mp4",
+    "md5": "a3513fb1547fba4fb6cfac1bffc6c46b",
+    "info_dict": {
+        "title": "When Girls Act Like D-Bags"
+    }
   }
 ]
index 4729512edde28f7caf180cc48975bed0cf23c899..b208f9002e9e9bb31771b12e6b96399859d1382f 100644 (file)
@@ -3,6 +3,7 @@ from .ard import ARDIE
 from .arte import ArteTvIE
 from .bandcamp import BandcampIE
 from .bliptv import BlipTVIE, BlipTVUserIE
+from .breakcom import BreakIE
 from .comedycentral import ComedyCentralIE
 from .collegehumor import CollegeHumorIE
 from .dailymotion import DailymotionIE
@@ -123,6 +124,7 @@ def gen_extractors():
         Vbox7IE(),
         GametrailersIE(),
         StatigramIE(),
+        BreakIE(),
         GenericIE()
     ]
 
diff --git a/youtube_dl/extractor/breakcom.py b/youtube_dl/extractor/breakcom.py
new file mode 100644 (file)
index 0000000..1f6620d
--- /dev/null
@@ -0,0 +1,47 @@
+import re
+
+from .common import InfoExtractor
+
+
+class BreakIE(InfoExtractor):
+    """Information extractor for break.com video pages.
+
+    The video id is the last '-'-separated component of the URL slug, e.g.
+    ``2468056`` for ``.../video/when-girls-act-like-guys-2468056``.
+    """
+
+    # Group 1 is the URL slug; it stops at '/', '?' or '#' so that a query
+    # string or fragment never ends up in the video id.
+    _VALID_URL = r'(?:https?://)?(?:www\.)?break\.com/video/([^/?#]+)'
+
+    def _real_extract(self, url):
+        """Scrape the media URL, title and thumbnail from a video page.
+
+        Returns a one-element list holding a dict with the keys ``id``,
+        ``url``, ``ext``, ``title`` and ``thumbnail``.
+
+        NOTE(review): each field is read with ``re.search(...).group(1)``, so
+        a page lacking one of the expected markers raises AttributeError.
+        """
+        mobj = re.match(self._VALID_URL, url)
+        video_id = mobj.group(1).split('-')[-1]
+        webpage = self._download_webpage(url, video_id)
+        video_url = re.search(r"videoPath: '(.+?)',", webpage).group(1)
+        # The "icon" value is appended to the media URL as its query string.
+        key = re.search(r"icon: '(.+?)',", webpage).group(1)
+        # Concatenate directly instead of via str(): the regex groups are
+        # already text, and on Python 2 str() raises UnicodeEncodeError for
+        # non-ASCII unicode input (assumes the page is decoded text -- TODO
+        # confirm against _download_webpage).
+        final_url = video_url + '?' + key
+        thumbnail_url = re.search(r"thumbnailURL: '(.+?)'", webpage).group(1)
+        title = re.search(r"sVidTitle: '(.+)',", webpage).group(1)
+        # The extension is whatever follows the last '.' of the media path.
+        ext = video_url.split('.')[-1]
+        return [{
+            'id':        video_id,
+            'url':       final_url,
+            'ext':       ext,
+            'title':     title,
+            'thumbnail': thumbnail_url,
+        }]