Add support for beeg.com

author peugeot <peugeot@psa.fr>
Sun, 31 Aug 2014 09:57:10 +0000 (11:57 +0200)
committer peugeot <peugeot@psa.fr>
Sun, 31 Aug 2014 09:57:10 +0000 (11:57 +0200)
diff --git a/youtube_dl/extractor/__init__.py b/youtube_dl/extractor/__init__.py

index 1479d998a264b5ec7206d15f7acc5465dd309b6a..01b5f19ddc5f7d940cc28ad61e2796cbdaa0c51b 100644 (file)
--- a/youtube_dl/extractor/__init__.py
+++ b/youtube_dl/extractor/__init__.py
@@ -23,6 +23,7 @@ from .auengine import AUEngineIE
 from .bambuser import BambuserIE, BambuserChannelIE
 from .bandcamp import BandcampIE, BandcampAlbumIE
 from .bbccouk import BBCCoUkIE
+from .beeg import BeegIE
 from .bilibili import BiliBiliIE
 from .blinkx import BlinkxIE
 from .bliptv import BlipTVIE, BlipTVUserIE
diff --git a/youtube_dl/extractor/beeg.py b/youtube_dl/extractor/beeg.py

new file mode 100644 (file)

index 0000000..775f6be
--- /dev/null
+++ b/youtube_dl/extractor/beeg.py
@@ -0,0 +1,68 @@
+from __future__ import unicode_literals
+
+import re
+
+from .common import InfoExtractor
+
+
+class BeegIE(InfoExtractor):
+    """Information extractor for single video pages on beeg.com."""
+
+    _VALID_URL = r'https?://(?:www\.)?beeg\.com/(?P<id>\d+)'
+    _TEST = {
+        'url': 'http://beeg.com/5416503',
+        'md5': '634526ae978711f6b748fe0dd6c11f57',
+        'info_dict': {
+            'id': '5416503',
+            'ext': 'mp4',
+            'title': 'Sultry Striptease',
+            'description': 'md5:6db3c6177972822aaba18652ff59c773',
+        }
+    }
+
+    def _real_extract(self, url):
+        """Scrape the beeg.com page at *url* and return its info dict.
+
+        The video id comes from the URL. The stream URL and title are
+        looked up with the default (fatal) setting; description,
+        thumbnail and categories are looked up with fatal=False and are
+        passed through as None when the helper returns None.
+        """
+        mobj = re.match(self._VALID_URL, url)
+        video_id = mobj.group('id')
+
+        webpage = self._download_webpage(url, video_id)
+
+        # Only the value keyed '480p' in the page source is used as the URL.
+        video_url = self._html_search_regex(
+            r"'480p'\s*:\s*'([^']+)'", webpage, 'video URL')
+
+        title = self._html_search_regex(
+            r'<title>([^<]+)\s*-\s*beeg\.?</title>', webpage, 'title')
+
+        description = self._html_search_regex(
+            r'<meta name="description" content="([^"]*)"',
+            webpage, 'description', fatal=False)
+
+        thumbnail = self._html_search_regex(
+            r'\'previewer\.url\'\s*:\s*"([^"]*)"',
+            webpage, 'thumbnail', fatal=False)
+
+        categories_str = self._html_search_regex(
+            r'<meta name="keywords" content="([^"]+)"',
+            webpage, 'categories', fatal=False)
+        # With fatal=False the lookup can come back as None (no keywords
+        # tag); calling .split() on None would raise AttributeError and
+        # abort an otherwise successful extraction.
+        categories = (
+            None if categories_str is None
+            else categories_str.split(','))
+
+        return {
+            'id': video_id,
+            'url': video_url,
+            'title': title,
+            'description': description,
+            'thumbnail': thumbnail,
+            'categories': categories,
+        }
author	peugeot <peugeot@psa.fr>
	Sun, 31 Aug 2014 09:57:10 +0000 (11:57 +0200)
committer	peugeot <peugeot@psa.fr>
	Sun, 31 Aug 2014 09:57:10 +0000 (11:57 +0200)
youtube_dl/extractor/__init__.py		patch | blob | history
youtube_dl/extractor/beeg.py	[new file with mode: 0644]	patch | blob