projects
/
youtube-dl
/ blobdiff
commit
grep
author
committer
pickaxe
?
search:
re
summary
|
shortlog
|
log
|
commit
|
commitdiff
|
tree
raw
|
inline
| side by side
[utils] Strict HTTP responses (Closes #6727)
[youtube-dl]
/
youtube_dl
/
extractor
/
dumpert.py
diff --git
a/youtube_dl/extractor/dumpert.py
b/youtube_dl/extractor/dumpert.py
index e43bc81b22c08bccb4ad87204353781c07dbf8a5..1f00386feae15d00a4421b3166335c15f3b01aa9 100644
(file)
--- a/youtube_dl/extractor/dumpert.py
+++ b/youtube_dl/extractor/dumpert.py
@@ -4,12 +4,13 @@ from __future__ import unicode_literals
import base64
from .common import InfoExtractor
import base64
from .common import InfoExtractor
+from ..compat import compat_urllib_request
from ..utils import qualities
class DumpertIE(InfoExtractor):
from ..utils import qualities
class DumpertIE(InfoExtractor):
- _VALID_URL = r'https?://(?:www\.)?dumpert\.nl/mediabase/(?P<id>[0-9]+/[0-9a-zA-Z]+)'
- _TEST = {
+ _VALID_URL = r'https?://(?:www\.)?dumpert\.nl/(?:mediabase|embed)/(?P<id>[0-9]+/[0-9a-zA-Z]+)'
+ _TESTS = [{
'url': 'http://www.dumpert.nl/mediabase/6646981/951bc60f/',
'md5': '1b9318d7d5054e7dcb9dc7654f21d643',
'info_dict': {
'url': 'http://www.dumpert.nl/mediabase/6646981/951bc60f/',
'md5': '1b9318d7d5054e7dcb9dc7654f21d643',
'info_dict': {
@@ -19,11 +20,18 @@ class DumpertIE(InfoExtractor):
'description': 'Niet schrikken hoor',
'thumbnail': 're:^https?://.*\.jpg$',
}
'description': 'Niet schrikken hoor',
'thumbnail': 're:^https?://.*\.jpg$',
}
- }
+ }, {
+ 'url': 'http://www.dumpert.nl/embed/6675421/dc440fe7/',
+ 'only_matching': True,
+ }]
def _real_extract(self, url):
video_id = self._match_id(url)
def _real_extract(self, url):
video_id = self._match_id(url)
- webpage = self._download_webpage(url, video_id)
+
+ url = 'https://www.dumpert.nl/mediabase/' + video_id
+ req = compat_urllib_request.Request(url)
+ req.add_header('Cookie', 'nsfw=1; cpc=10')
+ webpage = self._download_webpage(req, video_id)
files_base64 = self._search_regex(
r'data-files="([^"]+)"', webpage, 'data files')
files_base64 = self._search_regex(
r'data-files="([^"]+)"', webpage, 'data files')