Fix some regexes

author Sergey M․ <dstftw@gmail.com>

Mon, 9 Oct 2017 16:50:53 +0000 (23:50 +0700)

committer Sergey M․ <dstftw@gmail.com>

Mon, 9 Oct 2017 16:50:53 +0000 (23:50 +0700)
author Sergey M․ <dstftw@gmail.com>
Mon, 9 Oct 2017 16:50:53 +0000 (23:50 +0700)
committer Sergey M․ <dstftw@gmail.com>
Mon, 9 Oct 2017 16:50:53 +0000 (23:50 +0700)
diff --git a/youtube_dl/extractor/aenetworks.py b/youtube_dl/extractor/aenetworks.py

index 2dcdba9d22c54e57811a85cd2bceb81bf11bbdce..da1b566c20eb6c4477e86f26dfec21b281a5f07c 100644 (file)
--- a/youtube_dl/extractor/aenetworks.py
+++ b/youtube_dl/extractor/aenetworks.py
@@ -131,7 +131,7 @@ class AENetworksIE(AENetworksBaseIE):
               r'data-media-url=(["\'])(?P<url>(?:(?!\1).)+?)\1'],
              webpage, 'video url', group='url')
          theplatform_metadata = self._download_theplatform_metadata(self._search_regex(
-            r'https?://link.theplatform.com/s/([^?]+)', media_url, 'theplatform_path'), video_id)
+            r'https?://link\.theplatform\.com/s/([^?]+)', media_url, 'theplatform_path'), video_id)
          info = self._parse_theplatform_metadata(theplatform_metadata)
          if theplatform_metadata.get('AETN$isBehindWall'):
              requestor_id = self._DOMAIN_TO_REQUESTOR_ID[domain]
diff --git a/youtube_dl/extractor/appletrailers.py b/youtube_dl/extractor/appletrailers.py

index b45b431e19c1526eb9578e9cbf6a13a97939b2a8..a9ef733e011237338d904f956c4324cc6dd7a72b 100644 (file)
--- a/youtube_dl/extractor/appletrailers.py
+++ b/youtube_dl/extractor/appletrailers.py
@@ -117,7 +117,7 @@ class AppleTrailersIE(InfoExtractor):
                              continue
                          formats.append({
                              'format_id': '%s-%s' % (version, size),
-                            'url': re.sub(r'_(\d+p.mov)', r'_h\1', src),
+                            'url': re.sub(r'_(\d+p\.mov)', r'_h\1', src),
                              'width': int_or_none(size_data.get('width')),
                              'height': int_or_none(size_data.get('height')),
                              'language': version[:2],
@@ -179,7 +179,7 @@ class AppleTrailersIE(InfoExtractor):
              formats = []
              for format in settings['metadata']['sizes']:
                  # The src is a file pointing to the real video file
-                format_url = re.sub(r'_(\d*p.mov)', r'_h\1', format['src'])
+                format_url = re.sub(r'_(\d*p\.mov)', r'_h\1', format['src'])
                  formats.append({
                      'url': format_url,
                      'format': format['type'],
diff --git a/youtube_dl/extractor/ard.py b/youtube_dl/extractor/ard.py

index 3f248b14728ab3655a2e17f7b38a95184042d770..915f8862e3769c3f186209435dcc34029dead932 100644 (file)
--- a/youtube_dl/extractor/ard.py
+++ b/youtube_dl/extractor/ard.py
@@ -195,7 +195,7 @@ class ARDMediathekIE(InfoExtractor):
  
          title = self._html_search_regex(
              [r'<h1(?:\s+class="boxTopHeadline")?>(.*?)</h1>',
-             r'<meta name="dcterms.title" content="(.*?)"/>',
+             r'<meta name="dcterms\.title" content="(.*?)"/>',
               r'<h4 class="headline">(.*?)</h4>'],
              webpage, 'title')
          description = self._html_search_meta(
diff --git a/youtube_dl/extractor/bbc.py b/youtube_dl/extractor/bbc.py

index 8b20c03d6e424b95e42b1bea1ac3fb91e24bea11..5525f7c9b998c57271aba072bb698f6c03b36777 100644 (file)
--- a/youtube_dl/extractor/bbc.py
+++ b/youtube_dl/extractor/bbc.py
@@ -386,7 +386,7 @@ class BBCCoUkIE(InfoExtractor):
                              m3u8_id=format_id, fatal=False))
                          if re.search(self._USP_RE, href):
                              usp_formats = self._extract_m3u8_formats(
-                                re.sub(self._USP_RE, r'/\1.ism/\1.m3u8', href),
+                                re.sub(self._USP_RE, r'/\1\.ism/\1\.m3u8', href),
                                  programme_id, ext='mp4', entry_protocol='m3u8_native',
                                  m3u8_id=format_id, fatal=False)
                              for f in usp_formats:
diff --git a/youtube_dl/extractor/dailymotion.py b/youtube_dl/extractor/dailymotion.py

index e9d0dd19cf157d3e707da8e18638d83749b7fdc5..21a2d02392a7ad0393b7db499eb1b4a0ee054547 100644 (file)
--- a/youtube_dl/extractor/dailymotion.py
+++ b/youtube_dl/extractor/dailymotion.py
@@ -235,7 +235,7 @@ class DailymotionIE(DailymotionBaseInfoExtractor):
  
          # vevo embed
          vevo_id = self._search_regex(
-            r'<link rel="video_src" href="[^"]*?vevo.com[^"]*?video=(?P<id>[\w]*)',
+            r'<link rel="video_src" href="[^"]*?vevo\.com[^"]*?video=(?P<id>[\w]*)',
              webpage, 'vevo embed', default=None)
          if vevo_id:
              return self.url_result('vevo:%s' % vevo_id, 'Vevo')
diff --git a/youtube_dl/extractor/deezer.py b/youtube_dl/extractor/deezer.py

index ec87b94dbcc74ae60e05d1c6f43a6e4429cbb721..a38b2683d5932fa55089bc6bc610d1795c5bc07d 100644 (file)
--- a/youtube_dl/extractor/deezer.py
+++ b/youtube_dl/extractor/deezer.py
@@ -19,7 +19,7 @@ class DeezerPlaylistIE(InfoExtractor):
              'id': '176747451',
              'title': 'Best!',
              'uploader': 'Anonymous',
-            'thumbnail': r're:^https?://cdn-images.deezer.com/images/cover/.*\.jpg$',
+            'thumbnail': r're:^https?://cdn-images\.deezer\.com/images/cover/.*\.jpg$',
          },
          'playlist_count': 30,
          'skip': 'Only available in .de',
diff --git a/youtube_dl/extractor/freespeech.py b/youtube_dl/extractor/freespeech.py

index 0a70ca76351ab310ba394959b717973ec772f52d..7fa271b51fa59e14342d0de21cd50be719f3467d 100644 (file)
--- a/youtube_dl/extractor/freespeech.py
+++ b/youtube_dl/extractor/freespeech.py
@@ -27,7 +27,7 @@ class FreespeechIE(InfoExtractor):
          mobj = re.match(self._VALID_URL, url)
          title = mobj.group('title')
          webpage = self._download_webpage(url, title)
-        info_json = self._search_regex(r'jQuery.extend\(Drupal.settings, ({.*?})\);', webpage, 'info')
+        info_json = self._search_regex(r'jQuery\.extend\(Drupal\.settings, ({.*?})\);', webpage, 'info')
          info = json.loads(info_json)
  
          return {
diff --git a/youtube_dl/extractor/generic.py b/youtube_dl/extractor/generic.py

index 1721a3dbd02a73e5afb685ead0f0a6bdd87a5dd4..68b6338396dc84277792273db277154fe3cc4995 100644 (file)
--- a/youtube_dl/extractor/generic.py
+++ b/youtube_dl/extractor/generic.py
@@ -2206,7 +2206,7 @@ class GenericIE(InfoExtractor):
          # And then there are the jokers who advertise that they use RTA,
          # but actually don't.
          AGE_LIMIT_MARKERS = [
-            r'Proudly Labeled <a href="http://www.rtalabel.org/" title="Restricted to Adults">RTA</a>',
+            r'Proudly Labeled <a href="http://www\.rtalabel\.org/" title="Restricted to Adults">RTA</a>',
          ]
          if any(re.search(marker, webpage) for marker in AGE_LIMIT_MARKERS):
              age_limit = 18
diff --git a/youtube_dl/extractor/googleplus.py b/youtube_dl/extractor/googleplus.py

index 427499b11286f00a8e10e09a8de1d9f84611b5c9..6b927bb4477da8ff3f1f5635a6bf5d3a5a590984 100644 (file)
--- a/youtube_dl/extractor/googleplus.py
+++ b/youtube_dl/extractor/googleplus.py
@@ -61,7 +61,7 @@ class GooglePlusIE(InfoExtractor):
              'width': int(width),
              'height': int(height),
          } for width, height, video_url in re.findall(
-            r'\d+,(\d+),(\d+),"(https?://[^.]+\.googleusercontent.com.*?)"', webpage)]
+            r'\d+,(\d+),(\d+),"(https?://[^.]+\.googleusercontent\.com.*?)"', webpage)]
          self._sort_formats(formats)
  
          return {
diff --git a/youtube_dl/extractor/hrti.py b/youtube_dl/extractor/hrti.py

index 4f036943376e2f751fa2219101c3d7614540923d..7cef5f6ce0da52fab3e3638d81eed41788e24c20 100644 (file)
--- a/youtube_dl/extractor/hrti.py
+++ b/youtube_dl/extractor/hrti.py
@@ -173,7 +173,7 @@ class HRTiIE(HRTiBaseIE):
  
  
  class HRTiPlaylistIE(HRTiBaseIE):
-    _VALID_URL = r'https?://hrti.hrt.hr/#/video/list/category/(?P<id>[0-9]+)/(?P<display_id>[^/]+)?'
+    _VALID_URL = r'https?://hrti\.hrt\.hr/#/video/list/category/(?P<id>[0-9]+)/(?P<display_id>[^/]+)?'
      _TESTS = [{
          'url': 'https://hrti.hrt.hr/#/video/list/category/212/ekumena',
          'info_dict': {
diff --git a/youtube_dl/extractor/ign.py b/youtube_dl/extractor/ign.py

index c1367cf517ce9b39960a13705b4475bf4f3cf8d1..a96ea801019c808e6a8fe1f8f6590b0e018feeef 100644 (file)
--- a/youtube_dl/extractor/ign.py
+++ b/youtube_dl/extractor/ign.py
@@ -203,7 +203,7 @@ class PCMagIE(IGNIE):
      _VALID_URL = r'https?://(?:www\.)?pcmag\.com/(?P<type>videos|article2)(/.+)?/(?P<name_or_id>.+)'
      IE_NAME = 'pcmag'
  
-    _EMBED_RE = r'iframe.setAttribute\("src",\s*__util.objToUrlString\("http://widgets\.ign\.com/video/embed/content.html?[^"]*url=([^"]+)["&]'
+    _EMBED_RE = r'iframe\.setAttribute\("src",\s*__util.objToUrlString\("http://widgets\.ign\.com/video/embed/content\.html?[^"]*url=([^"]+)["&]'
  
      _TESTS = [{
          'url': 'http://www.pcmag.com/videos/2015/01/06/010615-whats-new-now-is-gogo-snooping-on-your-data',
diff --git a/youtube_dl/extractor/infoq.py b/youtube_dl/extractor/infoq.py

index fe425e786479e505aad8082745d43040d38ba881..57c9b0cc43fed492a4871bd5b03d442e19ba3535 100644 (file)
--- a/youtube_dl/extractor/infoq.py
+++ b/youtube_dl/extractor/infoq.py
@@ -69,9 +69,9 @@ class InfoQIE(BokeCCBaseIE):
          }]
  
      def _extract_cookies(self, webpage):
-        policy = self._search_regex(r'InfoQConstants.scp\s*=\s*\'([^\']+)\'', webpage, 'policy')
-        signature = self._search_regex(r'InfoQConstants.scs\s*=\s*\'([^\']+)\'', webpage, 'signature')
-        key_pair_id = self._search_regex(r'InfoQConstants.sck\s*=\s*\'([^\']+)\'', webpage, 'key-pair-id')
+        policy = self._search_regex(r'InfoQConstants\.scp\s*=\s*\'([^\']+)\'', webpage, 'policy')
+        signature = self._search_regex(r'InfoQConstants\.scs\s*=\s*\'([^\']+)\'', webpage, 'signature')
+        key_pair_id = self._search_regex(r'InfoQConstants\.sck\s*=\s*\'([^\']+)\'', webpage, 'key-pair-id')
          return 'CloudFront-Policy=%s; CloudFront-Signature=%s; CloudFront-Key-Pair-Id=%s' % (
              policy, signature, key_pair_id)
  
diff --git a/youtube_dl/extractor/jeuxvideo.py b/youtube_dl/extractor/jeuxvideo.py

index 1a4227f6b4b0ef7370b0f09613ef9d4b8916b435..e9f4ed7384225456edf87baf0c24ce5c6ecc4b20 100644 (file)
--- a/youtube_dl/extractor/jeuxvideo.py
+++ b/youtube_dl/extractor/jeuxvideo.py
@@ -30,7 +30,7 @@ class JeuxVideoIE(InfoExtractor):
          webpage = self._download_webpage(url, title)
          title = self._html_search_meta('name', webpage) or self._og_search_title(webpage)
          config_url = self._html_search_regex(
-            r'data-src(?:set-video)?="(/contenu/medias/video.php.*?)"',
+            r'data-src(?:set-video)?="(/contenu/medias/video\.php.*?)"',
              webpage, 'config URL')
          config_url = 'http://www.jeuxvideo.com' + config_url
  
diff --git a/youtube_dl/extractor/livestream.py b/youtube_dl/extractor/livestream.py

index 7f946c6ed9d64c54670d7fba68058144bcab494b..317ebbc4ee60d17051574ae05b8575526216de05 100644 (file)
--- a/youtube_dl/extractor/livestream.py
+++ b/youtube_dl/extractor/livestream.py
@@ -338,7 +338,7 @@ class LivestreamOriginalIE(InfoExtractor):
                  info = {
                      'title': self._og_search_title(webpage),
                      'description': self._og_search_description(webpage),
-                    'thumbnail': self._search_regex(r'channelLogo.src\s*=\s*"([^"]+)"', webpage, 'thumbnail', None),
+                    'thumbnail': self._search_regex(r'channelLogo\.src\s*=\s*"([^"]+)"', webpage, 'thumbnail', None),
                  }
              video_data = self._download_json(stream_url, content_id)
              is_live = video_data.get('isLive')
diff --git a/youtube_dl/extractor/makertv.py b/youtube_dl/extractor/makertv.py

index 3c34d4604f20699d99937b29a11aad7f8f4116a4..8eda69cfc4aded62c192d1cef00c27bee57ab296 100644 (file)
--- a/youtube_dl/extractor/makertv.py
+++ b/youtube_dl/extractor/makertv.py
@@ -5,7 +5,7 @@ from .common import InfoExtractor
  
  
  class MakerTVIE(InfoExtractor):
-    _VALID_URL = r'https?://(?:(?:www\.)?maker\.tv/(?:[^/]+/)*video|makerplayer.com/embed/maker)/(?P<id>[a-zA-Z0-9]{12})'
+    _VALID_URL = r'https?://(?:(?:www\.)?maker\.tv/(?:[^/]+/)*video|makerplayer\.com/embed/maker)/(?P<id>[a-zA-Z0-9]{12})'
      _TEST = {
          'url': 'http://www.maker.tv/video/Fh3QgymL9gsc',
          'md5': 'ca237a53a8eb20b6dc5bd60564d4ab3e',
diff --git a/youtube_dl/extractor/mangomolo.py b/youtube_dl/extractor/mangomolo.py

index 1885ac7df59684767022f95c5c35ffeb65cd33d5..dbd761a67864036cd84be24fa9ef432433c08202 100644 (file)
--- a/youtube_dl/extractor/mangomolo.py
+++ b/youtube_dl/extractor/mangomolo.py
@@ -22,7 +22,7 @@ class MangomoloBaseIE(InfoExtractor):
  
          format_url = self._html_search_regex(
              [
-                r'file\s*:\s*"(https?://[^"]+?/playlist.m3u8)',
+                r'file\s*:\s*"(https?://[^"]+?/playlist\.m3u8)',
                  r'<a[^>]+href="(rtsp://[^"]+)"'
              ], webpage, 'format url')
          formats = self._extract_wowza_formats(
diff --git a/youtube_dl/extractor/meipai.py b/youtube_dl/extractor/meipai.py

index c8eacb4f4d63ca789659ed9a3deeba7f8fe76f86..2445b8b3985fac92ad451d312f4bb105890db0f5 100644 (file)
--- a/youtube_dl/extractor/meipai.py
+++ b/youtube_dl/extractor/meipai.py
@@ -11,7 +11,7 @@ from ..utils import (
  
  class MeipaiIE(InfoExtractor):
      IE_DESC = '美拍'
-    _VALID_URL = r'https?://(?:www\.)?meipai.com/media/(?P<id>[0-9]+)'
+    _VALID_URL = r'https?://(?:www\.)?meipai\.com/media/(?P<id>[0-9]+)'
      _TESTS = [{
          # regular uploaded video
          'url': 'http://www.meipai.com/media/531697625',
diff --git a/youtube_dl/extractor/mtv.py b/youtube_dl/extractor/mtv.py

index 25af5ddfda4765132fec413caca9a09fc2ba2bb9..1154a35365ca9b388ebfdbe2a5790f67a25ee750 100644 (file)
--- a/youtube_dl/extractor/mtv.py
+++ b/youtube_dl/extractor/mtv.py
@@ -258,7 +258,7 @@ class MTVServicesInfoExtractor(InfoExtractor):
  
          if mgid is None or ':' not in mgid:
              mgid = self._search_regex(
-                [r'data-mgid="(.*?)"', r'swfobject.embedSWF\(".*?(mgid:.*?)"'],
+                [r'data-mgid="(.*?)"', r'swfobject\.embedSWF\(".*?(mgid:.*?)"'],
                  webpage, 'mgid', default=None)
  
          if not mgid:
diff --git a/youtube_dl/extractor/myvideo.py b/youtube_dl/extractor/myvideo.py

index 6bb64eb63c52018c34650a6361e7d70cad2459e0..367e811db5a1c0705626ae766483fb02a4c6162a 100644 (file)
--- a/youtube_dl/extractor/myvideo.py
+++ b/youtube_dl/extractor/myvideo.py
@@ -160,7 +160,7 @@ class MyVideoIE(InfoExtractor):
          else:
              video_playpath = ''
  
-        video_swfobj = self._search_regex(r'swfobject.embedSWF\(\'(.+?)\'', webpage, 'swfobj')
+        video_swfobj = self._search_regex(r'swfobject\.embedSWF\(\'(.+?)\'', webpage, 'swfobj')
          video_swfobj = compat_urllib_parse_unquote(video_swfobj)
  
          video_title = self._html_search_regex("<h1(?: class='globalHd')?>(.*?)</h1>",
diff --git a/youtube_dl/extractor/nationalgeographic.py b/youtube_dl/extractor/nationalgeographic.py

index b91d865286e47affdc66c138dde9507963d62733..9e8d28f4848165ccdfda771800031e6c68359684 100644 (file)
--- a/youtube_dl/extractor/nationalgeographic.py
+++ b/youtube_dl/extractor/nationalgeographic.py
@@ -111,7 +111,7 @@ class NationalGeographicIE(ThePlatformIE, AdobePassIE):
          release_url = self._search_regex(
              r'video_auth_playlist_url\s*=\s*"([^"]+)"',
              webpage, 'release url')
-        theplatform_path = self._search_regex(r'https?://link.theplatform.com/s/([^?]+)', release_url, 'theplatform path')
+        theplatform_path = self._search_regex(r'https?://link\.theplatform\.com/s/([^?]+)', release_url, 'theplatform path')
          video_id = theplatform_path.split('/')[-1]
          query = {
              'mbr': 'true',
diff --git a/youtube_dl/extractor/naver.py b/youtube_dl/extractor/naver.py

index e8131333f8458505b7a323f378c5fee848414934..2047d440266907ea6cd16631cbf235d751c83d9a 100644 (file)
--- a/youtube_dl/extractor/naver.py
+++ b/youtube_dl/extractor/naver.py
@@ -43,7 +43,7 @@ class NaverIE(InfoExtractor):
          video_id = self._match_id(url)
          webpage = self._download_webpage(url, video_id)
  
-        m_id = re.search(r'var rmcPlayer = new nhn.rmcnmv.RMCVideoPlayer\("(.+?)", "(.+?)"',
+        m_id = re.search(r'var rmcPlayer = new nhn\.rmcnmv\.RMCVideoPlayer\("(.+?)", "(.+?)"',
                           webpage)
          if m_id is None:
              error = self._html_search_regex(
diff --git a/youtube_dl/extractor/npo.py b/youtube_dl/extractor/npo.py

index fa4ef20c52959240af41a0c8a7b08c02fd3eb54c..b8fe244071d05e1daac7514b932be148802c21a7 100644 (file)
--- a/youtube_dl/extractor/npo.py
+++ b/youtube_dl/extractor/npo.py
@@ -469,7 +469,7 @@ class SchoolTVIE(NPODataMidEmbedIE):
  
  class HetKlokhuisIE(NPODataMidEmbedIE):
      IE_NAME = 'hetklokhuis'
-    _VALID_URL = r'https?://(?:www\.)?hetklokhuis.nl/[^/]+/\d+/(?P<id>[^/?#&]+)'
+    _VALID_URL = r'https?://(?:www\.)?hetklokhuis\.nl/[^/]+/\d+/(?P<id>[^/?#&]+)'
  
      _TEST = {
          'url': 'http://hetklokhuis.nl/tv-uitzending/3471/Zwaartekrachtsgolven',
diff --git a/youtube_dl/extractor/ruhd.py b/youtube_dl/extractor/ruhd.py

index 2b830cf477eef731caef1f2a6cddf10ef3efa14c..3c8053a2617669cc22549f62e386ac988b33d3c6 100644 (file)
--- a/youtube_dl/extractor/ruhd.py
+++ b/youtube_dl/extractor/ruhd.py
@@ -25,7 +25,7 @@ class RUHDIE(InfoExtractor):
          video_url = self._html_search_regex(
              r'<param name="src" value="([^"]+)"', webpage, 'video url')
          title = self._html_search_regex(
-            r'<title>([^<]+)&nbsp;&nbsp; RUHD.ru - Видео Высокого качества №1 в России!</title>',
+            r'<title>([^<]+)&nbsp;&nbsp; RUHD\.ru - Видео Высокого качества №1 в России!</title>',
              webpage, 'title')
          description = self._html_search_regex(
              r'(?s)<div id="longdesc">(.+?)<span id="showlink">',
diff --git a/youtube_dl/extractor/stanfordoc.py b/youtube_dl/extractor/stanfordoc.py

index cce65fb1014d3595670707d8009832ea37f448dc..ae3dd13807d0f9f46939f6dfab066a75eddd1ed1 100644 (file)
--- a/youtube_dl/extractor/stanfordoc.py
+++ b/youtube_dl/extractor/stanfordoc.py
@@ -66,7 +66,7 @@ class StanfordOpenClassroomIE(InfoExtractor):
                  r'(?s)<description>([^<]+)</description>',
                  coursepage, 'description', fatal=False)
  
-            links = orderedSet(re.findall(r'<a href="(VideoPage.php\?[^"]+)">', coursepage))
+            links = orderedSet(re.findall(r'<a href="(VideoPage\.php\?[^"]+)">', coursepage))
              info['entries'] = [self.url_result(
                  'http://openclassroom.stanford.edu/MainFolder/%s' % unescapeHTML(l)
              ) for l in links]
@@ -84,7 +84,7 @@ class StanfordOpenClassroomIE(InfoExtractor):
              rootpage = self._download_webpage(rootURL, info['id'],
                                                errnote='Unable to download course info page')
  
-            links = orderedSet(re.findall(r'<a href="(CoursePage.php\?[^"]+)">', rootpage))
+            links = orderedSet(re.findall(r'<a href="(CoursePage\.php\?[^"]+)">', rootpage))
              info['entries'] = [self.url_result(
                  'http://openclassroom.stanford.edu/MainFolder/%s' % unescapeHTML(l)
              ) for l in links]
diff --git a/youtube_dl/extractor/theplatform.py b/youtube_dl/extractor/theplatform.py

index de236bbba899837f87a748cb7aab6cb8182b77c4..b1a985ff6c12368347d98d95beed6a042e70093c 100644 (file)
--- a/youtube_dl/extractor/theplatform.py
+++ b/youtube_dl/extractor/theplatform.py
@@ -216,7 +216,7 @@ class ThePlatformIE(ThePlatformBaseIE, AdobePassIE):
          def hex_to_bytes(hex):
              return binascii.a2b_hex(hex.encode('ascii'))
  
-        relative_path = re.match(r'https?://link.theplatform.com/s/([^?]+)', url).group(1)
+        relative_path = re.match(r'https?://link\.theplatform\.com/s/([^?]+)', url).group(1)
          clear_text = hex_to_bytes(flags + expiration_date + str_to_hex(relative_path))
          checksum = hmac.new(sig_key.encode('ascii'), clear_text, hashlib.sha1).hexdigest()
          sig = flags + expiration_date + checksum + str_to_hex(sig_secret)
diff --git a/youtube_dl/extractor/thisav.py b/youtube_dl/extractor/thisav.py

index 33683b139dee3cbf2513a30efb979701c5f93ee9..dc3dd03c823d7ec7878943b5f99bc14d266a6257 100644 (file)
--- a/youtube_dl/extractor/thisav.py
+++ b/youtube_dl/extractor/thisav.py
@@ -57,10 +57,10 @@ class ThisAVIE(InfoExtractor):
                  info_dict = self._extract_jwplayer_data(
                      webpage, video_id, require_title=False)
          uploader = self._html_search_regex(
-            r': <a href="http://www.thisav.com/user/[0-9]+/(?:[^"]+)">([^<]+)</a>',
+            r': <a href="http://www\.thisav\.com/user/[0-9]+/(?:[^"]+)">([^<]+)</a>',
              webpage, 'uploader name', fatal=False)
          uploader_id = self._html_search_regex(
-            r': <a href="http://www.thisav.com/user/[0-9]+/([^"]+)">(?:[^<]+)</a>',
+            r': <a href="http://www\.thisav\.com/user/[0-9]+/([^"]+)">(?:[^<]+)</a>',
              webpage, 'uploader id', fatal=False)
  
          info_dict.update({
diff --git a/youtube_dl/extractor/twitter.py b/youtube_dl/extractor/twitter.py

index 0df3ad7c7c0f61b6529f0e5d09fd1694e9c84f04..1b0b9637160f3c096b4baf07f6146bc9d84a31c8 100644 (file)
--- a/youtube_dl/extractor/twitter.py
+++ b/youtube_dl/extractor/twitter.py
@@ -174,7 +174,7 @@ class TwitterCardIE(TwitterBaseIE):
          webpage = self._download_webpage(url, video_id)
  
          iframe_url = self._html_search_regex(
-            r'<iframe[^>]+src="((?:https?:)?//(?:www.youtube.com/embed/[^"]+|(?:www\.)?vine\.co/v/\w+/card))"',
+            r'<iframe[^>]+src="((?:https?:)?//(?:www\.youtube\.com/embed/[^"]+|(?:www\.)?vine\.co/v/\w+/card))"',
              webpage, 'video iframe', default=None)
          if iframe_url:
              return self.url_result(iframe_url)
diff --git a/youtube_dl/extractor/vice.py b/youtube_dl/extractor/vice.py

index b8b8bf97968ea430a445c521622461736346af7b..bcc28693a4545f9260f5e7942bcac4942faac380 100644 (file)
--- a/youtube_dl/extractor/vice.py
+++ b/youtube_dl/extractor/vice.py
@@ -198,7 +198,7 @@ class ViceShowIE(InfoExtractor):
  
  class ViceArticleIE(InfoExtractor):
      IE_NAME = 'vice:article'
-    _VALID_URL = r'https://www.vice.com/[^/]+/article/(?P<id>[^?#]+)'
+    _VALID_URL = r'https://www\.vice\.com/[^/]+/article/(?P<id>[^?#]+)'
  
      _TESTS = [{
          'url': 'https://www.vice.com/en_us/article/on-set-with-the-woman-making-mormon-porn-in-utah',
diff --git a/youtube_dl/extractor/videopremium.py b/youtube_dl/extractor/videopremium.py

index 5de8273c34aa61a6e1e79ce8b7d142ab9135d35d..cf690d7b0a669b67b84d2aedae992079040e7a64 100644 (file)
--- a/youtube_dl/extractor/videopremium.py
+++ b/youtube_dl/extractor/videopremium.py
@@ -26,7 +26,7 @@ class VideoPremiumIE(InfoExtractor):
          webpage_url = 'http://videopremium.tv/' + video_id
          webpage = self._download_webpage(webpage_url, video_id)
  
-        if re.match(r'^<html><head><script[^>]*>window.location\s*=', webpage):
+        if re.match(r'^<html><head><script[^>]*>window\.location\s*=', webpage):
              # Download again, we need a cookie
              webpage = self._download_webpage(
                  webpage_url, video_id,
diff --git a/youtube_dl/extractor/youtube.py b/youtube_dl/extractor/youtube.py

index edd8713b7eee9d78017bdbf7d10d442823ff3383..54f5d7279eb10ec43042adc3100e95a87166efba 100644 (file)
--- a/youtube_dl/extractor/youtube.py
+++ b/youtube_dl/extractor/youtube.py
@@ -1683,7 +1683,7 @@ class YoutubeIE(YoutubeBaseInfoExtractor):
          video_uploader_id = None
          video_uploader_url = None
          mobj = re.search(
-            r'<link itemprop="url" href="(?P<uploader_url>https?://www.youtube.com/(?:user|channel)/(?P<uploader_id>[^"]+))">',
+            r'<link itemprop="url" href="(?P<uploader_url>https?://www\.youtube\.com/(?:user|channel)/(?P<uploader_id>[^"]+))">',
              video_webpage)
          if mobj is not None:
              video_uploader_id = mobj.group('uploader_id')
author	Sergey M․ <dstftw@gmail.com>
	Mon, 9 Oct 2017 16:50:53 +0000 (23:50 +0700)
committer	Sergey M․ <dstftw@gmail.com>
	Mon, 9 Oct 2017 16:50:53 +0000 (23:50 +0700)
youtube_dl/extractor/aenetworks.py		patch \| blob \| history
youtube_dl/extractor/appletrailers.py		patch \| blob \| history
youtube_dl/extractor/ard.py		patch \| blob \| history
youtube_dl/extractor/bbc.py		patch \| blob \| history
youtube_dl/extractor/dailymotion.py		patch \| blob \| history
youtube_dl/extractor/deezer.py		patch \| blob \| history
youtube_dl/extractor/freespeech.py		patch \| blob \| history
youtube_dl/extractor/generic.py		patch \| blob \| history
youtube_dl/extractor/googleplus.py		patch \| blob \| history
youtube_dl/extractor/hrti.py		patch \| blob \| history
youtube_dl/extractor/ign.py		patch \| blob \| history
youtube_dl/extractor/infoq.py		patch \| blob \| history
youtube_dl/extractor/jeuxvideo.py		patch \| blob \| history
youtube_dl/extractor/livestream.py		patch \| blob \| history
youtube_dl/extractor/makertv.py		patch \| blob \| history
youtube_dl/extractor/mangomolo.py		patch \| blob \| history
youtube_dl/extractor/meipai.py		patch \| blob \| history
youtube_dl/extractor/mtv.py		patch \| blob \| history
youtube_dl/extractor/myvideo.py		patch \| blob \| history
youtube_dl/extractor/nationalgeographic.py		patch \| blob \| history
youtube_dl/extractor/naver.py		patch \| blob \| history
youtube_dl/extractor/npo.py		patch \| blob \| history
youtube_dl/extractor/ruhd.py		patch \| blob \| history
youtube_dl/extractor/stanfordoc.py		patch \| blob \| history
youtube_dl/extractor/theplatform.py		patch \| blob \| history
youtube_dl/extractor/thisav.py		patch \| blob \| history
youtube_dl/extractor/twitter.py		patch \| blob \| history
youtube_dl/extractor/vice.py		patch \| blob \| history
youtube_dl/extractor/videopremium.py		patch \| blob \| history
youtube_dl/extractor/youtube.py		patch \| blob \| history