[porncom] Fix metadata extraction (closes #14911)

author Sergey M․ <dstftw@gmail.com>

Tue, 5 Dec 2017 15:42:02 +0000 (22:42 +0700)

committer Sergey M․ <dstftw@gmail.com>

Tue, 5 Dec 2017 15:42:02 +0000 (22:42 +0700)
author Sergey M․ <dstftw@gmail.com>
Tue, 5 Dec 2017 15:42:02 +0000 (22:42 +0700)
committer Sergey M․ <dstftw@gmail.com>
Tue, 5 Dec 2017 15:42:02 +0000 (22:42 +0700)
diff --git a/youtube_dl/extractor/porncom.py b/youtube_dl/extractor/porncom.py

index 8218c7d3bf7ddc8cc7de74f2fc5d2d838cecc982..60ade06da37d2bd2a56e717f9761f525cb4b7436 100644 (file)
--- a/youtube_dl/extractor/porncom.py
+++ b/youtube_dl/extractor/porncom.py
@@ -77,12 +77,14 @@ class PornComIE(InfoExtractor):
          self._sort_formats(formats)
  
          view_count = str_to_int(self._search_regex(
-            r'class=["\']views["\'][^>]*><p>([\d,.]+)', webpage,
+            (r'Views:\s*</span>\s*<span>\s*([\d,.]+)',
+             r'class=["\']views["\'][^>]*><p>([\d,.]+)'), webpage,
              'view count', fatal=False))
  
          def extract_list(kind):
              s = self._search_regex(
-                r'(?s)<p[^>]*>%s:(.+?)</p>' % kind.capitalize(),
+                (r'(?s)%s:\s*</span>\s*<span>(.+?)</span>' % kind.capitalize(),
+                 r'(?s)<p[^>]*>%s:(.+?)</p>' % kind.capitalize()),
                  webpage, kind, fatal=False)
              return re.findall(r'<a[^>]+>([^<]+)</a>', s or '')
author	Sergey M․ <dstftw@gmail.com>
	Tue, 5 Dec 2017 15:42:02 +0000 (22:42 +0700)
committer	Sergey M․ <dstftw@gmail.com>
	Tue, 5 Dec 2017 15:42:02 +0000 (22:42 +0700)