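More title extraction fixes: accept the new "<title>..., ... Porn: xHamster" page title format alongside the old " - xHamster.com" suffix, fall back to the page's <h1> heading, and fix the continuation-line indentation in the thumbnail lookup.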

[youtube-dl] / youtube_dl / extractor / xhamster.py
diff --git a/youtube_dl/extractor/xhamster.py b/youtube_dl/extractor/xhamster.py

index f76ee8fd425dc743ef7f15f3de8a70b2e404c917..8938c0e4561d2c6163158e409106dd2e928e85bf 100644 (file)
--- a/youtube_dl/extractor/xhamster.py
+++ b/youtube_dl/extractor/xhamster.py
@@ -63,7 +63,9 @@ class XHamsterIE(InfoExtractor):
          mrss_url = '%s://xhamster.com/movies/%s/%s.html' % (proto, video_id, seo)
          webpage = self._download_webpage(mrss_url, video_id)
  
-        title = self._html_search_regex(r'<title>(?P<title>.+?) - xHamster\.com</title>', webpage, 'title')
+        title = self._html_search_regex(
+            [r'<title>(?P<title>.+?)(?:, (?:[^,]+? )?Porn: xHamster| - xHamster\.com)</title>',
+             r'<h1>([^<]+)</h1>'], webpage, 'title')
  
          # Only a few videos have an description
          mobj = re.search(r'<span>Description: </span>([^<]+)', webpage)
@@ -81,7 +83,7 @@ class XHamsterIE(InfoExtractor):
          thumbnail = self._search_regex(
              [r'''thumb\s*:\s*(?P<q>["'])(?P<thumbnail>.+?)(?P=q)''',
               r'''<video[^>]+poster=(?P<q>["'])(?P<thumbnail>.+?)(?P=q)[^>]*>'''],
-             webpage, 'thumbnail', fatal=False, group='thumbnail')
+            webpage, 'thumbnail', fatal=False, group='thumbnail')
  
          duration = parse_duration(self._html_search_regex(r'<span>Runtime:</span> (\d+:\d+)</div>',
                                                            webpage, 'duration', fatal=False))