[extractor/common] Use episode name as title in _json_ld

[youtube-dl] / youtube_dl / extractor / common.py
diff --git a/youtube_dl/extractor/common.py b/youtube_dl/extractor/common.py

index 8452125c8802b1398698c334084c85b673e80964..9e7febcadf12c9d2450f35783e45b4b6d04dbe3f 100644 (file)
--- a/youtube_dl/extractor/common.py
+++ b/youtube_dl/extractor/common.py
@@ -606,6 +606,11 @@ class InfoExtractor(object):
          except (compat_urllib_error.URLError, compat_http_client.HTTPException, socket.error) as err:
              if isinstance(err, compat_urllib_error.HTTPError):
                  if self.__can_accept_status_code(err, expected_status):
+                    # Keep a reference to the error on its file object so the
+                    # file is not closed before it can be read. This works
+                    # around the effects of the change introduced in Python
+                    # 3.4.1 for <https://bugs.python.org/issue15002>.
+                    err.fp._error = err
                      return err.fp
  
              if errnote is False:
@@ -1234,17 +1239,27 @@ class InfoExtractor(object):
                  if expected_type is not None and expected_type != item_type:
                      return info
                  if item_type in ('TVEpisode', 'Episode'):
+                    episode_name = unescapeHTML(e.get('name'))
                      info.update({
-                        'episode': unescapeHTML(e.get('name')),
+                        'episode': episode_name,
                          'episode_number': int_or_none(e.get('episodeNumber')),
                          'description': unescapeHTML(e.get('description')),
                      })
+                    if not info.get('title') and episode_name:
+                        info['title'] = episode_name
                      part_of_season = e.get('partOfSeason')
                      if isinstance(part_of_season, dict) and part_of_season.get('@type') in ('TVSeason', 'Season', 'CreativeWorkSeason'):
                          info['season_number'] = int_or_none(part_of_season.get('seasonNumber'))
                      part_of_series = e.get('partOfSeries') or e.get('partOfTVSeries')
                      if isinstance(part_of_series, dict) and part_of_series.get('@type') in ('TVSeries', 'Series', 'CreativeWorkSeries'):
                          info['series'] = unescapeHTML(part_of_series.get('name'))
+                elif item_type == 'Movie':
+                    info.update({
+                        'title': unescapeHTML(e.get('name')),
+                        'description': unescapeHTML(e.get('description')),
+                        'duration': parse_duration(e.get('duration')),
+                        'timestamp': unified_timestamp(e.get('dateCreated')),
+                    })
                  elif item_type in ('Article', 'NewsArticle'):
                      info.update({
                          'timestamp': parse_iso8601(e.get('datePublished')),