[niconico] Fix title and thumbnail extraction (#273)

Authored by: CXwudi
This commit is contained in:
CXwudi 2021-04-25 19:53:57 -07:00 committed by GitHub
parent 87c3d06271
commit 6b1d8c1e30
No known key found for this signature in database
GPG key ID: 4AEE18F83AFDEB23

View file

@@ -493,7 +493,8 @@ def get_video_info_xml(items):
# Start extracting information # Start extracting information
title = ( title = (
get_video_info_web(['originalTitle', 'title']) get_video_info_xml('title') # prefer to get the untranslated original title
or get_video_info_web(['originalTitle', 'title'])
or self._og_search_title(webpage, default=None) or self._og_search_title(webpage, default=None)
or self._html_search_regex( or self._html_search_regex(
r'<span[^>]+class="videoHeaderTitle"[^>]*>([^<]+)</span>', r'<span[^>]+class="videoHeaderTitle"[^>]*>([^<]+)</span>',
@@ -507,7 +508,9 @@ def get_video_info_xml(items):
thumbnail = ( thumbnail = (
self._html_search_regex(r'<meta property="og:image" content="([^"]+)">', webpage, 'thumbnail data', default=None) self._html_search_regex(r'<meta property="og:image" content="([^"]+)">', webpage, 'thumbnail data', default=None)
or get_video_info_web(['thumbnail_url', 'largeThumbnailURL', 'thumbnailURL']) or try_get( # choose highest from 720p to 240p
get_video_info_web('thumbnail'),
['ogp', 'player', 'largeUrl', 'middleUrl', 'url'])
or self._html_search_meta('image', webpage, 'thumbnail', default=None) or self._html_search_meta('image', webpage, 'thumbnail', default=None)
or video_detail.get('thumbnail')) or video_detail.get('thumbnail'))