diff --git a/yt_dlp/extractor/abc.py b/yt_dlp/extractor/abc.py index 96d92abd5..b9bf8c0a5 100644 --- a/yt_dlp/extractor/abc.py +++ b/yt_dlp/extractor/abc.py @@ -329,14 +329,19 @@ def tokenize_url(url, token): 'hdnea': token, }) - for sd_url in traverse_obj(stream, ('streams', 'hls-latest', ('1080', '720', 'sd', 'sd-low'), {str})): - if not sd_url: - continue - formats = self._extract_m3u8_formats( - tokenize_url(sd_url, token), video_id, 'mp4', - entry_protocol='m3u8_native', m3u8_id='hls', fatal=False) - if formats: - break + formats = [] + # hls: pre-merged formats + # hls-latest: same as hls, but sometimes has separate audio tracks + # Note: pre-merged formats in hls-latest are treated as video-only if audio-only tracks + # are present, so we extract both types + for label in ('hls', 'hls-latest'): + for sd_url in traverse_obj(stream, ('streams', label, ('1080', '720', 'sd', 'sd-low'), {str})): + fmts = self._extract_m3u8_formats( + tokenize_url(sd_url, token), video_id, 'mp4', + entry_protocol='m3u8_native', m3u8_id=label, fatal=False) + if fmts: + formats.extend(fmts) + break subtitles = {} src_vtt = traverse_obj(stream, ('captions', 'src-vtt'))