[Cleanup] Remove some unnecessary groups in regexes (#1738)

Authored by: Ashish0804
This commit is contained in:
Ashish Gupta 2021-11-30 21:44:47 +05:30 committed by GitHub
parent 0cbed930c8
commit 73f035e1fe
No known key found for this signature in database
GPG key ID: 4AEE18F83AFDEB23
22 changed files with 31 additions and 30 deletions

View file

@ -4,7 +4,7 @@
class AmazonStoreIE(InfoExtractor): class AmazonStoreIE(InfoExtractor):
_VALID_URL = r'(?:https?://)(?:www\.)?amazon\.(?:[a-z]{2,3})(?:\.[a-z]{2})?/(?:[^/]+/)?(?:dp|gp/product)/(?P<id>[^/&#$?]+)' _VALID_URL = r'https?://(?:www\.)?amazon\.(?:[a-z]{2,3})(?:\.[a-z]{2})?/(?:[^/]+/)?(?:dp|gp/product)/(?P<id>[^/&#$?]+)'
_TESTS = [{ _TESTS = [{
'url': 'https://www.amazon.co.uk/dp/B098XNCHLD/', 'url': 'https://www.amazon.co.uk/dp/B098XNCHLD/',

View file

@ -11,7 +11,7 @@
class CanalAlphaIE(InfoExtractor): class CanalAlphaIE(InfoExtractor):
_VALID_URL = r'(?:https?://)(?:www\.)?canalalpha\.ch/play/[^/]+/[^/]+/(?P<id>\d+)/?.*' _VALID_URL = r'https?://(?:www\.)?canalalpha\.ch/play/[^/]+/[^/]+/(?P<id>\d+)/?.*'
_TESTS = [{ _TESTS = [{
'url': 'https://www.canalalpha.ch/play/le-journal/episode/24520/jeudi-28-octobre-2021', 'url': 'https://www.canalalpha.ch/play/le-journal/episode/24520/jeudi-28-octobre-2021',

View file

@ -67,7 +67,7 @@ def _get_post(self, id, post_data):
class ChingariIE(ChingariBaseIE): class ChingariIE(ChingariBaseIE):
_VALID_URL = r'(?:https?://)(?:www\.)?chingari\.io/share/post\?id=(?P<id>[^&/#?]+)' _VALID_URL = r'https?://(?:www\.)?chingari\.io/share/post\?id=(?P<id>[^&/#?]+)'
_TESTS = [{ _TESTS = [{
'url': 'https://chingari.io/share/post?id=612f8f4ce1dc57090e8a7beb', 'url': 'https://chingari.io/share/post?id=612f8f4ce1dc57090e8a7beb',
'info_dict': { 'info_dict': {
@ -102,7 +102,7 @@ def _real_extract(self, url):
class ChingariUserIE(ChingariBaseIE): class ChingariUserIE(ChingariBaseIE):
_VALID_URL = r'(?:https?://)(?:www\.)?chingari\.io/(?!share/post)(?P<id>[^/?]+)' _VALID_URL = r'https?://(?:www\.)?chingari\.io/(?!share/post)(?P<id>[^/?]+)'
_TESTS = [{ _TESTS = [{
'url': 'https://chingari.io/dada1023', 'url': 'https://chingari.io/dada1023',
'playlist_mincount': 3, 'playlist_mincount': 3,

View file

@ -6,7 +6,7 @@
class CozyTVIE(InfoExtractor): class CozyTVIE(InfoExtractor):
_VALID_URL = r'(?:https?://)(?:www\.)?cozy\.tv/(?P<uploader>[^/]+)/replays/(?P<id>[^/$#&?]+)' _VALID_URL = r'https?://(?:www\.)?cozy\.tv/(?P<uploader>[^/]+)/replays/(?P<id>[^/$#&?]+)'
_TESTS = [{ _TESTS = [{
'url': 'https://cozy.tv/beardson/replays/2021-11-19_1', 'url': 'https://cozy.tv/beardson/replays/2021-11-19_1',

View file

@ -8,7 +8,7 @@
class EpiconIE(InfoExtractor): class EpiconIE(InfoExtractor):
_VALID_URL = r'(?:https?://)(?:www\.)?epicon\.in/(?:documentaries|movies|tv-shows/[^/?#]+/[^/?#]+)/(?P<id>[^/?#]+)' _VALID_URL = r'https?://(?:www\.)?epicon\.in/(?:documentaries|movies|tv-shows/[^/?#]+/[^/?#]+)/(?P<id>[^/?#]+)'
_TESTS = [{ _TESTS = [{
'url': 'https://www.epicon.in/documentaries/air-battle-of-srinagar', 'url': 'https://www.epicon.in/documentaries/air-battle-of-srinagar',
'info_dict': { 'info_dict': {
@ -84,7 +84,7 @@ def _real_extract(self, url):
class EpiconSeriesIE(InfoExtractor): class EpiconSeriesIE(InfoExtractor):
_VALID_URL = r'(?!.*season)(?:https?://)(?:www\.)?epicon\.in/tv-shows/(?P<id>[^/?#]+)' _VALID_URL = r'(?!.*season)https?://(?:www\.)?epicon\.in/tv-shows/(?P<id>[^/?#]+)'
_TESTS = [{ _TESTS = [{
'url': 'https://www.epicon.in/tv-shows/1-of-something', 'url': 'https://www.epicon.in/tv-shows/1-of-something',
'playlist_mincount': 5, 'playlist_mincount': 5,

View file

@ -10,7 +10,7 @@
class EUScreenIE(InfoExtractor): class EUScreenIE(InfoExtractor):
_VALID_URL = r'(?:https?://)(?:www\.)?euscreen\.eu/item.html\?id=(?P<id>[^&?$/]+)' _VALID_URL = r'https?://(?:www\.)?euscreen\.eu/item.html\?id=(?P<id>[^&?$/]+)'
_TESTS = [{ _TESTS = [{
'url': 'https://euscreen.eu/item.html?id=EUS_0EBCBF356BFC4E12A014023BA41BD98C', 'url': 'https://euscreen.eu/item.html?id=EUS_0EBCBF356BFC4E12A014023BA41BD98C',

View file

@ -15,7 +15,7 @@
class GabTVIE(InfoExtractor): class GabTVIE(InfoExtractor):
_VALID_URL = r'(?:https?://)tv.gab.com/channel/[^/]+/view/(?P<id>[a-z0-9-]+)' _VALID_URL = r'https?://tv\.gab\.com/channel/[^/]+/view/(?P<id>[a-z0-9-]+)'
_TESTS = [{ _TESTS = [{
'url': 'https://tv.gab.com/channel/wurzelroot/view/why-was-america-in-afghanistan-61217eacea5665de450d0488', 'url': 'https://tv.gab.com/channel/wurzelroot/view/why-was-america-in-afghanistan-61217eacea5665de450d0488',
'info_dict': { 'info_dict': {

View file

@ -6,7 +6,7 @@
class GronkhIE(InfoExtractor): class GronkhIE(InfoExtractor):
_VALID_URL = r'(?:https?://)(?:www\.)?gronkh\.tv/stream/(?P<id>\d+)' _VALID_URL = r'https?://(?:www\.)?gronkh\.tv/stream/(?P<id>\d+)'
_TESTS = [{ _TESTS = [{
'url': 'https://gronkh.tv/stream/536', 'url': 'https://gronkh.tv/stream/536',

View file

@ -296,7 +296,7 @@ def _real_extract(self, url):
class HotStarSeriesIE(HotStarBaseIE): class HotStarSeriesIE(HotStarBaseIE):
IE_NAME = 'hotstar:series' IE_NAME = 'hotstar:series'
_VALID_URL = r'(?P<url>(?:https?://)(?:www\.)?hotstar\.com(?:/in)?/tv/[^/]+/(?P<id>\d+))' _VALID_URL = r'(?P<url>https?://(?:www\.)?hotstar\.com(?:/in)?/tv/[^/]+/(?P<id>\d+))'
_TESTS = [{ _TESTS = [{
'url': 'https://www.hotstar.com/in/tv/radhakrishn/1260000646', 'url': 'https://www.hotstar.com/in/tv/radhakrishn/1260000646',
'info_dict': { 'info_dict': {

View file

@ -8,7 +8,7 @@
class KooIE(InfoExtractor): class KooIE(InfoExtractor):
_VALID_URL = r'(?:https?://)(?:www\.)?kooapp\.com/koo/[^/]+/(?P<id>[^/&#$?]+)' _VALID_URL = r'https?://(?:www\.)?kooapp\.com/koo/[^/]+/(?P<id>[^/&#$?]+)'
_TESTS = [{ # Test for video in the comments _TESTS = [{ # Test for video in the comments
'url': 'https://www.kooapp.com/koo/ytdlpTestAccount/946c4189-bc2d-4524-b95b-43f641e2adde', 'url': 'https://www.kooapp.com/koo/ytdlpTestAccount/946c4189-bc2d-4524-b95b-43f641e2adde',
'info_dict': { 'info_dict': {

View file

@ -6,7 +6,7 @@
class MLSSoccerIE(InfoExtractor): class MLSSoccerIE(InfoExtractor):
_VALID_DOMAINS = r'(?:(?:cfmontreal|intermiamicf|lagalaxy|lafc|houstondynamofc|dcunited|atlutd|mlssoccer|fcdallas|columbuscrew|coloradorapids|fccincinnati|chicagofirefc|austinfc|nashvillesc|whitecapsfc|sportingkc|soundersfc|sjearthquakes|rsl|timbers|philadelphiaunion|orlandocitysc|newyorkredbulls|nycfc)\.com|(?:torontofc)\.ca|(?:revolutionsoccer)\.net)' _VALID_DOMAINS = r'(?:(?:cfmontreal|intermiamicf|lagalaxy|lafc|houstondynamofc|dcunited|atlutd|mlssoccer|fcdallas|columbuscrew|coloradorapids|fccincinnati|chicagofirefc|austinfc|nashvillesc|whitecapsfc|sportingkc|soundersfc|sjearthquakes|rsl|timbers|philadelphiaunion|orlandocitysc|newyorkredbulls|nycfc)\.com|(?:torontofc)\.ca|(?:revolutionsoccer)\.net)'
_VALID_URL = r'(?:https?://)(?:www\.)?%s/video/#?(?P<id>[^/&$#?]+)' % _VALID_DOMAINS _VALID_URL = r'https?://(?:www\.)?%s/video/#?(?P<id>[^/&$#?]+)' % _VALID_DOMAINS
_TESTS = [{ _TESTS = [{
'url': 'https://www.mlssoccer.com/video/the-octagon-can-alphonso-davies-lead-canada-to-first-world-cup-since-1986#the-octagon-can-alphonso-davies-lead-canada-to-first-world-cup-since-1986', 'url': 'https://www.mlssoccer.com/video/the-octagon-can-alphonso-davies-lead-canada-to-first-world-cup-since-1986#the-octagon-can-alphonso-davies-lead-canada-to-first-world-cup-since-1986',

View file

@ -5,7 +5,7 @@
class MuseScoreIE(InfoExtractor): class MuseScoreIE(InfoExtractor):
_VALID_URL = r'(?:https?://)(?:www\.)?musescore\.com/(?:user/\d+|[^/]+)(?:/scores)?/(?P<id>[^#&?]+)' _VALID_URL = r'https?://(?:www\.)?musescore\.com/(?:user/\d+|[^/]+)(?:/scores)?/(?P<id>[^#&?]+)'
_TESTS = [{ _TESTS = [{
'url': 'https://musescore.com/user/73797/scores/142975', 'url': 'https://musescore.com/user/73797/scores/142975',
'info_dict': { 'info_dict': {
@ -13,7 +13,7 @@ class MuseScoreIE(InfoExtractor):
'ext': 'mp3', 'ext': 'mp3',
'title': 'WA Mozart Marche Turque (Turkish March fingered)', 'title': 'WA Mozart Marche Turque (Turkish March fingered)',
'description': 'md5:7ede08230e4eaabd67a4a98bb54d07be', 'description': 'md5:7ede08230e4eaabd67a4a98bb54d07be',
'thumbnail': r're:(?:https?://)(?:www\.)?musescore\.com/.*\.png[^$]+', 'thumbnail': r're:https?://(?:www\.)?musescore\.com/.*\.png[^$]+',
'uploader': 'PapyPiano', 'uploader': 'PapyPiano',
'creator': 'Wolfgang Amadeus Mozart', 'creator': 'Wolfgang Amadeus Mozart',
} }
@ -24,7 +24,7 @@ class MuseScoreIE(InfoExtractor):
'ext': 'mp3', 'ext': 'mp3',
'title': 'Sweet Child O\' Mine Guns N\' Roses sweet child', 'title': 'Sweet Child O\' Mine Guns N\' Roses sweet child',
'description': 'md5:4dca71191c14abc312a0a4192492eace', 'description': 'md5:4dca71191c14abc312a0a4192492eace',
'thumbnail': r're:(?:https?://)(?:www\.)?musescore\.com/.*\.png[^$]+', 'thumbnail': r're:https?://(?:www\.)?musescore\.com/.*\.png[^$]+',
'uploader': 'roxbelviolin', 'uploader': 'roxbelviolin',
'creator': 'Guns N´Roses Arr. Roxbel Violin', 'creator': 'Guns N´Roses Arr. Roxbel Violin',
} }
@ -35,7 +35,7 @@ class MuseScoreIE(InfoExtractor):
'ext': 'mp3', 'ext': 'mp3',
'title': 'Für Elise Beethoven', 'title': 'Für Elise Beethoven',
'description': 'md5:49515a3556d5ecaf9fa4b2514064ac34', 'description': 'md5:49515a3556d5ecaf9fa4b2514064ac34',
'thumbnail': r're:(?:https?://)(?:www\.)?musescore\.com/.*\.png[^$]+', 'thumbnail': r're:https?://(?:www\.)?musescore\.com/.*\.png[^$]+',
'uploader': 'ClassicMan', 'uploader': 'ClassicMan',
'creator': 'Ludwig van Beethoven (17701827)', 'creator': 'Ludwig van Beethoven (17701827)',
} }

View file

@ -180,7 +180,7 @@ def _real_extract(self, url):
class MxplayerShowIE(InfoExtractor): class MxplayerShowIE(InfoExtractor):
_VALID_URL = r'(?:https?://)(?:www\.)?mxplayer\.in/show/(?P<display_id>[-\w]+)-(?P<id>\w+)/?(?:$|[#?])' _VALID_URL = r'https?://(?:www\.)?mxplayer\.in/show/(?P<display_id>[-\w]+)-(?P<id>\w+)/?(?:$|[#?])'
_TESTS = [{ _TESTS = [{
'url': 'https://www.mxplayer.in/show/watch-chakravartin-ashoka-samrat-series-online-a8f44e3cc0814b5601d17772cedf5417', 'url': 'https://www.mxplayer.in/show/watch-chakravartin-ashoka-samrat-series-online-a8f44e3cc0814b5601d17772cedf5417',
'playlist_mincount': 440, 'playlist_mincount': 440,

View file

@ -5,7 +5,7 @@
class OneFootballIE(InfoExtractor): class OneFootballIE(InfoExtractor):
_VALID_URL = r'(?:https?://)(?:www\.)?onefootball\.com/[a-z]{2}/video/[^/&?#]+-(?P<id>\d+)' _VALID_URL = r'https?://(?:www\.)?onefootball\.com/[a-z]{2}/video/[^/&?#]+-(?P<id>\d+)'
_TESTS = [{ _TESTS = [{
'url': 'https://onefootball.com/en/video/highlights-fc-zuerich-3-3-fc-basel-34012334', 'url': 'https://onefootball.com/en/video/highlights-fc-zuerich-3-3-fc-basel-34012334',

View file

@ -9,7 +9,7 @@
class PlanetMarathiIE(InfoExtractor): class PlanetMarathiIE(InfoExtractor):
_VALID_URL = r'(?:https?://)(?:www\.)?planetmarathi\.com/titles/(?P<id>[^/#&?$]+)' _VALID_URL = r'https?://(?:www\.)?planetmarathi\.com/titles/(?P<id>[^/#&?$]+)'
_TESTS = [{ _TESTS = [{
'url': 'https://www.planetmarathi.com/titles/ek-unad-divas', 'url': 'https://www.planetmarathi.com/titles/ek-unad-divas',
'playlist_mincount': 2, 'playlist_mincount': 2,

View file

@ -10,7 +10,7 @@
class ProjectVeritasIE(InfoExtractor): class ProjectVeritasIE(InfoExtractor):
_VALID_URL = r'(?:https?://)(?:www\.)?projectveritas\.com/(?P<type>news|video)/(?P<id>[^/?#]+)' _VALID_URL = r'https?://(?:www\.)?projectveritas\.com/(?P<type>news|video)/(?P<id>[^/?#]+)'
_TESTS = [{ _TESTS = [{
'url': 'https://www.projectveritas.com/news/exclusive-inside-the-new-york-and-new-jersey-hospitals-battling-coronavirus/', 'url': 'https://www.projectveritas.com/news/exclusive-inside-the-new-york-and-new-jersey-hospitals-battling-coronavirus/',
'info_dict': { 'info_dict': {

View file

@ -16,7 +16,7 @@
class ShemarooMeIE(InfoExtractor): class ShemarooMeIE(InfoExtractor):
_VALID_URL = r'(?:https?://)(?:www\.)?shemaroome\.com/(?:movies|shows)/(?P<id>[^?#]+)' _VALID_URL = r'https?://(?:www\.)?shemaroome\.com/(?:movies|shows)/(?P<id>[^?#]+)'
_TESTS = [{ _TESTS = [{
'url': 'https://www.shemaroome.com/movies/dil-hai-tumhaara', 'url': 'https://www.shemaroome.com/movies/dil-hai-tumhaara',
'info_dict': { 'info_dict': {
@ -78,7 +78,7 @@ def _real_extract(self, url):
iv = [0] * 16 iv = [0] * 16
m3u8_url = intlist_to_bytes(aes_cbc_decrypt(url_data, key, iv)) m3u8_url = intlist_to_bytes(aes_cbc_decrypt(url_data, key, iv))
m3u8_url = m3u8_url[:-compat_ord((m3u8_url[-1]))].decode('ascii') m3u8_url = m3u8_url[:-compat_ord((m3u8_url[-1]))].decode('ascii')
formats = self._extract_m3u8_formats(m3u8_url, video_id, fatal=False, headers={'stream_key': data_json['stream_key']}) formats, m3u8_subs = self._extract_m3u8_formats_and_subtitles(m3u8_url, video_id, fatal=False, headers={'stream_key': data_json['stream_key']})
self._sort_formats(formats) self._sort_formats(formats)
release_date = self._html_search_regex( release_date = self._html_search_regex(
@ -91,6 +91,7 @@ def _real_extract(self, url):
subtitles.setdefault('EN', []).append({ subtitles.setdefault('EN', []).append({
'url': self._proto_relative_url(sub_url), 'url': self._proto_relative_url(sub_url),
}) })
subtitles = self._merge_subtitles(subtitles, m3u8_subs)
description = self._html_search_regex(r'(?s)>Synopsis(</.+?)</', webpage, 'description', fatal=False) description = self._html_search_regex(r'(?s)>Synopsis(</.+?)</', webpage, 'description', fatal=False)
return { return {

View file

@ -9,7 +9,7 @@
class SkyNewsAUIE(InfoExtractor): class SkyNewsAUIE(InfoExtractor):
_VALID_URL = r'(?:https?://)(?:www\.)?skynews\.com\.au/[^/]+/[^/]+/[^/]+/video/(?P<id>[a-z0-9]+)' _VALID_URL = r'https?://(?:www\.)?skynews\.com\.au/[^/]+/[^/]+/[^/]+/video/(?P<id>[a-z0-9]+)'
_TESTS = [{ _TESTS = [{
'url': 'https://www.skynews.com.au/world-news/united-states/incredible-vision-shows-lava-overflowing-from-spains-la-palma-volcano/video/0f4c6243d6903502c01251f228b91a71', 'url': 'https://www.skynews.com.au/world-news/united-states/incredible-vision-shows-lava-overflowing-from-spains-la-palma-volcano/video/0f4c6243d6903502c01251f228b91a71',

View file

@ -11,7 +11,7 @@
class ThreeSpeakIE(InfoExtractor): class ThreeSpeakIE(InfoExtractor):
_VALID_URL = r'(?:https?://)(?:www\.)?3speak\.tv/watch\?v\=[^/]+/(?P<id>[^/$&#?]+)' _VALID_URL = r'https?://(?:www\.)?3speak\.tv/watch\?v\=[^/]+/(?P<id>[^/$&#?]+)'
_TESTS = [{ _TESTS = [{
'url': 'https://3speak.tv/watch?v=dannyshine/wjgoxyfy', 'url': 'https://3speak.tv/watch?v=dannyshine/wjgoxyfy',
@ -75,7 +75,7 @@ def _real_extract(self, url):
class ThreeSpeakUserIE(InfoExtractor): class ThreeSpeakUserIE(InfoExtractor):
_VALID_URL = r'(?:https?://)(?:www\.)?3speak\.tv/user/(?P<id>[^/$&?#]+)' _VALID_URL = r'https?://(?:www\.)?3speak\.tv/user/(?P<id>[^/$&?#]+)'
_TESTS = [{ _TESTS = [{
'url': 'https://3speak.tv/user/theycallmedan', 'url': 'https://3speak.tv/user/theycallmedan',

View file

@ -13,7 +13,7 @@
class UtreonIE(InfoExtractor): class UtreonIE(InfoExtractor):
_VALID_URL = r'(?:https?://)(?:www\.)?utreon.com/v/(?P<id>[a-zA-Z0-9_-]+)' _VALID_URL = r'https?://(?:www\.)?utreon.com/v/(?P<id>[a-zA-Z0-9_-]+)'
_TESTS = [{ _TESTS = [{
'url': 'https://utreon.com/v/z_I7ikQbuDw', 'url': 'https://utreon.com/v/z_I7ikQbuDw',
'info_dict': { 'info_dict': {

View file

@ -15,7 +15,7 @@ class VootIE(InfoExtractor):
_VALID_URL = r'''(?x) _VALID_URL = r'''(?x)
(?: (?:
voot:| voot:|
(?:https?://)(?:www\.)?voot\.com/? https?://(?:www\.)?voot\.com/?
(?: (?:
movies/[^/]+/| movies/[^/]+/|
(?:shows|kids)/(?:[^/]+/){4} (?:shows|kids)/(?:[^/]+/){4}

View file

@ -21,7 +21,7 @@ class Zee5IE(InfoExtractor):
_VALID_URL = r'''(?x) _VALID_URL = r'''(?x)
(?: (?:
zee5:| zee5:|
(?:https?://)(?:www\.)?zee5\.com/(?:[^#?]+/)? https?://(?:www\.)?zee5\.com/(?:[^#?]+/)?
(?: (?:
(?:tvshows|kids|zee5originals)(?:/[^#/?]+){3} (?:tvshows|kids|zee5originals)(?:/[^#/?]+){3}
|movies/[^#/?]+ |movies/[^#/?]+
@ -174,7 +174,7 @@ class Zee5SeriesIE(InfoExtractor):
_VALID_URL = r'''(?x) _VALID_URL = r'''(?x)
(?: (?:
zee5:series:| zee5:series:|
(?:https?://)(?:www\.)?zee5\.com/(?:[^#?]+/)? https?://(?:www\.)?zee5\.com/(?:[^#?]+/)?
(?:tvshows|kids|zee5originals)(?:/[^#/?]+){2}/ (?:tvshows|kids|zee5originals)(?:/[^#/?]+){2}/
) )
(?P<id>[^#/?]+)/?(?:$|[?#]) (?P<id>[^#/?]+)/?(?:$|[?#])