[rdsca] New extractor

This commit is contained in:
felix 2015-07-11 18:56:07 +02:00
parent d919fa3344
commit ac8f97f2b3
2 changed files with 51 additions and 0 deletions

View file

@ -460,6 +460,7 @@
from .radiofrance import RadioFranceIE from .radiofrance import RadioFranceIE
from .rai import RaiIE from .rai import RaiIE
from .rbmaradio import RBMARadioIE from .rbmaradio import RBMARadioIE
from .rdsca import RDScaIE
from .redtube import RedTubeIE from .redtube import RedTubeIE
from .restudy import RestudyIE from .restudy import RestudyIE
from .reverbnation import ReverbNationIE from .reverbnation import ReverbNationIE

View file

@ -0,0 +1,50 @@
# coding: utf-8
from __future__ import unicode_literals
from .common import InfoExtractor
from ..utils import (
parse_iso8601,
url_basename,
)
class RDScaIE(InfoExtractor):
IE_NAME = 'RDS.ca'
_VALID_URL = r'http://(?:www\.)?rds\.ca/videos/(?P<id>.*)'
_TESTS = [{
'url': 'http://www.rds.ca/videos/football/nfl/fowler-jr-prend-la-direction-de-jacksonville-3.1132799',
'info_dict': {
"ext": "mp4",
"title": "Fowler Jr. prend la direction de Jacksonville",
"description": "Dante Fowler Jr. est le troisième choix du repêchage 2015 de la NFL. ",
"timestamp": 1430397346,
}
}]
def _real_extract(self, url):
video_id = url_basename(url)
webpage = self._download_webpage(url, video_id)
title = self._search_regex(
r'<span itemprop="name"[^>]*>([^\n]*)</span>', webpage, 'video title', default=None)
video_url = self._search_regex(
r'<span itemprop="contentURL" content="([^"]+)"', webpage, 'video URL')
upload_date = parse_iso8601(self._search_regex(
r'<span itemprop="uploadDate" content="([^"]+)"', webpage, 'upload date', default=None))
description = self._search_regex(
r'<span itemprop="description"[^>]*>([^\n]*)</span>', webpage, 'description', default=None)
thumbnail = self._search_regex(
r'<span itemprop="thumbnailUrl" content="([^"]+)"', webpage, 'upload date', default=None)
return {
'id': video_id,
'title': title,
'description': description,
'thumbnail': thumbnail,
'timestamp': upload_date,
'formats': [{
'url': video_url,
}],
}