2015-08-13 02:07:27 +10:00
|
|
|
# coding: utf-8
|
|
|
|
from __future__ import unicode_literals
|
|
|
|
|
|
|
|
from .common import InfoExtractor
|
2015-08-13 05:11:55 +10:00
|
|
|
from ..utils import ExtractorError
|
2015-08-13 02:07:27 +10:00
|
|
|
|
|
|
|
|
2015-08-13 04:26:13 +10:00
|
|
|
class RTVNHIE(InfoExtractor):
|
2015-08-13 02:07:27 +10:00
|
|
|
_VALID_URL = r'https?://(?:www\.)?rtvnh\.nl/video/(?P<id>[0-9]+)'
|
|
|
|
_TEST = {
|
|
|
|
'url': 'http://www.rtvnh.nl/video/131946',
|
|
|
|
'md5': '6e1d0ab079e2a00b6161442d3ceacfc1',
|
|
|
|
'info_dict': {
|
|
|
|
'id': '131946',
|
|
|
|
'ext': 'mp4',
|
|
|
|
'title': 'Grote zoektocht in zee bij Zandvoort naar vermiste vrouw',
|
2015-08-13 04:26:13 +10:00
|
|
|
'thumbnail': 're:^https?:.*\.jpg$'
|
2015-08-13 02:07:27 +10:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
def _real_extract(self, url):
|
|
|
|
video_id = self._match_id(url)
|
2015-08-13 05:00:05 +10:00
|
|
|
|
|
|
|
meta = self._parse_json(self._download_webpage(
|
|
|
|
'http://www.rtvnh.nl/video/json?m=' + video_id, video_id), video_id)
|
2015-08-13 05:11:55 +10:00
|
|
|
|
|
|
|
status = meta.get('status')
|
|
|
|
if status != 200:
|
|
|
|
raise ExtractorError(
|
|
|
|
'%s returned error code %d' % (self.IE_NAME, status), expected=True)
|
|
|
|
|
2015-08-13 05:00:05 +10:00
|
|
|
formats = self._extract_smil_formats(
|
2015-08-13 05:02:50 +10:00
|
|
|
'http://www.rtvnh.nl/video/smil?m=' + video_id, video_id, fatal=False)
|
2015-08-13 02:07:27 +10:00
|
|
|
|
|
|
|
for item in meta['source']['fb']:
|
|
|
|
if item.get('type') == 'hls':
|
2015-08-13 05:00:05 +10:00
|
|
|
formats.extend(self._extract_m3u8_formats(
|
|
|
|
item['file'], video_id, ext='mp4', entry_protocol='m3u8_native'))
|
2015-08-13 02:07:27 +10:00
|
|
|
elif item.get('type') == '':
|
|
|
|
formats.append({'url': item['file']})
|
2016-03-27 12:03:08 +11:00
|
|
|
self._sort_formats(formats)
|
2015-08-13 05:11:55 +10:00
|
|
|
|
2015-08-13 02:07:27 +10:00
|
|
|
return {
|
|
|
|
'id': video_id,
|
|
|
|
'title': meta['title'].strip(),
|
2015-08-13 05:00:25 +10:00
|
|
|
'thumbnail': meta.get('image'),
|
2015-08-13 02:07:27 +10:00
|
|
|
'formats': formats
|
|
|
|
}
|