[filmon] improve extraction

pull/11956/head
Remita Amine 7 years ago
parent a0758dfa1a
commit 4ce3407d08

@ -287,7 +287,10 @@ from .fc2 import (
FC2EmbedIE, FC2EmbedIE,
) )
from .fczenit import FczenitIE from .fczenit import FczenitIE
from .filmon import FilmOnIE, FilmOnVODIE from .filmon import (
FilmOnIE,
FilmOnChannelIE,
)
from .firstpost import FirstpostIE from .firstpost import FirstpostIE
from .firsttv import FirstTVIE from .firsttv import FirstTVIE
from .fivemin import FiveMinIE from .fivemin import FiveMinIE

@ -2,143 +2,177 @@
from __future__ import unicode_literals from __future__ import unicode_literals
from .common import InfoExtractor from .common import InfoExtractor
from ..utils import qualities from ..compat import (
from ..compat import compat_urllib_request compat_str,
compat_HTTPError,
)
_QUALITY = qualities(('low', 'high')) from ..utils import (
qualities,
strip_or_none,
int_or_none,
ExtractorError,
)
class FilmOnIE(InfoExtractor): class FilmOnIE(InfoExtractor):
_VALID_URL = r'https?://(?:www\.)?filmon\.com/(?:tv|channel)/(?P<id>[a-z0-9-]+)' IE_NAME = 'filmon'
_VALID_URL = r'(?:https?://(?:www\.)?filmon\.com/vod/view/|filmon:)(?P<id>\d+)'
_TESTS = [{ _TESTS = [{
'url': 'https://www.filmon.com/channel/filmon-sports', 'url': 'https://www.filmon.com/vod/view/24869-0-plan-9-from-outer-space',
'only_matching': True, 'info_dict': {
'id': '24869',
'ext': 'mp4',
'title': 'Plan 9 From Outer Space',
'description': 'Dead human, zombies and vampires',
},
}, { }, {
'url': 'https://www.filmon.com/tv/2894', 'url': 'https://www.filmon.com/vod/view/2825-1-popeye-series-1',
'only_matching': True, 'info_dict': {
'id': '2825',
'title': 'Popeye Series 1',
'description': 'The original series of Popeye.',
},
'playlist_mincount': 8,
}] }]
def _real_extract(self, url): def _real_extract(self, url):
channel_id = self._match_id(url) video_id = self._match_id(url)
request = compat_urllib_request.Request('https://www.filmon.com/channel/%s' % (channel_id)) try:
request.add_header('X-Requested-With', 'XMLHttpRequest') response = self._download_json(
channel_info = self._download_json(request, channel_id) 'https://www.filmon.com/api/vod/movie?id=%s' % video_id,
now_playing = channel_info['now_playing'] video_id)['response']
except ExtractorError as e:
if isinstance(e.cause, compat_HTTPError):
errmsg = self._parse_json(e.cause.read().decode(), video_id)['reason']
raise ExtractorError('%s said: %s' % (self.IE_NAME, errmsg), expected=True)
raise
thumbnails = [] title = response['title']
for thumb in now_playing.get('images', ()): description = strip_or_none(response.get('description'))
if thumb['type'] != '2':
continue
thumbnails.append({
'url': thumb['url'],
'width': int(thumb['width']),
'height': int(thumb['height']),
})
formats = [] if response.get('type_id') == 1:
entries = [self.url_result('filmon:' + episode_id) for episode_id in response.get('episodes', [])]
return self.playlist_result(entries, video_id, title, description)
for stream in channel_info['streams']: QUALITY = qualities(('low', 'high'))
formats = []
for format_id, stream in response.get('streams', {}).items():
stream_url = stream.get('url')
if not stream_url:
continue
formats.append({ formats.append({
'format_id': str(stream['id']), 'format_id': format_id,
# this is an m3u8 stream, but we are deliberately not using _extract_m3u8_formats 'url': stream_url,
# because 0) it doesn't have bitrate variants anyway, and 1) the ids generated
# by that method are highly unstable (because the bitrate is variable)
'url': stream['url'],
'resolution': stream['name'],
'format_note': 'expires after %u seconds' % int(stream['watch-timeout']),
'ext': 'mp4', 'ext': 'mp4',
'quality': _QUALITY(stream['quality']), 'quality': QUALITY(stream.get('quality')),
'preference': int(stream['watch-timeout']), 'protocol': 'm3u8_native',
}) })
self._sort_formats(formats) self._sort_formats(formats)
thumbnails = []
poster = response.get('poster', {})
thumbs = poster.get('thumbs', {})
thumbs['poster'] = poster
for thumb_id, thumb in thumbs.items():
thumb_url = thumb.get('url')
if not thumb_url:
continue
thumbnails.append({
'id': thumb_id,
'url': thumb_url,
'width': int_or_none(thumb.get('width')),
'height': int_or_none(thumb.get('height')),
})
return { return {
'id': str(channel_info['id']), 'id': video_id,
'display_id': channel_info['alias'], 'title': title,
'formats': formats, 'formats': formats,
# XXX: use the channel description (channel_info['description'])? 'description': description,
'uploader_id': channel_info['alias'],
'uploader': channel_info['title'], # XXX: kinda stretching it...
'title': now_playing.get('programme_name') or channel_info['title'],
'description': now_playing.get('programme_description'),
'thumbnails': thumbnails, 'thumbnails': thumbnails,
'is_live': True,
} }
class FilmOnVODIE(InfoExtractor): class FilmOnChannelIE(InfoExtractor):
_VALID_URL = r'https?://(?:www\.)?filmon\.com/vod/view/(?P<id>\d+)' IE_NAME = 'filmon:channel'
_VALID_URL = r'https?://(?:www\.)?filmon\.com/(?:tv|channel)/(?P<id>[a-z0-9-]+)'
_TESTS = [{ _TESTS = [{
'url': 'https://www.filmon.com/vod/view/24869-0-plan-9-from-outer-space', # VOD
'url': 'http://www.filmon.com/tv/sports-haters',
'info_dict': { 'info_dict': {
'id': '24869', 'id': '4190',
'ext': 'mp4', 'ext': 'mp4',
'title': 'Plan 9 From Outer Space', 'title': 'Sports Haters',
'description': 'Dead human, zombies and vampires', 'description': 'md5:dabcb4c1d9cfc77085612f1a85f8275d',
}, },
}, { }, {
'url': 'https://www.filmon.com/vod/view/2825-1-popeye-series-1', # LIVE
'info_dict': { 'url': 'https://www.filmon.com/channel/filmon-sports',
'id': '2825', 'only_matching': True,
'title': 'Popeye Series 1', }, {
}, 'url': 'https://www.filmon.com/tv/2894',
'playlist_count': 8, 'only_matching': True,
}] }]
def _real_extract(self, url): _THUMBNAIL_RES = [
video_id = self._match_id(url) ('logo', 56, 28),
('big_logo', 106, 106),
('extra_big_logo', 300, 300),
]
result = self._download_json('https://www.filmon.com/api/vod/movie?id=%s' % (video_id), video_id) def _real_extract(self, url):
if result['code'] != 200: channel_id = self._match_id(url)
raise ExtractorError('FilmOn said: %s' % (result['reason']), expected=True)
response = result['response'] try:
channel_data = self._download_json(
'http://www.filmon.com/api-v2/channel/' + channel_id, channel_id)['data']
except ExtractorError as e:
if isinstance(e.cause, compat_HTTPError):
errmsg = self._parse_json(e.cause.read().decode(), channel_id)['message']
raise ExtractorError('%s said: %s' % (self.IE_NAME, errmsg), expected=True)
raise
if response.get('episodes'): channel_id = compat_str(channel_data['id'])
return { is_live = not channel_data.get('is_vod') and not channel_data.get('is_vox')
'_type': 'playlist', title = channel_data['title']
'id': video_id,
'title': response['title'],
'entries': [{
'_type': 'url',
'url': 'https://www.filmon.com/vod/view/%s' % (ep),
} for ep in response['episodes']]
}
QUALITY = qualities(('low', 'high'))
formats = [] formats = []
for (id, stream) in response['streams'].items(): for stream in channel_data.get('streams', []):
stream_url = stream.get('url')
if not stream_url:
continue
if not is_live:
formats.extend(self._extract_wowza_formats(
stream_url, channel_id, skip_protocols=['dash', 'rtmp', 'rtsp']))
continue
quality = stream.get('quality')
formats.append({ formats.append({
'format_id': id, 'format_id': quality,
'url': stream['url'], # this is an m3u8 stream, but we are deliberately not using _extract_m3u8_formats
'resolution': stream['name'], # because it doesn't have bitrate variants anyway
'format_note': 'expires after %u seconds' % int(stream['watch-timeout']), 'url': stream_url,
'ext': 'mp4', 'ext': 'mp4',
'quality': _QUALITY(stream['quality']), 'quality': QUALITY(quality),
'preference': int(stream['watch-timeout']),
}) })
self._sort_formats(formats) self._sort_formats(formats)
poster = response['poster'] thumbnails = []
thumbnails = [{ for name, width, height in self._THUMBNAIL_RES:
'id': 'poster',
'url': poster['url'],
'width': poster['width'],
'height': poster['height'],
}]
for (id, thumb) in poster['thumbs'].items():
thumbnails.append({ thumbnails.append({
'id': id, 'id': name,
'url': thumb['url'], 'url': 'http://static.filmon.com/assets/channels/%s/%s.png' % (channel_id, name),
'width': thumb['width'], 'width': width,
'height': thumb['height'], 'height': height,
}) })
return { return {
'id': video_id, 'id': channel_id,
'title': response['title'], 'display_id': channel_data.get('alias'),
'formats': formats, 'title': self._live_title(title) if is_live else title,
'description': response['description'], 'description': channel_data.get('description'),
'thumbnails': thumbnails, 'thumbnails': thumbnails,
'formats': formats,
'is_live': is_live,
} }

Loading…
Cancel
Save