[lnkgo] Adapt to website changes

This commit is contained in:
Naglis Jonaitis 2015-01-27 15:38:54 +02:00
parent 9f0df77ab1
commit 2103d038b3

View File

@ -6,13 +6,12 @@ import re
from .common import InfoExtractor from .common import InfoExtractor
from ..utils import ( from ..utils import (
int_or_none, int_or_none,
js_to_json,
unified_strdate, unified_strdate,
) )
class LnkGoIE(InfoExtractor): class LnkGoIE(InfoExtractor):
_VALID_URL = r'https?://(?:www\.)?lnkgo\.alfa\.lt/visi\-video/(?P<show>[^/]+)/ziurek\-(?P<display_id>[A-Za-z0-9\-]+)' _VALID_URL = r'https?://(?:www\.)?lnkgo\.alfa\.lt/visi-video/(?P<show>[^/]+)/ziurek-(?P<id>[A-Za-z0-9-]+)'
_TESTS = [{ _TESTS = [{
'url': 'http://lnkgo.alfa.lt/visi-video/yra-kaip-yra/ziurek-yra-kaip-yra-162', 'url': 'http://lnkgo.alfa.lt/visi-video/yra-kaip-yra/ziurek-yra-kaip-yra-162',
'info_dict': { 'info_dict': {
@ -51,8 +50,7 @@ class LnkGoIE(InfoExtractor):
} }
def _real_extract(self, url): def _real_extract(self, url):
mobj = re.match(self._VALID_URL, url) display_id = self._match_id(url)
display_id = mobj.group('display_id')
webpage = self._download_webpage( webpage = self._download_webpage(
url, display_id, 'Downloading player webpage') url, display_id, 'Downloading player webpage')
@ -61,6 +59,8 @@ class LnkGoIE(InfoExtractor):
r'data-ep="([^"]+)"', webpage, 'video ID') r'data-ep="([^"]+)"', webpage, 'video ID')
title = self._og_search_title(webpage) title = self._og_search_title(webpage)
description = self._og_search_description(webpage) description = self._og_search_description(webpage)
upload_date = unified_strdate(self._search_regex(
r'class="[^"]*meta-item[^"]*air-time[^"]*">.*?<strong>([^<]+)</strong>', webpage, 'upload date', fatal=False))
thumbnail_w = int_or_none( thumbnail_w = int_or_none(
self._og_search_property('image:width', webpage, 'thumbnail width', fatal=False)) self._og_search_property('image:width', webpage, 'thumbnail width', fatal=False))
@ -75,39 +75,28 @@ class LnkGoIE(InfoExtractor):
'height': thumbnail_h, 'height': thumbnail_h,
}) })
upload_date = unified_strdate(self._search_regex( config = self._parse_json(self._search_regex(
r'class="meta-item\sair-time">.*?<strong>([^<]+)</strong>', webpage, 'upload date', fatal=False)) r'episodePlayer\((\{.*?\}),\s*\{', webpage, 'sources'), video_id)
duration = int_or_none(self._search_regex(
r'VideoDuration = "([^"]+)"', webpage, 'duration', fatal=False))
pg_rating = self._search_regex( if config.get('pGeo'):
r'pgrating="([^"]+)"', webpage, 'PG rating', fatal=False, default='') self.report_warning(
age_limit = self._AGE_LIMITS.get(pg_rating.upper(), 0) 'This content might not be available in your country due to copyright reasons')
sources_js = self._search_regex( formats = [{
r'(?s)sources:\s(\[.*?\]),', webpage, 'sources') 'format_id': 'hls',
sources = self._parse_json( 'ext': 'mp4',
sources_js, video_id, transform_source=js_to_json) 'url': config['EpisodeVideoLink_HLS'],
}]
formats = [] m = re.search(r'^(?P<url>rtmp://[^/]+/(?P<app>[^/]+))/(?P<play_path>.+)$', config['EpisodeVideoLink'])
for source in sources: if m:
if source.get('provider') == 'rtmp': formats.append({
m = re.search(r'^(?P<url>rtmp://[^/]+/(?P<app>[^/]+))/(?P<play_path>.+)$', source['file']) 'format_id': 'rtmp',
if not m: 'ext': 'flv',
continue 'url': m.group('url'),
formats.append({ 'play_path': m.group('play_path'),
'format_id': 'rtmp', 'page_url': url,
'ext': 'flv', })
'url': m.group('url'),
'play_path': m.group('play_path'),
'page_url': url,
})
elif source.get('file').endswith('.m3u8'):
formats.append({
'format_id': 'hls',
'ext': source.get('type', 'mp4'),
'url': source['file'],
})
self._sort_formats(formats) self._sort_formats(formats)
@ -117,8 +106,8 @@ class LnkGoIE(InfoExtractor):
'title': title, 'title': title,
'formats': formats, 'formats': formats,
'thumbnails': [thumbnail], 'thumbnails': [thumbnail],
'duration': duration, 'duration': int_or_none(config.get('VideoTime')),
'description': description, 'description': description,
'age_limit': age_limit, 'age_limit': self._AGE_LIMITS.get(config.get('PGRating'), 0),
'upload_date': upload_date, 'upload_date': upload_date,
} }