diff --git a/youtube_dl/extractor/gamekings.py b/youtube_dl/extractor/gamekings.py index cf8e90d7d..1821f26d8 100644 --- a/youtube_dl/extractor/gamekings.py +++ b/youtube_dl/extractor/gamekings.py @@ -3,11 +3,16 @@ from __future__ import unicode_literals import re from .common import InfoExtractor +from ..utils import ( + xpath_text, + xpath_with_ns + ) class GamekingsIE(InfoExtractor): _VALID_URL = r'http://www\.gamekings\.tv/videos/(?P[0-9a-z\-]+)' - _TEST = { + _TESTS = [ + { 'url': 'http://www.gamekings.tv/videos/phoenix-wright-ace-attorney-dual-destinies-review/', # MD5 is flaky, seems to change regularly # 'md5': '2f32b1f7b80fdc5cb616efb4f387f8a3', @@ -16,21 +21,44 @@ class GamekingsIE(InfoExtractor): 'ext': 'mp4', 'title': 'Phoenix Wright: Ace Attorney \u2013 Dual Destinies Review', 'description': 'md5:36fd701e57e8c15ac8682a2374c99731', + } + }, + { + 'url': 'http://www.gamekings.tv/videos/the-legend-of-zelda-majoras-mask/', + 'info_dict': { + 'id': '118933752', + 'ext': 'mp4', + 'title': 'The Legend of Zelda: Majora’s Mask', + 'description': 'md5:9917825fe0e9f4057601fe1e38860de3' + } } - } + ] def _real_extract(self, url): mobj = re.match(self._VALID_URL, url) name = mobj.group('name') webpage = self._download_webpage(url, name) - video_url = self._og_search_video_url(webpage) + playlist_id = re.search(r'(?:gogoVideo)\(\d+,"?(?P.*)"', webpage, re.MULTILINE).group('playlist_id') + playlist_url = 'http://www.gamekings.tv/wp-content/themes/gk2010/rss_playlist.php?id=' + playlist_id + playlist_rss = self._download_xml(playlist_url, playlist_id) + + + NS_MAP = { + 'jwplayer': 'http://rss.jwpcdn.com/' + } + + item = playlist_rss.find('./channel/item') + + image = xpath_text(item, xpath_with_ns('./jwplayer:image', NS_MAP), 'image') + file_node = item.find(xpath_with_ns('./jwplayer:source', NS_MAP)) + + video_url = file_node.get('file') video = re.search(r'[0-9]+', video_url) video_id = video.group(0) - - # Todo: add medium format - video_url = video_url.replace(video_id, 'large/' + video_id) + + # Todo: Add medium format return { 'id': video_id, @@ -38,4 +66,5 @@ class GamekingsIE(InfoExtractor): 'url': video_url, 'title': self._og_search_title(webpage), 'description': self._og_search_description(webpage), + 'thumbnail': image }