2014-08-27 19:52:55 +02:00
from __future__ import unicode_literals
2013-10-10 15:25:11 +02:00
import re
import json
from . common import InfoExtractor
2014-11-26 13:06:02 +01:00
from . . compat import (
2013-10-10 15:25:11 +02:00
compat_urlparse ,
compat_urllib_parse ,
2014-12-02 23:23:18 +01:00
compat_urllib_parse_urlparse
2014-11-26 13:06:02 +01:00
)
from . . utils import (
2013-10-10 15:25:11 +02:00
unified_strdate ,
)
2013-10-11 14:33:26 +02:00
class NHLBaseInfoExtractor ( InfoExtractor ) :
@staticmethod
def _fix_json ( json_string ) :
return json_string . replace ( ' \\ \' ' , ' \' ' )
def _extract_video ( self , info ) :
video_id = info [ ' id ' ]
self . report_extraction ( video_id )
initial_video_url = info [ ' publishPoint ' ]
2014-10-25 13:56:21 +07:00
if info [ ' formats ' ] == ' 1 ' :
2014-12-02 23:23:18 +01:00
parsed_url = compat_urllib_parse_urlparse ( initial_video_url )
path = parsed_url . path
extension_index = path . rfind ( ' . ' )
path = path [ : extension_index ] + ' _sd ' + path [ extension_index : ]
2014-10-25 13:56:21 +07:00
data = compat_urllib_parse . urlencode ( {
' type ' : ' fvod ' ,
2014-12-02 23:23:18 +01:00
' path ' : compat_urlparse . urlunparse ( parsed_url [ : 2 ] + ( path , ) + parsed_url [ 3 : ] )
2014-10-25 13:56:21 +07:00
} )
path_url = ' http://video.nhl.com/videocenter/servlets/encryptvideopath? ' + data
path_doc = self . _download_xml (
path_url , video_id , ' Downloading final video url ' )
video_url = path_doc . find ( ' path ' ) . text
else :
2014-11-23 20:41:03 +01:00
video_url = initial_video_url
2013-10-11 14:33:26 +02:00
join = compat_urlparse . urljoin
return {
' id ' : video_id ,
' title ' : info [ ' name ' ] ,
' url ' : video_url ,
' description ' : info [ ' description ' ] ,
' duration ' : int ( info [ ' duration ' ] ) ,
' thumbnail ' : join ( join ( video_url , ' /u/ ' ) , info [ ' bigImage ' ] ) ,
' upload_date ' : unified_strdate ( info [ ' releaseDate ' ] . split ( ' . ' ) [ 0 ] ) ,
}
class NHLIE ( NHLBaseInfoExtractor ) :
2014-08-27 19:52:55 +02:00
IE_NAME = ' nhl.com '
2014-10-25 13:56:21 +07:00
_VALID_URL = r ' https?://video(?P<team> \ .[^.]*)? \ .nhl \ .com/videocenter/console(?: \ ?(?:.*?[?&])?)id=(?P<id>[0-9a-z-]+) '
2013-10-10 15:25:11 +02:00
2014-09-16 10:08:34 +02:00
_TESTS = [ {
2014-08-27 19:52:55 +02:00
' url ' : ' http://video.canucks.nhl.com/videocenter/console?catid=6?id=453614 ' ,
2014-10-25 13:56:21 +07:00
' md5 ' : ' db704a4ea09e8d3988c85e36cc892d09 ' ,
2014-08-27 19:52:55 +02:00
' info_dict ' : {
' id ' : ' 453614 ' ,
' ext ' : ' mp4 ' ,
' title ' : ' Quick clip: Weise 4-3 goal vs Flames ' ,
' description ' : ' Dale Weise scores his first of the season to put the Canucks up 4-3. ' ,
' duration ' : 18 ,
' upload_date ' : ' 20131006 ' ,
2013-10-10 15:25:11 +02:00
} ,
2014-10-25 13:56:21 +07:00
} , {
' url ' : ' http://video.nhl.com/videocenter/console?id=2014020024-628-h ' ,
' md5 ' : ' d22e82bc592f52d37d24b03531ee9696 ' ,
' info_dict ' : {
' id ' : ' 2014020024-628-h ' ,
' ext ' : ' mp4 ' ,
' title ' : ' Alex Galchenyuk Goal on Ray Emery (14:40/3rd) ' ,
' description ' : ' Home broadcast - Montreal Canadiens at Philadelphia Flyers - October 11, 2014 ' ,
' duration ' : 0 ,
' upload_date ' : ' 20141011 ' ,
} ,
2014-12-02 23:23:18 +01:00
} , {
' url ' : ' http://video.mapleleafs.nhl.com/videocenter/console?id=58665&catid=802 ' ,
' md5 ' : ' c78fc64ea01777e426cfc202b746c825 ' ,
' info_dict ' : {
' id ' : ' 58665 ' ,
' ext ' : ' flv ' ,
' title ' : ' Classic Game In Six - April 22, 1979 ' ,
' description ' : ' It was the last playoff game for the Leafs in the decade, and the last time the Leafs and Habs played in the playoffs. Great game, not a great ending. ' ,
' duration ' : 400 ,
' upload_date ' : ' 20100129 '
} ,
2014-09-16 10:08:34 +02:00
} , {
' url ' : ' http://video.flames.nhl.com/videocenter/console?id=630616 ' ,
' only_matching ' : True ,
} ]
2013-10-10 15:25:11 +02:00
def _real_extract ( self , url ) :
mobj = re . match ( self . _VALID_URL , url )
video_id = mobj . group ( ' id ' )
json_url = ' http://video.nhl.com/videocenter/servlets/playlist?ids= %s &format=json ' % video_id
2014-08-27 19:52:55 +02:00
data = self . _download_json (
json_url , video_id , transform_source = self . _fix_json )
return self . _extract_video ( data [ 0 ] )
2013-10-11 14:33:26 +02:00
class NHLVideocenterIE ( NHLBaseInfoExtractor ) :
2014-08-27 19:52:55 +02:00
IE_NAME = ' nhl.com:videocenter '
IE_DESC = ' NHL videocenter category '
2014-12-02 23:56:30 +01:00
_VALID_URL = r ' https?://video \ .(?P<team>[^.]*) \ .nhl \ .com/videocenter/(console \ ?[^(id=)]*catid=(?P<catid>[0-9]+)(?![&?]id=).*?)?$ '
2014-08-27 19:52:55 +02:00
_TEST = {
' url ' : ' http://video.canucks.nhl.com/videocenter/console?catid=999 ' ,
' info_dict ' : {
' id ' : ' 999 ' ,
' title ' : ' Highlights ' ,
} ,
' playlist_count ' : 12 ,
}
2013-10-11 14:33:26 +02:00
def _real_extract ( self , url ) :
mobj = re . match ( self . _VALID_URL , url )
team = mobj . group ( ' team ' )
webpage = self . _download_webpage ( url , team )
cat_id = self . _search_regex (
[ r ' var defaultCatId = " (.+?) " ; ' ,
r ' { statusIndex:0,index:0,.*?id:(.*?), ' ] ,
2014-08-27 19:52:55 +02:00
webpage , ' category id ' )
2013-10-11 14:33:26 +02:00
playlist_title = self . _html_search_regex (
2013-10-22 21:01:16 +02:00
r ' tab0 " [^>]*?>(.*?)</td> ' ,
2014-08-27 19:52:55 +02:00
webpage , ' playlist title ' , flags = re . DOTALL ) . lower ( ) . capitalize ( )
2013-10-10 15:25:11 +02:00
data = compat_urllib_parse . urlencode ( {
2013-10-11 14:33:26 +02:00
' cid ' : cat_id ,
# This is the default value
' count ' : 12 ,
' ptrs ' : 3 ,
' format ' : ' json ' ,
2013-10-10 15:25:11 +02:00
} )
2013-10-11 14:33:26 +02:00
path = ' /videocenter/servlets/browse? ' + data
request_url = compat_urlparse . urljoin ( url , path )
response = self . _download_webpage ( request_url , playlist_title )
response = self . _fix_json ( response )
if not response . strip ( ) :
2014-11-26 13:06:02 +01:00
self . _downloader . report_warning ( ' Got an empty reponse, trying '
2014-08-27 19:52:55 +02:00
' adding the " newvideos " parameter ' )
2013-10-11 14:33:26 +02:00
response = self . _download_webpage ( request_url + ' &newvideos=true ' ,
2014-11-23 21:39:15 +01:00
playlist_title )
2013-10-11 14:33:26 +02:00
response = self . _fix_json ( response )
videos = json . loads ( response )
2013-10-10 15:25:11 +02:00
return {
2013-10-11 14:33:26 +02:00
' _type ' : ' playlist ' ,
' title ' : playlist_title ,
' id ' : cat_id ,
2014-08-27 19:52:55 +02:00
' entries ' : [ self . _extract_video ( v ) for v in videos ] ,
2013-10-10 15:25:11 +02:00
}