2014-08-28 01:52:55 +08:00
from __future__ import unicode_literals
2013-10-10 21:25:11 +08:00
import re
import json
2014-12-07 18:26:07 +08:00
import os
2013-10-10 21:25:11 +08:00
from . common import InfoExtractor
2014-11-26 20:06:02 +08:00
from . . compat import (
2013-10-10 21:25:11 +08:00
compat_urlparse ,
compat_urllib_parse ,
2014-12-03 06:23:18 +08:00
compat_urllib_parse_urlparse
2014-11-26 20:06:02 +08:00
)
from . . utils import (
2013-10-10 21:25:11 +08:00
unified_strdate ,
)
2013-10-11 20:33:26 +08:00
class NHLBaseInfoExtractor ( InfoExtractor ) :
@staticmethod
def _fix_json ( json_string ) :
return json_string . replace ( ' \\ \' ' , ' \' ' )
2015-01-31 01:12:27 +08:00
def _real_extract_video ( self , video_id ) :
2015-05-08 02:12:28 +08:00
vid_parts = video_id . split ( ' , ' )
if len ( vid_parts ) == 3 :
video_id = ' %s 0 %s %s -X-h ' % ( vid_parts [ 0 ] [ : 4 ] , vid_parts [ 1 ] , vid_parts [ 2 ] . rjust ( 4 , ' 0 ' ) )
2015-01-31 01:12:27 +08:00
json_url = ' http://video.nhl.com/videocenter/servlets/playlist?ids= %s &format=json ' % video_id
data = self . _download_json (
json_url , video_id , transform_source = self . _fix_json )
return self . _extract_video ( data [ 0 ] )
2013-10-11 20:33:26 +08:00
def _extract_video ( self , info ) :
video_id = info [ ' id ' ]
self . report_extraction ( video_id )
initial_video_url = info [ ' publishPoint ' ]
2014-10-25 14:56:21 +08:00
if info [ ' formats ' ] == ' 1 ' :
2014-12-03 06:23:18 +08:00
parsed_url = compat_urllib_parse_urlparse ( initial_video_url )
2014-12-07 18:26:07 +08:00
filename , ext = os . path . splitext ( parsed_url . path )
path = ' %s _sd %s ' % ( filename , ext )
2014-10-25 14:56:21 +08:00
data = compat_urllib_parse . urlencode ( {
' type ' : ' fvod ' ,
2014-12-03 06:23:18 +08:00
' path ' : compat_urlparse . urlunparse ( parsed_url [ : 2 ] + ( path , ) + parsed_url [ 3 : ] )
2014-10-25 14:56:21 +08:00
} )
path_url = ' http://video.nhl.com/videocenter/servlets/encryptvideopath? ' + data
path_doc = self . _download_xml (
path_url , video_id , ' Downloading final video url ' )
video_url = path_doc . find ( ' path ' ) . text
else :
2014-11-24 03:41:03 +08:00
video_url = initial_video_url
2013-10-11 20:33:26 +08:00
join = compat_urlparse . urljoin
2015-05-08 03:09:19 +08:00
ret = {
2013-10-11 20:33:26 +08:00
' id ' : video_id ,
' title ' : info [ ' name ' ] ,
' url ' : video_url ,
' description ' : info [ ' description ' ] ,
' duration ' : int ( info [ ' duration ' ] ) ,
' thumbnail ' : join ( join ( video_url , ' /u/ ' ) , info [ ' bigImage ' ] ) ,
' upload_date ' : unified_strdate ( info [ ' releaseDate ' ] . split ( ' . ' ) [ 0 ] ) ,
}
2015-05-08 03:09:19 +08:00
if video_url . startswith ( ' rtmp: ' ) :
mobj = re . match ( r ' (?P<tc_url>rtmp://[^/]+/(?P<app>[a-z0-9/]+))/(?P<play_path>mp4:.*) ' , video_url )
ret . update ( {
' tc_url ' : mobj . group ( ' tc_url ' ) ,
' play_path ' : mobj . group ( ' play_path ' ) ,
' app ' : mobj . group ( ' app ' ) ,
' no_resume ' : True ,
} )
return ret
2013-10-11 20:33:26 +08:00
class NHLIE ( NHLBaseInfoExtractor ) :
2014-08-28 01:52:55 +08:00
IE_NAME = ' nhl.com '
2015-05-08 02:12:28 +08:00
_VALID_URL = r ' https?://video(?P<team> \ .[^.]*)? \ .nhl \ .com/videocenter/(?:console)?(?: \ ?(?:.*?[?&])?)(?:id|hlg)=(?P<id>[-0-9a-zA-Z,]+) '
2013-10-10 21:25:11 +08:00
2014-09-16 16:08:34 +08:00
_TESTS = [ {
2014-08-28 01:52:55 +08:00
' url ' : ' http://video.canucks.nhl.com/videocenter/console?catid=6?id=453614 ' ,
2014-10-25 14:56:21 +08:00
' md5 ' : ' db704a4ea09e8d3988c85e36cc892d09 ' ,
2014-08-28 01:52:55 +08:00
' info_dict ' : {
' id ' : ' 453614 ' ,
' ext ' : ' mp4 ' ,
' title ' : ' Quick clip: Weise 4-3 goal vs Flames ' ,
' description ' : ' Dale Weise scores his first of the season to put the Canucks up 4-3. ' ,
' duration ' : 18 ,
' upload_date ' : ' 20131006 ' ,
2013-10-10 21:25:11 +08:00
} ,
2014-10-25 14:56:21 +08:00
} , {
' url ' : ' http://video.nhl.com/videocenter/console?id=2014020024-628-h ' ,
' md5 ' : ' d22e82bc592f52d37d24b03531ee9696 ' ,
' info_dict ' : {
' id ' : ' 2014020024-628-h ' ,
' ext ' : ' mp4 ' ,
' title ' : ' Alex Galchenyuk Goal on Ray Emery (14:40/3rd) ' ,
' description ' : ' Home broadcast - Montreal Canadiens at Philadelphia Flyers - October 11, 2014 ' ,
' duration ' : 0 ,
' upload_date ' : ' 20141011 ' ,
} ,
2014-12-03 06:23:18 +08:00
} , {
' url ' : ' http://video.mapleleafs.nhl.com/videocenter/console?id=58665&catid=802 ' ,
' md5 ' : ' c78fc64ea01777e426cfc202b746c825 ' ,
' info_dict ' : {
' id ' : ' 58665 ' ,
' ext ' : ' flv ' ,
' title ' : ' Classic Game In Six - April 22, 1979 ' ,
' description ' : ' It was the last playoff game for the Leafs in the decade, and the last time the Leafs and Habs played in the playoffs. Great game, not a great ending. ' ,
' duration ' : 400 ,
' upload_date ' : ' 20100129 '
} ,
2014-09-16 16:08:34 +08:00
} , {
' url ' : ' http://video.flames.nhl.com/videocenter/console?id=630616 ' ,
' only_matching ' : True ,
2015-01-31 00:46:53 +08:00
} , {
' url ' : ' http://video.nhl.com/videocenter/?id=736722 ' ,
' only_matching ' : True ,
2015-05-08 02:12:28 +08:00
} , {
' url ' : ' http://video.nhl.com/videocenter/console?hlg=20142015,2,299&lang=en ' ,
' md5 ' : ' 076fcb88c255154aacbf0a7accc3f340 ' ,
' info_dict ' : {
' id ' : ' 2014020299-X-h ' ,
' ext ' : ' mp4 ' ,
' title ' : ' Penguins at Islanders / Game Highlights ' ,
' description ' : ' Home broadcast - Pittsburgh Penguins at New York Islanders - November 22, 2014 ' ,
' duration ' : 268 ,
' upload_date ' : ' 20141122 ' ,
}
2015-05-08 03:09:19 +08:00
} , {
' url ' : ' http://video.oilers.nhl.com/videocenter/console?id=691469&catid=4 ' ,
' info_dict ' : {
' id ' : ' 691469 ' ,
' ext ' : ' mp4 ' ,
' title ' : ' RAW | Craig MacTavish Full Press Conference ' ,
' description ' : ' Oilers GM Craig MacTavish addresses the media at Rexall Place on Friday. ' ,
' upload_date ' : ' 20141205 ' ,
} ,
' params ' : {
' skip_download ' : True , # Requires rtmpdump
}
2014-09-16 16:08:34 +08:00
} ]
2013-10-10 21:25:11 +08:00
def _real_extract ( self , url ) :
2015-01-31 01:12:27 +08:00
video_id = self . _match_id ( url )
return self . _real_extract_video ( video_id )
class NHLNewsIE ( NHLBaseInfoExtractor ) :
IE_NAME = ' nhl.com:news '
IE_DESC = ' NHL news '
_VALID_URL = r ' https?://(?:www \ .)?nhl \ .com/ice/news \ .html?(?: \ ?(?:.*?[?&])?)id=(?P<id>[-0-9a-zA-Z]+) '
_TEST = {
' url ' : ' http://www.nhl.com/ice/news.htm?id=750727 ' ,
' md5 ' : ' 4b3d1262e177687a3009937bd9ec0be8 ' ,
' info_dict ' : {
' id ' : ' 736722 ' ,
' ext ' : ' mp4 ' ,
' title ' : ' Cal Clutterbuck has been fined $2,000 ' ,
' description ' : ' md5:45fe547d30edab88b23e0dd0ab1ed9e6 ' ,
' duration ' : 37 ,
' upload_date ' : ' 20150128 ' ,
} ,
}
def _real_extract ( self , url ) :
news_id = self . _match_id ( url )
webpage = self . _download_webpage ( url , news_id )
video_id = self . _search_regex (
[ r ' pVid( \ d+) ' , r " nlid \ s*: \ s* ' ( \ d+) ' " ] ,
webpage , ' video id ' )
return self . _real_extract_video ( video_id )
2013-10-11 20:33:26 +08:00
class NHLVideocenterIE ( NHLBaseInfoExtractor ) :
2014-08-28 01:52:55 +08:00
IE_NAME = ' nhl.com:videocenter '
IE_DESC = ' NHL videocenter category '
2014-12-03 06:56:30 +08:00
_VALID_URL = r ' https?://video \ .(?P<team>[^.]*) \ .nhl \ .com/videocenter/(console \ ?[^(id=)]*catid=(?P<catid>[0-9]+)(?![&?]id=).*?)?$ '
2014-08-28 01:52:55 +08:00
_TEST = {
' url ' : ' http://video.canucks.nhl.com/videocenter/console?catid=999 ' ,
' info_dict ' : {
' id ' : ' 999 ' ,
' title ' : ' Highlights ' ,
} ,
' playlist_count ' : 12 ,
}
2013-10-11 20:33:26 +08:00
def _real_extract ( self , url ) :
mobj = re . match ( self . _VALID_URL , url )
team = mobj . group ( ' team ' )
webpage = self . _download_webpage ( url , team )
cat_id = self . _search_regex (
[ r ' var defaultCatId = " (.+?) " ; ' ,
r ' { statusIndex:0,index:0,.*?id:(.*?), ' ] ,
2014-08-28 01:52:55 +08:00
webpage , ' category id ' )
2013-10-11 20:33:26 +08:00
playlist_title = self . _html_search_regex (
2013-10-23 03:01:16 +08:00
r ' tab0 " [^>]*?>(.*?)</td> ' ,
2014-08-28 01:52:55 +08:00
webpage , ' playlist title ' , flags = re . DOTALL ) . lower ( ) . capitalize ( )
2013-10-10 21:25:11 +08:00
data = compat_urllib_parse . urlencode ( {
2013-10-11 20:33:26 +08:00
' cid ' : cat_id ,
# This is the default value
' count ' : 12 ,
' ptrs ' : 3 ,
' format ' : ' json ' ,
2013-10-10 21:25:11 +08:00
} )
2013-10-11 20:33:26 +08:00
path = ' /videocenter/servlets/browse? ' + data
request_url = compat_urlparse . urljoin ( url , path )
response = self . _download_webpage ( request_url , playlist_title )
response = self . _fix_json ( response )
if not response . strip ( ) :
2014-11-26 20:06:02 +08:00
self . _downloader . report_warning ( ' Got an empty reponse, trying '
2014-08-28 01:52:55 +08:00
' adding the " newvideos " parameter ' )
2013-10-11 20:33:26 +08:00
response = self . _download_webpage ( request_url + ' &newvideos=true ' ,
2014-11-24 04:39:15 +08:00
playlist_title )
2013-10-11 20:33:26 +08:00
response = self . _fix_json ( response )
videos = json . loads ( response )
2013-10-10 21:25:11 +08:00
return {
2013-10-11 20:33:26 +08:00
' _type ' : ' playlist ' ,
' title ' : playlist_title ,
' id ' : cat_id ,
2014-08-28 01:52:55 +08:00
' entries ' : [ self . _extract_video ( v ) for v in videos ] ,
2013-10-10 21:25:11 +08:00
}