2015-12-13 19:15:45 +08:00 
										
									 
								 
							 
							
								
									
										 
								
							 
							
								 
							
							
								# coding: utf-8  
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								
							 
						 
					
						
							
								
									
										
										
										
											2014-01-29 15:34:35 +01:00 
										
									 
								 
							 
							
								
									
										 
								
							 
							
								 
							
							
								from  __future__  import  unicode_literals  
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								
							 
						 
					
						
							
								
									
										
										
										
											2017-02-03 05:10:13 +01:00 
										
									 
								 
							 
							
								
									
										 
								
							 
							
								 
							
							
								from  . . compat  import  (  
						 
					
						
							
								
									
										
										
										
											2018-01-23 22:23:12 +07:00 
										
									 
								 
							 
							
								
									
										 
								
							 
							
								 
							
							
								    compat_b64decode , 
							 
						 
					
						
							
								
									
										
										
										
											2017-02-03 05:10:13 +01:00 
										
									 
								 
							 
							
								
									
										 
								
							 
							
								 
							
							
								    compat_urllib_parse_unquote , 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								    compat_urlparse , 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								)  
						 
					
						
							
								
									
										
										
										
											2017-10-12 17:39:51 +00:00 
										
									 
								 
							 
							
								
									
										 
								
							 
							
								 
							
							
								from  . . utils  import  (  
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								    determine_ext , 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								    update_url_query , 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								)  
						 
					
						
							
								
									
										
										
										
											2016-02-27 02:55:11 +08:00 
										
									 
								 
							 
							
								
									
										 
								
							 
							
								 
							
							
								from  . bokecc  import  BokeCCBaseIE  
						 
					
						
							
								
									
										
										
										
											2013-06-23 21:14:19 +02:00 
										
									 
								 
							 
							
								
							 
							
								 
							
							
								
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								
							 
						 
					
						
							
								
									
										
										
										
											2016-02-27 02:55:11 +08:00 
										
									 
								 
							 
							
								
									
										 
								
							 
							
								 
							
							
								class  InfoQIE ( BokeCCBaseIE ) :  
						 
					
						
							
								
									
										
										
										
											2015-06-25 19:54:44 +06:00 
										
									 
								 
							 
							
								
									
										 
								
							 
							
								 
							
							
								    _VALID_URL  =  r ' https?://(?:www \ .)?infoq \ .com/(?:[^/]+/)+(?P<id>[^/]+) ' 
							 
						 
					
						
							
								
									
										
										
										
											2014-04-20 01:01:37 +02:00 
										
									 
								 
							 
							
								
									
										 
								
							 
							
								 
							
							
								
							 
						 
					
						
							
								
									
										
										
										
											2015-06-25 19:54:44 +06:00 
										
									 
								 
							 
							
								
									
										 
								
							 
							
								 
							
							
								    _TESTS  =  [ { 
							 
						 
					
						
							
								
									
										
										
										
											2014-04-21 02:55:35 +02:00 
										
									 
								 
							 
							
								
									
										 
								
							 
							
								 
							
							
								        ' url ' :  ' http://www.infoq.com/presentations/A-Few-of-My-Favorite-Python-Things ' , 
							 
						 
					
						
							
								
									
										
										
										
											2014-04-21 03:21:34 +02:00 
										
									 
								 
							 
							
								
									
										 
								
							 
							
								 
							
							
								        ' md5 ' :  ' b5ca0e0a8c1fed93b0e65e48e462f9a2 ' , 
							 
						 
					
						
							
								
									
										
										
										
											2014-04-21 02:55:35 +02:00 
										
									 
								 
							 
							
								
									
										 
								
							 
							
								 
							
							
								        ' info_dict ' :  { 
							 
						 
					
						
							
								
									
										
										
										
											2015-12-13 19:15:45 +08:00 
										
									 
								 
							 
							
								
									
										 
								
							 
							
								 
							
							
								            ' id ' :  ' A-Few-of-My-Favorite-Python-Things ' , 
							 
						 
					
						
							
								
									
										
										
										
											2014-04-21 02:55:35 +02:00 
										
									 
								 
							 
							
								
									
										 
								
							 
							
								 
							
							
								            ' ext ' :  ' mp4 ' , 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								            ' description ' :  ' Mike Pirnat presents some tips and tricks, standard libraries and third party packages that make programming in Python a richer experience. ' , 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								            ' title ' :  ' A Few of My Favorite [Python] Things ' , 
							 
						 
					
						
							
								
									
										
										
										
											2013-06-27 20:27:08 +02:00 
										
									 
								 
							 
							
								
									
										 
								
							 
							
								 
							
							
								        } , 
							 
						 
					
						
							
								
									
										
										
										
											2015-06-25 19:54:44 +06:00 
										
									 
								 
							 
							
								
									
										 
								
							 
							
								 
							
							
								    } ,  { 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								        ' url ' :  ' http://www.infoq.com/fr/presentations/changez-avis-sur-javascript ' , 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								        ' only_matching ' :  True , 
							 
						 
					
						
							
								
									
										
										
										
											2015-12-13 19:15:45 +08:00 
										
									 
								 
							 
							
								
									
										 
								
							 
							
								 
							
							
								    } ,  { 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								        ' url ' :  ' http://www.infoq.com/cn/presentations/openstack-continued-delivery ' , 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								        ' md5 ' :  ' 4918d0cca1497f2244572caf626687ef ' , 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								        ' info_dict ' :  { 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								            ' id ' :  ' openstack-continued-delivery ' , 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								            ' title ' :  ' OpenStack持续交付之路 ' , 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								            ' ext ' :  ' flv ' , 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								            ' description ' :  ' md5:308d981fb28fa42f49f9568322c683ff ' , 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								        } , 
							 
						 
					
						
							
								
									
										
										
										
											2017-02-03 05:10:13 +01:00 
										
									 
								 
							 
							
								
									
										 
								
							 
							
								 
							
							
								    } ,  { 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								        ' url ' :  ' https://www.infoq.com/presentations/Simple-Made-Easy ' , 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								        ' md5 ' :  ' 0e34642d4d9ef44bf86f66f6399672db ' , 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								        ' info_dict ' :  { 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								            ' id ' :  ' Simple-Made-Easy ' , 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								            ' title ' :  ' Simple Made Easy ' , 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								            ' ext ' :  ' mp3 ' , 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								            ' description ' :  ' md5:3e0e213a8bbd074796ef89ea35ada25b ' , 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								        } , 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								        ' params ' :  { 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								            ' format ' :  ' bestaudio ' , 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								        } , 
							 
						 
					
						
							
								
									
										
										
										
											2015-06-25 19:54:44 +06:00 
										
									 
								 
							 
							
								
									
										 
								
							 
							
								 
							
							
								    } ] 
							 
						 
					
						
							
								
									
										
										
										
											2013-06-23 21:14:19 +02:00 
										
									 
								 
							 
							
								
							 
							
								 
							
							
								
							 
						 
					
						
							
								
									
										
										
										
											2017-02-03 05:10:13 +01:00 
										
									 
								 
							 
							
								
									
										 
								
							 
							
								 
							
							
								    def  _extract_rtmp_video ( self ,  webpage ) : 
							 
						 
					
						
							
								
									
										
										
										
											2014-04-20 01:10:30 +02:00 
										
									 
								 
							 
							
								
									
										 
								
							 
							
								 
							
							
								        # The server URL is hardcoded 
							 
						 
					
						
							
								
									
										
										
										
											2014-04-20 01:01:37 +02:00 
										
									 
								 
							 
							
								
									
										 
								
							 
							
								 
							
							
								        video_url  =  ' rtmpe://video.infoq.com/cfx/st/ ' 
							 
						 
					
						
							
								
									
										
										
										
											2014-04-20 01:10:30 +02:00 
										
									 
								 
							 
							
								
									
										 
								
							 
							
								 
							
							
								
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								        # Extract video URL 
							 
						 
					
						
							
								
									
										
										
										
											2014-04-21 03:21:34 +02:00 
										
									 
								 
							 
							
								
									
										 
								
							 
							
								 
							
							
								        encoded_id  =  self . _search_regex ( 
							 
						 
					
						
							
								
									
										
										
										
											2015-12-13 19:15:45 +08:00 
										
									 
								 
							 
							
								
									
										 
								
							 
							
								 
							
							
								            r " jsclassref \ s*= \ s* ' ([^ ' ]*) ' " ,  webpage ,  ' encoded id ' ,  default = None ) 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								
							 
						 
					
						
							
								
									
										
										
										
											2018-01-23 22:23:12 +07:00 
										
									 
								 
							 
							
								
									
										 
								
							 
							
								 
							
							
								        real_id  =  compat_urllib_parse_unquote ( compat_b64decode ( encoded_id ) . decode ( ' utf-8 ' ) ) 
							 
						 
					
						
							
								
									
										
										
										
											2014-04-20 01:10:30 +02:00 
										
									 
								 
							 
							
								
									
										 
								
							 
							
								 
							
							
								        playpath  =  ' mp4: '  +  real_id 
							 
						 
					
						
							
								
									
										
										
										
											2013-06-23 21:14:19 +02:00 
										
									 
								 
							 
							
								
							 
							
								 
							
							
								
							 
						 
					
						
							
								
									
										
										
										
											2015-12-13 19:15:45 +08:00 
										
									 
								 
							 
							
								
									
										 
								
							 
							
								 
							
							
								        return  [ { 
							 
						 
					
						
							
								
									
										
										
										
											2017-02-03 05:10:13 +01:00 
										
									 
								 
							 
							
								
									
										 
								
							 
							
								 
							
							
								            ' format_id ' :  ' rtmp_video ' , 
							 
						 
					
						
							
								
									
										
										
										
											2015-12-13 19:15:45 +08:00 
										
									 
								 
							 
							
								
									
										 
								
							 
							
								 
							
							
								            ' url ' :  video_url , 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								            ' ext ' :  determine_ext ( playpath ) , 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								            ' play_path ' :  playpath , 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								        } ] 
							 
						 
					
						
							
								
									
										
										
										
											2013-06-23 21:14:19 +02:00 
										
									 
								 
							 
							
								
							 
							
								 
							
							
								
							 
						 
					
						
							
								
									
										
										
										
											2017-10-12 17:39:51 +00:00 
										
									 
								 
							 
							
								
									
										 
								
							 
							
								 
							
							
								    def  _extract_cf_auth ( self ,  webpage ) : 
							 
						 
					
						
							
								
									
										
										
										
											2017-10-09 23:50:53 +07:00 
										
									 
								 
							 
							
								
									
										 
								
							 
							
								 
							
							
								        policy  =  self . _search_regex ( r ' InfoQConstants \ .scp \ s*= \ s* \' ([^ \' ]+) \' ' ,  webpage ,  ' policy ' ) 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								        signature  =  self . _search_regex ( r ' InfoQConstants \ .scs \ s*= \ s* \' ([^ \' ]+) \' ' ,  webpage ,  ' signature ' ) 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								        key_pair_id  =  self . _search_regex ( r ' InfoQConstants \ .sck \ s*= \ s* \' ([^ \' ]+) \' ' ,  webpage ,  ' key-pair-id ' ) 
							 
						 
					
						
							
								
									
										
										
										
											2017-10-12 17:39:51 +00:00 
										
									 
								 
							 
							
								
									
										 
								
							 
							
								 
							
							
								        return  { 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								            ' Policy ' :  policy , 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								            ' Signature ' :  signature , 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								            ' Key-Pair-Id ' :  key_pair_id , 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								        } 
							 
						 
					
						
							
								
									
										
										
										
											2014-04-21 03:21:34 +02:00 
										
									 
								 
							 
							
								
									
										 
								
							 
							
								 
							
							
								
							 
						 
					
						
							
								
									
										
										
										
											2017-02-03 05:10:13 +01:00 
										
									 
								 
							 
							
								
									
										 
								
							 
							
								 
							
							
								    def  _extract_http_video ( self ,  webpage ) : 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								        http_video_url  =  self . _search_regex ( r ' P \ .s \ s*= \ s* \' ([^ \' ]+) \' ' ,  webpage ,  ' video URL ' ) 
							 
						 
					
						
							
								
									
										
										
										
											2017-10-12 17:39:51 +00:00 
										
									 
								 
							 
							
								
									
										 
								
							 
							
								 
							
							
								        http_video_url  =  update_url_query ( http_video_url ,  self . _extract_cf_auth ( webpage ) ) 
							 
						 
					
						
							
								
									
										
										
										
											2015-12-13 19:15:45 +08:00 
										
									 
								 
							 
							
								
									
										 
								
							 
							
								 
							
							
								        return  [ { 
							 
						 
					
						
							
								
									
										
										
										
											2017-02-03 05:10:13 +01:00 
										
									 
								 
							 
							
								
									
										 
								
							 
							
								 
							
							
								            ' format_id ' :  ' http_video ' , 
							 
						 
					
						
							
								
									
										
										
										
											2015-12-13 17:29:27 +08:00 
										
									 
								 
							 
							
								
									
										 
								
							 
							
								 
							
							
								            ' url ' :  http_video_url , 
							 
						 
					
						
							
								
									
										
										
										
											2014-04-21 03:21:34 +02:00 
										
									 
								 
							 
							
								
									
										 
								
							 
							
								 
							
							
								        } ] 
							 
						 
					
						
							
								
									
										
										
										
											2015-12-13 19:15:45 +08:00 
										
									 
								 
							 
							
								
									
										 
								
							 
							
								 
							
							
								
							 
						 
					
						
							
								
									
										
										
										
											2017-02-03 05:10:13 +01:00 
										
									 
								 
							 
							
								
									
										 
								
							 
							
								 
							
							
								    def  _extract_http_audio ( self ,  webpage ,  video_id ) : 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								        fields  =  self . _hidden_inputs ( webpage ) 
							 
						 
					
						
							
								
									
										
										
										
											2017-05-01 01:23:05 +07:00 
										
									 
								 
							 
							
								
									
										 
								
							 
							
								 
							
							
								        http_audio_url  =  fields . get ( ' filename ' ) 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								        if  not  http_audio_url : 
							 
						 
					
						
							
								
									
										
										
										
											2017-02-03 05:10:13 +01:00 
										
									 
								 
							 
							
								
									
										 
								
							 
							
								 
							
							
								            return  [ ] 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								        # base URL is found in the Location header in the response returned by 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								        # GET https://www.infoq.com/mp3download.action?filename=... when logged in. 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								        http_audio_url  =  compat_urlparse . urljoin ( ' http://res.infoq.com/downloads/mp3downloads/ ' ,  http_audio_url ) 
							 
						 
					
						
							
								
									
										
										
										
											2017-10-12 17:39:51 +00:00 
										
									 
								 
							 
							
								
									
										 
								
							 
							
								 
							
							
								        http_audio_url  =  update_url_query ( http_audio_url ,  self . _extract_cf_auth ( webpage ) ) 
							 
						 
					
						
							
								
									
										
										
										
											2017-02-03 05:10:13 +01:00 
										
									 
								 
							 
							
								
									
										 
								
							 
							
								 
							
							
								
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								        # audio file seem to be missing some times even if there is a download link 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								        # so probe URL to make sure 
							 
						 
					
						
							
								
									
										
										
										
											2017-10-12 17:39:51 +00:00 
										
									 
								 
							 
							
								
									
										 
								
							 
							
								 
							
							
								        if  not  self . _is_valid_url ( http_audio_url ,  video_id ) : 
							 
						 
					
						
							
								
									
										
										
										
											2017-02-03 05:10:13 +01:00 
										
									 
								 
							 
							
								
									
										 
								
							 
							
								 
							
							
								            return  [ ] 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								        return  [ { 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								            ' format_id ' :  ' http_audio ' , 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								            ' url ' :  http_audio_url , 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								            ' vcodec ' :  ' none ' , 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								        } ] 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								
							 
						 
					
						
							
								
									
										
										
										
											2015-12-13 19:15:45 +08:00 
										
									 
								 
							 
							
								
									
										 
								
							 
							
								 
							
							
								    def  _real_extract ( self ,  url ) : 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								        video_id  =  self . _match_id ( url ) 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								        webpage  =  self . _download_webpage ( url ,  video_id ) 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								        video_title  =  self . _html_search_regex ( r ' <title>(.*?)</title> ' ,  webpage ,  ' title ' ) 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								        video_description  =  self . _html_search_meta ( ' description ' ,  webpage ,  ' description ' ) 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								        if  ' /cn/ '  in  url : 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								            # for China videos, HTTP video URL exists but always fails with 403 
							 
						 
					
						
							
								
									
										
										
										
											2016-02-27 02:55:11 +08:00 
										
									 
								 
							 
							
								
									
										 
								
							 
							
								 
							
							
								            formats  =  self . _extract_bokecc_formats ( webpage ,  video_id ) 
							 
						 
					
						
							
								
									
										
										
										
											2015-12-13 19:15:45 +08:00 
										
									 
								 
							 
							
								
									
										 
								
							 
							
								 
							
							
								        else : 
							 
						 
					
						
							
								
									
										
										
										
											2017-02-03 05:10:13 +01:00 
										
									 
								 
							 
							
								
									
										 
								
							 
							
								 
							
							
								            formats  =  ( 
							 
						 
					
						
							
								
									
										
										
										
											2019-05-11 03:56:22 +07:00 
										
									 
								 
							 
							
								
									
										 
								
							 
							
								 
							
							
								                self . _extract_rtmp_video ( webpage ) 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								                +  self . _extract_http_video ( webpage ) 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								                +  self . _extract_http_audio ( webpage ,  video_id ) ) 
							 
						 
					
						
							
								
									
										
										
										
											2015-12-13 19:15:45 +08:00 
										
									 
								 
							 
							
								
									
										 
								
							 
							
								 
							
							
								
							 
						 
					
						
							
								
									
										
										
										
											2014-04-21 03:21:34 +02:00 
										
									 
								 
							 
							
								
									
										 
								
							 
							
								 
							
							
								        self . _sort_formats ( formats ) 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								
							 
						 
					
						
							
								
									
										
										
										
											2014-04-21 02:55:35 +02:00 
										
									 
								 
							 
							
								
									
										 
								
							 
							
								 
							
							
								        return  { 
							 
						 
					
						
							
								
									
										
										
										
											2013-06-23 21:14:19 +02:00 
										
									 
								 
							 
							
								
							 
							
								 
							
							
								            ' id ' :  video_id , 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								            ' title ' :  video_title , 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								            ' description ' :  video_description , 
							 
						 
					
						
							
								
									
										
										
										
											2014-04-21 03:21:34 +02:00 
										
									 
								 
							 
							
								
									
										 
								
							 
							
								 
							
							
								            ' formats ' :  formats , 
							 
						 
					
						
							
								
									
										
										
										
											2014-04-21 02:55:35 +02:00 
										
									 
								 
							 
							
								
									
										 
								
							 
							
								 
							
							
								        }