[nhk] add support for audio URLs
This commit is contained in:
		
							parent
							
								
									5de538787d
								
							
						
					
					
						commit
						061d1cd948
					
				| @ -1,54 +1,80 @@ | ||||
| from __future__ import unicode_literals | ||||
| 
 | ||||
| import re | ||||
| 
 | ||||
| from .common import InfoExtractor | ||||
| from ..utils import ExtractorError | ||||
| 
 | ||||
| 
 | ||||
| class NhkVodIE(InfoExtractor): | ||||
|     _VALID_URL = r'https?://www3\.nhk\.or\.jp/nhkworld/en/(?:vod|ondemand)/(?P<id>[^/]+/[^/?#&]+)' | ||||
|     _VALID_URL = r'https?://www3\.nhk\.or\.jp/nhkworld/(?P<lang>[a-z]{2})/ondemand/(?P<type>video|audio)/(?P<id>\d{7}|[a-z]+-\d{8}-\d+)' | ||||
|     # Content available only for a limited period of time. Visit | ||||
|     # https://www3.nhk.or.jp/nhkworld/en/ondemand/ for working samples. | ||||
|     _TESTS = [{ | ||||
|         # Videos available only for a limited period of time. Visit | ||||
|         # http://www3.nhk.or.jp/nhkworld/en/vod/ for working samples. | ||||
|         'url': 'http://www3.nhk.or.jp/nhkworld/en/vod/tokyofashion/20160815', | ||||
|         'info_dict': { | ||||
|             'id': 'A1bnNiNTE6nY3jLllS-BIISfcC_PpvF5', | ||||
|             'ext': 'flv', | ||||
|             'title': 'TOKYO FASHION EXPRESS - The Kimono as Global Fashion', | ||||
|             'description': 'md5:db338ee6ce8204f415b754782f819824', | ||||
|             'series': 'TOKYO FASHION EXPRESS', | ||||
|             'episode': 'The Kimono as Global Fashion', | ||||
|         }, | ||||
|         'skip': 'Videos available only for a limited period of time', | ||||
|     }, { | ||||
|         'url': 'https://www3.nhk.or.jp/nhkworld/en/ondemand/video/2015173/', | ||||
|         'only_matching': True, | ||||
|     }, { | ||||
|         'url': 'https://www3.nhk.or.jp/nhkworld/en/ondemand/audio/plugin-20190404-1/', | ||||
|         'only_matching': True, | ||||
|     }, { | ||||
|         'url': 'https://www3.nhk.or.jp/nhkworld/fr/ondemand/audio/plugin-20190404-1/', | ||||
|         'only_matching': True, | ||||
|     }] | ||||
|     _API_URL = 'http://api.nhk.or.jp/nhkworld/vodesdlist/v1/all/all/all.json?apikey=EJfK8jdS57GqlupFgAfAAwr573q01y6k' | ||||
|     _API_URL_TEMPLATE = 'https://api.nhk.or.jp/nhkworld/%sodesdlist/v7/episode/%s/%s/all%s.json' | ||||
| 
 | ||||
|     def _real_extract(self, url): | ||||
|         video_id = self._match_id(url) | ||||
| 
 | ||||
|         data = self._download_json(self._API_URL, video_id) | ||||
| 
 | ||||
|         try: | ||||
|             episode = next( | ||||
|                 e for e in data['data']['episodes'] | ||||
|                 if e.get('url') and video_id in e['url']) | ||||
|         except StopIteration: | ||||
|             raise ExtractorError('Unable to find episode') | ||||
| 
 | ||||
|         embed_code = episode['vod_id'] | ||||
|         lang, m_type, episode_id = re.match(self._VALID_URL, url).groups() | ||||
|         if episode_id.isdigit(): | ||||
|             episode_id = episode_id[:4] + '-' + episode_id[4:] | ||||
| 
 | ||||
|         is_video = m_type == 'video' | ||||
|         episode = self._download_json( | ||||
|             self._API_URL_TEMPLATE % ('v' if is_video else 'r', episode_id, lang, '/all' if is_video else ''), | ||||
|             episode_id, query={'apikey': 'EJfK8jdS57GqlupFgAfAAwr573q01y6k'})['data']['episodes'][0] | ||||
|         title = episode.get('sub_title_clean') or episode['sub_title'] | ||||
|         description = episode.get('description_clean') or episode.get('description') | ||||
|         series = episode.get('title_clean') or episode.get('title') | ||||
| 
 | ||||
|         return { | ||||
|             '_type': 'url_transparent', | ||||
|             'ie_key': 'Ooyala', | ||||
|             'url': 'ooyala:%s' % embed_code, | ||||
|         def get_clean_field(key): | ||||
|             return episode.get(key + '_clean') or episode.get(key) | ||||
| 
 | ||||
|         series = get_clean_field('title') | ||||
| 
 | ||||
|         thumbnails = [] | ||||
|         for s, w, h in [('', 640, 360), ('_l', 1280, 720)]: | ||||
|             img_path = episode.get('image' + s) | ||||
|             if not img_path: | ||||
|                 continue | ||||
|             thumbnails.append({ | ||||
|                 'id': '%dp' % h, | ||||
|                 'height': h, | ||||
|                 'width': w, | ||||
|                 'url': 'https://www3.nhk.or.jp' + img_path, | ||||
|             }) | ||||
| 
 | ||||
|         info = { | ||||
|             'id': episode_id + '-' + lang, | ||||
|             'title': '%s - %s' % (series, title) if series and title else title, | ||||
|             'description': description, | ||||
|             'description': get_clean_field('description'), | ||||
|             'thumbnails': thumbnails, | ||||
|             'series': series, | ||||
|             'episode': title, | ||||
|         } | ||||
|         if is_video: | ||||
|             info.update({ | ||||
|                 '_type': 'url_transparent', | ||||
|                 'ie_key': 'Ooyala', | ||||
|                 'url': 'ooyala:' + episode['vod_id'], | ||||
|             }) | ||||
|         else: | ||||
|             audio = episode['audio'] | ||||
|             audio_path = audio['audio'] | ||||
|             info['formats'] = self._extract_m3u8_formats( | ||||
|                 'https://nhks-vh.akamaihd.net/i%s/master.m3u8' % audio_path, | ||||
|                 episode_id, 'm4a', m3u8_id='hls', fatal=False) | ||||
|             info['formats'].append({ | ||||
|                 'ext': 'flv', | ||||
|                 'format_id': 'flv', | ||||
|                 'url': 'rtmp://flv.nhk.or.jp/ondemand/mp4:flv' + audio_path, | ||||
|                 'vcodec': 'none', | ||||
|             }) | ||||
|             for f in info['formats']: | ||||
|                 f['language'] = lang | ||||
|         return info | ||||
|  | ||||
		Loading…
	
	
			
			x
			
			
		
	
		Reference in New Issue
	
	Block a user