| 
									
										
										
										
											2014-10-24 09:49:01 +05:30
										 |  |  | # coding: utf-8 | 
					
						
							|  |  |  | from __future__ import unicode_literals | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2016-02-06 18:42:57 +00:00
										 |  |  | import re | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-10-24 09:49:01 +05:30
										 |  |  | from .common import InfoExtractor | 
					
						
							|  |  |  | from ..utils import ( | 
					
						
							|  |  |  |     float_or_none, | 
					
						
							| 
									
										
										
										
											2016-01-04 05:04:48 +06:00
										 |  |  |     parse_iso8601, | 
					
						
							| 
									
										
										
										
											2015-12-30 21:50:26 +00:00
										 |  |  |     unescapeHTML, | 
					
						
							| 
									
										
										
										
											2014-10-24 09:49:01 +05:30
										 |  |  | ) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | class RteIE(InfoExtractor): | 
					
						
							| 
									
										
										
										
											2015-12-30 21:50:26 +00:00
										 |  |  |     IE_NAME = 'rte' | 
					
						
							|  |  |  |     IE_DESC = 'Raidió Teilifís Éireann TV' | 
					
						
							| 
									
										
										
										
											2015-10-17 11:53:59 +02:00
										 |  |  |     _VALID_URL = r'https?://(?:www\.)?rte\.ie/player/[^/]{2,3}/show/[^/]+/(?P<id>[0-9]+)' | 
					
						
							| 
									
										
										
										
											2014-10-24 09:49:01 +05:30
										 |  |  |     _TEST = { | 
					
						
							| 
									
										
										
										
											2015-10-17 11:49:51 +02:00
										 |  |  |         'url': 'http://www.rte.ie/player/ie/show/iwitness-862/10478715/', | 
					
						
							| 
									
										
										
										
											2014-10-24 09:49:01 +05:30
										 |  |  |         'info_dict': { | 
					
						
							| 
									
										
										
										
											2015-10-17 11:49:51 +02:00
										 |  |  |             'id': '10478715', | 
					
						
							| 
									
										
										
										
											2015-12-30 21:50:26 +00:00
										 |  |  |             'ext': 'flv', | 
					
						
							| 
									
										
										
										
											2015-10-17 11:49:51 +02:00
										 |  |  |             'title': 'Watch iWitness  online', | 
					
						
							| 
									
										
										
										
											2014-10-24 09:49:01 +05:30
										 |  |  |             'thumbnail': 're:^https?://.*\.jpg$', | 
					
						
							| 
									
										
										
										
											2015-10-17 11:49:51 +02:00
										 |  |  |             'description': 'iWitness : The spirit of Ireland, one voice and one minute at a time.', | 
					
						
							|  |  |  |             'duration': 60.046, | 
					
						
							| 
									
										
										
										
											2015-01-10 17:57:21 +01:00
										 |  |  |         }, | 
					
						
							|  |  |  |         'params': { | 
					
						
							|  |  |  |             'skip_download': 'f4m fails with --test atm' | 
					
						
							| 
									
										
										
										
											2014-10-24 09:49:01 +05:30
										 |  |  |         } | 
					
						
							|  |  |  |     } | 
					
						
							| 
									
										
										
										
											2015-01-10 17:59:07 +01:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-10-24 09:49:01 +05:30
										 |  |  |     def _real_extract(self, url): | 
					
						
							|  |  |  |         video_id = self._match_id(url) | 
					
						
							|  |  |  |         webpage = self._download_webpage(url, video_id) | 
					
						
							| 
									
										
										
										
											2015-01-10 17:57:21 +01:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-10-24 09:49:01 +05:30
										 |  |  |         title = self._og_search_title(webpage) | 
					
						
							| 
									
										
										
										
											2015-01-10 17:57:21 +01:00
										 |  |  |         description = self._html_search_meta('description', webpage, 'description') | 
					
						
							|  |  |  |         duration = float_or_none(self._html_search_meta( | 
					
						
							|  |  |  |             'duration', webpage, 'duration', fatal=False), 1000) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         thumbnail_id = self._search_regex( | 
					
						
							|  |  |  |             r'<meta name="thumbnail" content="uri:irus:(.*?)" />', webpage, 'thumbnail') | 
					
						
							|  |  |  |         thumbnail = 'http://img.rasset.ie/' + thumbnail_id + '.jpg' | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2016-02-14 15:37:17 +06:00
										 |  |  |         feeds_url = self._html_search_meta('feeds-prefix', webpage, 'feeds url') + video_id | 
					
						
							| 
									
										
										
										
											2014-10-24 09:49:01 +05:30
										 |  |  |         json_string = self._download_json(feeds_url, video_id) | 
					
						
							| 
									
										
										
										
											2015-01-10 17:57:21 +01:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-10-24 09:49:01 +05:30
										 |  |  |         # f4m_url = server + relative_url | 
					
						
							|  |  |  |         f4m_url = json_string['shows'][0]['media:group'][0]['rte:server'] + json_string['shows'][0]['media:group'][0]['url'] | 
					
						
							|  |  |  |         f4m_formats = self._extract_f4m_formats(f4m_url, video_id) | 
					
						
							| 
									
										
										
										
											2016-03-27 07:03:08 +06:00
										 |  |  |         self._sort_formats(f4m_formats) | 
					
						
							| 
									
										
										
										
											2015-01-10 17:57:21 +01:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-10-24 09:49:01 +05:30
										 |  |  |         return { | 
					
						
							|  |  |  |             'id': video_id, | 
					
						
							|  |  |  |             'title': title, | 
					
						
							|  |  |  |             'formats': f4m_formats, | 
					
						
							|  |  |  |             'description': description, | 
					
						
							|  |  |  |             'thumbnail': thumbnail, | 
					
						
							|  |  |  |             'duration': duration, | 
					
						
							| 
									
										
										
										
											2015-01-10 17:57:21 +01:00
										 |  |  |         } | 
					
						
							| 
									
										
										
										
											2015-12-30 21:50:26 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | class RteRadioIE(InfoExtractor): | 
					
						
							|  |  |  |     IE_NAME = 'rte:radio' | 
					
						
							|  |  |  |     IE_DESC = 'Raidió Teilifís Éireann radio' | 
					
						
							| 
									
										
										
										
											2016-02-06 18:42:57 +00:00
										 |  |  |     # Radioplayer URLs have two distinct specifier formats, | 
					
						
							|  |  |  |     # the old format #!rii=<channel_id>:<id>:<playable_item_id>:<date>: | 
					
						
							|  |  |  |     # the new format #!rii=b<channel_id>_<id>_<playable_item_id>_<date>_ | 
					
						
							| 
									
										
										
										
											2015-12-30 21:50:26 +00:00
										 |  |  |     # where the IDs are int/empty, the date is DD-MM-YYYY, and the specifier may be truncated. | 
					
						
							|  |  |  |     # An <id> uniquely defines an individual recording, and is the only part we require. | 
					
						
							| 
									
										
										
										
											2016-02-06 18:42:57 +00:00
										 |  |  |     _VALID_URL = r'https?://(?:www\.)?rte\.ie/radio/utils/radioplayer/rteradioweb\.html#!rii=(?:b?[0-9]*)(?:%3A|:|%5F|_)(?P<id>[0-9]+)' | 
					
						
							| 
									
										
										
										
											2015-12-30 21:50:26 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2016-02-06 18:42:57 +00:00
										 |  |  |     _TESTS = [{ | 
					
						
							|  |  |  |         # Old-style player URL; HLS and RTMPE formats | 
					
						
							| 
									
										
										
										
											2015-12-30 21:50:26 +00:00
										 |  |  |         'url': 'http://www.rte.ie/radio/utils/radioplayer/rteradioweb.html#!rii=16:10507902:2414:27-12-2015:', | 
					
						
							|  |  |  |         'info_dict': { | 
					
						
							|  |  |  |             'id': '10507902', | 
					
						
							| 
									
										
										
										
											2016-01-04 05:04:48 +06:00
										 |  |  |             'ext': 'mp4', | 
					
						
							| 
									
										
										
										
											2015-12-30 21:50:26 +00:00
										 |  |  |             'title': 'Gloria', | 
					
						
							|  |  |  |             'thumbnail': 're:^https?://.*\.jpg$', | 
					
						
							| 
									
										
										
										
											2016-01-04 05:04:48 +06:00
										 |  |  |             'description': 'md5:9ce124a7fb41559ec68f06387cabddf0', | 
					
						
							|  |  |  |             'timestamp': 1451203200, | 
					
						
							|  |  |  |             'upload_date': '20151227', | 
					
						
							| 
									
										
										
										
											2015-12-30 21:50:26 +00:00
										 |  |  |             'duration': 7230.0, | 
					
						
							|  |  |  |         }, | 
					
						
							|  |  |  |         'params': { | 
					
						
							|  |  |  |             'skip_download': 'f4m fails with --test atm' | 
					
						
							|  |  |  |         } | 
					
						
							| 
									
										
										
										
											2016-02-06 18:42:57 +00:00
										 |  |  |     }, { | 
					
						
							|  |  |  |         # New-style player URL; RTMPE formats only | 
					
						
							|  |  |  |         'url': 'http://rte.ie/radio/utils/radioplayer/rteradioweb.html#!rii=b16_3250678_8861_06-04-2012_', | 
					
						
							|  |  |  |         'info_dict': { | 
					
						
							|  |  |  |             'id': '3250678', | 
					
						
							|  |  |  |             'ext': 'flv', | 
					
						
							|  |  |  |             'title': 'The Lyric Concert with Paul Herriott', | 
					
						
							|  |  |  |             'thumbnail': 're:^https?://.*\.jpg$', | 
					
						
							|  |  |  |             'description': '', | 
					
						
							|  |  |  |             'timestamp': 1333742400, | 
					
						
							|  |  |  |             'upload_date': '20120406', | 
					
						
							|  |  |  |             'duration': 7199.016, | 
					
						
							|  |  |  |         }, | 
					
						
							|  |  |  |         'params': { | 
					
						
							|  |  |  |             'skip_download': 'f4m fails with --test atm' | 
					
						
							|  |  |  |         } | 
					
						
							|  |  |  |     }] | 
					
						
							| 
									
										
										
										
											2015-12-30 21:50:26 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  |     def _real_extract(self, url): | 
					
						
							|  |  |  |         item_id = self._match_id(url) | 
					
						
							| 
									
										
										
										
											2016-01-04 05:04:48 +06:00
										 |  |  | 
 | 
					
						
							|  |  |  |         json_string = self._download_json( | 
					
						
							|  |  |  |             'http://www.rte.ie/rteavgen/getplaylist/?type=web&format=json&id=' + item_id, | 
					
						
							|  |  |  |             item_id) | 
					
						
							| 
									
										
										
										
											2015-12-30 21:50:26 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  |         # NB the string values in the JSON are stored using XML escaping(!) | 
					
						
							|  |  |  |         show = json_string['shows'][0] | 
					
						
							|  |  |  |         title = unescapeHTML(show['title']) | 
					
						
							|  |  |  |         description = unescapeHTML(show.get('description')) | 
					
						
							|  |  |  |         thumbnail = show.get('thumbnail') | 
					
						
							|  |  |  |         duration = float_or_none(show.get('duration'), 1000) | 
					
						
							| 
									
										
										
										
											2016-01-04 05:04:48 +06:00
										 |  |  |         timestamp = parse_iso8601(show.get('published')) | 
					
						
							| 
									
										
										
										
											2015-12-30 21:50:26 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  |         mg = show['media:group'][0] | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         formats = [] | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2016-02-06 18:42:57 +00:00
										 |  |  |         if mg.get('url'): | 
					
						
							|  |  |  |             m = re.match(r'(?P<url>rtmpe?://[^/]+)/(?P<app>.+)/(?P<playpath>mp4:.*)', mg['url']) | 
					
						
							|  |  |  |             if m: | 
					
						
							|  |  |  |                 m = m.groupdict() | 
					
						
							|  |  |  |                 formats.append({ | 
					
						
							|  |  |  |                     'url': m['url'] + '/' + m['app'], | 
					
						
							|  |  |  |                     'app': m['app'], | 
					
						
							|  |  |  |                     'play_path': m['playpath'], | 
					
						
							|  |  |  |                     'player_url': url, | 
					
						
							|  |  |  |                     'ext': 'flv', | 
					
						
							|  |  |  |                     'format_id': 'rtmp', | 
					
						
							|  |  |  |                 }) | 
					
						
							| 
									
										
										
										
											2015-12-30 21:50:26 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  |         if mg.get('hls_server') and mg.get('hls_url'): | 
					
						
							| 
									
										
										
										
											2016-01-04 05:01:32 +06:00
										 |  |  |             formats.extend(self._extract_m3u8_formats( | 
					
						
							|  |  |  |                 mg['hls_server'] + mg['hls_url'], item_id, 'mp4', | 
					
						
							|  |  |  |                 entry_protocol='m3u8_native', m3u8_id='hls', fatal=False)) | 
					
						
							| 
									
										
										
										
											2015-12-30 21:50:26 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  |         if mg.get('hds_server') and mg.get('hds_url'): | 
					
						
							| 
									
										
										
										
											2016-01-04 05:01:32 +06:00
										 |  |  |             formats.extend(self._extract_f4m_formats( | 
					
						
							|  |  |  |                 mg['hds_server'] + mg['hds_url'], item_id, | 
					
						
							|  |  |  |                 f4m_id='hds', fatal=False)) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         self._sort_formats(formats) | 
					
						
							| 
									
										
										
										
											2015-12-30 21:50:26 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  |         return { | 
					
						
							|  |  |  |             'id': item_id, | 
					
						
							|  |  |  |             'title': title, | 
					
						
							|  |  |  |             'description': description, | 
					
						
							|  |  |  |             'thumbnail': thumbnail, | 
					
						
							| 
									
										
										
										
											2016-01-04 05:04:48 +06:00
										 |  |  |             'timestamp': timestamp, | 
					
						
							| 
									
										
										
										
											2015-12-30 21:50:26 +00:00
										 |  |  |             'duration': duration, | 
					
						
							| 
									
										
										
										
											2016-01-04 05:04:48 +06:00
										 |  |  |             'formats': formats, | 
					
						
							| 
									
										
										
										
											2015-12-30 21:50:26 +00:00
										 |  |  |         } |