| 
									
										
										
										
											2015-08-24 00:36:24 +06:00
										 |  |  |  | # coding: utf-8 | 
					
						
							| 
									
										
										
										
											2015-03-09 19:06:49 +06:00
										 |  |  |  | from __future__ import unicode_literals | 
					
						
							|  |  |  |  | 
 | 
					
						
							|  |  |  |  | import re | 
					
						
							|  |  |  |  | import hashlib | 
					
						
							|  |  |  |  | 
 | 
					
						
							|  |  |  |  | from .common import InfoExtractor | 
					
						
							| 
									
										
										
										
											2015-08-26 00:11:15 +06:00
										 |  |  |  | from ..compat import ( | 
					
						
							|  |  |  |  |     compat_str, | 
					
						
							|  |  |  |  |     compat_urllib_parse, | 
					
						
							|  |  |  |  | ) | 
					
						
							| 
									
										
										
										
											2015-03-09 21:43:46 +06:00
										 |  |  |  | from ..utils import ( | 
					
						
							| 
									
										
										
										
											2016-03-04 21:32:54 +06:00
										 |  |  |  |     ExtractorError, | 
					
						
							| 
									
										
										
										
											2015-03-09 21:43:46 +06:00
										 |  |  |  |     int_or_none, | 
					
						
							|  |  |  |  |     float_or_none, | 
					
						
							| 
									
										
										
										
											2015-11-21 22:18:17 +06:00
										 |  |  |  |     sanitized_Request, | 
					
						
							| 
									
										
										
										
											2015-03-09 21:43:46 +06:00
										 |  |  |  | ) | 
					
						
							| 
									
										
										
										
											2015-03-09 19:06:49 +06:00
										 |  |  |  | 
 | 
					
						
							|  |  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2016-03-04 21:32:54 +06:00
										 |  |  |  | class YandexMusicBaseIE(InfoExtractor): | 
					
						
							|  |  |  |  |     @staticmethod | 
					
						
							|  |  |  |  |     def _handle_error(response): | 
					
						
							|  |  |  |  |         error = response.get('error') | 
					
						
							|  |  |  |  |         if error: | 
					
						
							|  |  |  |  |             raise ExtractorError(error, expected=True) | 
					
						
							|  |  |  |  | 
 | 
					
						
							|  |  |  |  |     def _download_json(self, *args, **kwargs): | 
					
						
							|  |  |  |  |         response = super(YandexMusicBaseIE, self)._download_json(*args, **kwargs) | 
					
						
							|  |  |  |  |         self._handle_error(response) | 
					
						
							|  |  |  |  |         return response | 
					
						
							|  |  |  |  | 
 | 
					
						
							|  |  |  |  | 
 | 
					
						
							|  |  |  |  | class YandexMusicTrackIE(YandexMusicBaseIE): | 
					
						
							| 
									
										
										
										
											2015-08-24 00:36:54 +06:00
										 |  |  |  |     IE_NAME = 'yandexmusic:track' | 
					
						
							|  |  |  |  |     IE_DESC = 'Яндекс.Музыка - Трек' | 
					
						
							|  |  |  |  |     _VALID_URL = r'https?://music\.yandex\.(?:ru|kz|ua|by)/album/(?P<album_id>\d+)/track/(?P<id>\d+)' | 
					
						
							|  |  |  |  | 
 | 
					
						
							|  |  |  |  |     _TEST = { | 
					
						
							|  |  |  |  |         'url': 'http://music.yandex.ru/album/540508/track/4878838', | 
					
						
							|  |  |  |  |         'md5': 'f496818aa2f60b6c0062980d2e00dc20', | 
					
						
							|  |  |  |  |         'info_dict': { | 
					
						
							|  |  |  |  |             'id': '4878838', | 
					
						
							|  |  |  |  |             'ext': 'mp3', | 
					
						
							|  |  |  |  |             'title': 'Carlo Ambrosio - Gypsy Eyes 1', | 
					
						
							|  |  |  |  |             'filesize': 4628061, | 
					
						
							|  |  |  |  |             'duration': 193.04, | 
					
						
							|  |  |  |  |         } | 
					
						
							|  |  |  |  |     } | 
					
						
							|  |  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2015-03-09 19:06:49 +06:00
										 |  |  |  |     def _get_track_url(self, storage_dir, track_id): | 
					
						
							| 
									
										
										
										
											2015-03-09 21:43:46 +06:00
										 |  |  |  |         data = self._download_json( | 
					
						
							|  |  |  |  |             'http://music.yandex.ru/api/v1.5/handlers/api-jsonp.jsx?action=getTrackSrc&p=download-info/%s' | 
					
						
							|  |  |  |  |             % storage_dir, | 
					
						
							|  |  |  |  |             track_id, 'Downloading track location JSON') | 
					
						
							| 
									
										
										
										
											2015-03-09 19:06:49 +06:00
										 |  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2015-03-09 21:43:46 +06:00
										 |  |  |  |         key = hashlib.md5(('XGRlBW9FXlekgbPrRHuSiA' + data['path'][1:] + data['s']).encode('utf-8')).hexdigest() | 
					
						
							| 
									
										
										
										
											2015-03-09 19:06:49 +06:00
										 |  |  |  |         storage = storage_dir.split('.') | 
					
						
							|  |  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2015-03-09 21:43:46 +06:00
										 |  |  |  |         return ('http://%s/get-mp3/%s/%s?track-id=%s&from=service-10-track&similarities-experiment=default' | 
					
						
							|  |  |  |  |                 % (data['host'], key, data['ts'] + data['path'], storage[1])) | 
					
						
							| 
									
										
										
										
											2015-03-09 19:06:49 +06:00
										 |  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2015-03-09 21:43:46 +06:00
										 |  |  |  |     def _get_track_info(self, track): | 
					
						
							| 
									
										
										
										
											2015-10-14 21:15:29 +06:00
										 |  |  |  |         thumbnail = None | 
					
						
							|  |  |  |  |         cover_uri = track.get('albums', [{}])[0].get('coverUri') | 
					
						
							|  |  |  |  |         if cover_uri: | 
					
						
							|  |  |  |  |             thumbnail = cover_uri.replace('%%', 'orig') | 
					
						
							|  |  |  |  |             if not thumbnail.startswith('http'): | 
					
						
							|  |  |  |  |                 thumbnail = 'http://' + thumbnail | 
					
						
							| 
									
										
										
										
											2015-03-09 21:43:46 +06:00
										 |  |  |  |         return { | 
					
						
							|  |  |  |  |             'id': track['id'], | 
					
						
							|  |  |  |  |             'ext': 'mp3', | 
					
						
							|  |  |  |  |             'url': self._get_track_url(track['storageDir'], track['id']), | 
					
						
							|  |  |  |  |             'title': '%s - %s' % (track['artists'][0]['name'], track['title']), | 
					
						
							|  |  |  |  |             'filesize': int_or_none(track.get('fileSize')), | 
					
						
							|  |  |  |  |             'duration': float_or_none(track.get('durationMs'), 1000), | 
					
						
							| 
									
										
										
										
											2015-10-14 21:15:29 +06:00
										 |  |  |  |             'thumbnail': thumbnail, | 
					
						
							| 
									
										
										
										
											2015-03-09 21:43:46 +06:00
										 |  |  |  |         } | 
					
						
							| 
									
										
										
										
											2015-03-09 19:06:49 +06:00
										 |  |  |  | 
 | 
					
						
							|  |  |  |  |     def _real_extract(self, url): | 
					
						
							| 
									
										
										
										
											2015-03-09 21:43:46 +06:00
										 |  |  |  |         mobj = re.match(self._VALID_URL, url) | 
					
						
							|  |  |  |  |         album_id, track_id = mobj.group('album_id'), mobj.group('id') | 
					
						
							| 
									
										
										
										
											2015-03-09 19:06:49 +06:00
										 |  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2015-03-09 21:43:46 +06:00
										 |  |  |  |         track = self._download_json( | 
					
						
							|  |  |  |  |             'http://music.yandex.ru/handlers/track.jsx?track=%s:%s' % (track_id, album_id), | 
					
						
							|  |  |  |  |             track_id, 'Downloading track JSON')['track'] | 
					
						
							| 
									
										
										
										
											2015-03-09 19:06:49 +06:00
										 |  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2015-03-09 21:43:46 +06:00
										 |  |  |  |         return self._get_track_info(track) | 
					
						
							| 
									
										
										
										
											2015-03-09 19:06:49 +06:00
										 |  |  |  | 
 | 
					
						
							|  |  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2016-03-04 21:32:54 +06:00
										 |  |  |  | class YandexMusicPlaylistBaseIE(YandexMusicBaseIE): | 
					
						
							| 
									
										
										
										
											2015-08-24 00:36:24 +06:00
										 |  |  |  |     def _build_playlist(self, tracks): | 
					
						
							|  |  |  |  |         return [ | 
					
						
							|  |  |  |  |             self.url_result( | 
					
						
							|  |  |  |  |                 'http://music.yandex.ru/album/%s/track/%s' % (track['albums'][0]['id'], track['id'])) | 
					
						
							| 
									
										
										
										
											2015-08-25 23:29:02 +06:00
										 |  |  |  |             for track in tracks if track.get('albums') and isinstance(track.get('albums'), list)] | 
					
						
							| 
									
										
										
										
											2015-08-24 00:36:24 +06:00
										 |  |  |  | 
 | 
					
						
							|  |  |  |  | 
 | 
					
						
							|  |  |  |  | class YandexMusicAlbumIE(YandexMusicPlaylistBaseIE): | 
					
						
							| 
									
										
										
										
											2015-03-09 21:43:46 +06:00
										 |  |  |  |     IE_NAME = 'yandexmusic:album' | 
					
						
							|  |  |  |  |     IE_DESC = 'Яндекс.Музыка - Альбом' | 
					
						
							| 
									
										
										
										
											2015-03-14 13:56:04 +06:00
										 |  |  |  |     _VALID_URL = r'https?://music\.yandex\.(?:ru|kz|ua|by)/album/(?P<id>\d+)/?(\?|$)' | 
					
						
							| 
									
										
										
										
											2015-03-09 19:06:49 +06:00
										 |  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2015-03-09 21:43:46 +06:00
										 |  |  |  |     _TEST = { | 
					
						
							|  |  |  |  |         'url': 'http://music.yandex.ru/album/540508', | 
					
						
							|  |  |  |  |         'info_dict': { | 
					
						
							|  |  |  |  |             'id': '540508', | 
					
						
							|  |  |  |  |             'title': 'Carlo Ambrosio - Gypsy Soul (2009)', | 
					
						
							|  |  |  |  |         }, | 
					
						
							|  |  |  |  |         'playlist_count': 50, | 
					
						
							|  |  |  |  |     } | 
					
						
							| 
									
										
										
										
											2015-03-09 19:06:49 +06:00
										 |  |  |  | 
 | 
					
						
							|  |  |  |  |     def _real_extract(self, url): | 
					
						
							| 
									
										
										
										
											2015-03-09 21:43:46 +06:00
										 |  |  |  |         album_id = self._match_id(url) | 
					
						
							| 
									
										
										
										
											2015-03-09 19:06:49 +06:00
										 |  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2015-03-09 21:43:46 +06:00
										 |  |  |  |         album = self._download_json( | 
					
						
							|  |  |  |  |             'http://music.yandex.ru/handlers/album.jsx?album=%s' % album_id, | 
					
						
							|  |  |  |  |             album_id, 'Downloading album JSON') | 
					
						
							| 
									
										
										
										
											2015-03-09 19:06:49 +06:00
										 |  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2015-08-24 00:36:24 +06:00
										 |  |  |  |         entries = self._build_playlist(album['volumes'][0]) | 
					
						
							| 
									
										
										
										
											2015-03-09 21:43:46 +06:00
										 |  |  |  | 
 | 
					
						
							|  |  |  |  |         title = '%s - %s' % (album['artists'][0]['name'], album['title']) | 
					
						
							|  |  |  |  |         year = album.get('year') | 
					
						
							|  |  |  |  |         if year: | 
					
						
							|  |  |  |  |             title += ' (%s)' % year | 
					
						
							|  |  |  |  | 
 | 
					
						
							|  |  |  |  |         return self.playlist_result(entries, compat_str(album['id']), title) | 
					
						
							| 
									
										
										
										
											2015-03-09 19:06:49 +06:00
										 |  |  |  | 
 | 
					
						
							|  |  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2015-08-24 00:36:24 +06:00
										 |  |  |  | class YandexMusicPlaylistIE(YandexMusicPlaylistBaseIE): | 
					
						
							| 
									
										
										
										
											2015-03-09 21:43:46 +06:00
										 |  |  |  |     IE_NAME = 'yandexmusic:playlist' | 
					
						
							|  |  |  |  |     IE_DESC = 'Яндекс.Музыка - Плейлист' | 
					
						
							| 
									
										
										
										
											2015-03-14 13:56:04 +06:00
										 |  |  |  |     _VALID_URL = r'https?://music\.yandex\.(?:ru|kz|ua|by)/users/[^/]+/playlists/(?P<id>\d+)' | 
					
						
							| 
									
										
										
										
											2015-03-09 21:43:46 +06:00
										 |  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2015-08-26 00:11:15 +06:00
										 |  |  |  |     _TESTS = [{ | 
					
						
							| 
									
										
										
										
											2015-03-09 21:43:46 +06:00
										 |  |  |  |         'url': 'http://music.yandex.ru/users/music.partners/playlists/1245', | 
					
						
							| 
									
										
										
										
											2015-03-09 19:06:49 +06:00
										 |  |  |  |         'info_dict': { | 
					
						
							| 
									
										
										
										
											2015-03-09 21:43:46 +06:00
										 |  |  |  |             'id': '1245', | 
					
						
							|  |  |  |  |             'title': 'Что слушают Enter Shikari', | 
					
						
							|  |  |  |  |             'description': 'md5:3b9f27b0efbe53f2ee1e844d07155cc9', | 
					
						
							|  |  |  |  |         }, | 
					
						
							|  |  |  |  |         'playlist_count': 6, | 
					
						
							| 
									
										
										
										
											2015-08-26 00:11:15 +06:00
										 |  |  |  |     }, { | 
					
						
							|  |  |  |  |         # playlist exceeding the limit of 150 tracks shipped with webpage (see | 
					
						
							|  |  |  |  |         # https://github.com/rg3/youtube-dl/issues/6666) | 
					
						
							|  |  |  |  |         'url': 'https://music.yandex.ru/users/ya.playlist/playlists/1036', | 
					
						
							|  |  |  |  |         'info_dict': { | 
					
						
							|  |  |  |  |             'id': '1036', | 
					
						
							|  |  |  |  |             'title': 'Музыка 90-х', | 
					
						
							|  |  |  |  |         }, | 
					
						
							|  |  |  |  |         'playlist_count': 310, | 
					
						
							|  |  |  |  |     }] | 
					
						
							| 
									
										
										
										
											2015-03-09 19:06:49 +06:00
										 |  |  |  | 
 | 
					
						
							|  |  |  |  |     def _real_extract(self, url): | 
					
						
							| 
									
										
										
										
											2015-03-09 21:43:46 +06:00
										 |  |  |  |         playlist_id = self._match_id(url) | 
					
						
							| 
									
										
										
										
											2015-03-09 19:06:49 +06:00
										 |  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2015-03-09 21:43:46 +06:00
										 |  |  |  |         webpage = self._download_webpage(url, playlist_id) | 
					
						
							| 
									
										
										
										
											2015-03-09 19:06:49 +06:00
										 |  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2015-08-26 00:11:15 +06:00
										 |  |  |  |         mu = self._parse_json( | 
					
						
							| 
									
										
										
										
											2015-03-09 21:43:46 +06:00
										 |  |  |  |             self._search_regex( | 
					
						
							|  |  |  |  |                 r'var\s+Mu\s*=\s*({.+?});\s*</script>', webpage, 'player'), | 
					
						
							| 
									
										
										
										
											2015-08-26 00:11:15 +06:00
										 |  |  |  |             playlist_id) | 
					
						
							|  |  |  |  | 
 | 
					
						
							|  |  |  |  |         playlist = mu['pageData']['playlist'] | 
					
						
							|  |  |  |  |         tracks, track_ids = playlist['tracks'], playlist['trackIds'] | 
					
						
							|  |  |  |  | 
 | 
					
						
							|  |  |  |  |         # tracks dictionary shipped with webpage is limited to 150 tracks, | 
					
						
							|  |  |  |  |         # missing tracks should be retrieved manually. | 
					
						
							|  |  |  |  |         if len(tracks) < len(track_ids): | 
					
						
							|  |  |  |  |             present_track_ids = set([compat_str(track['id']) for track in tracks if track.get('id')]) | 
					
						
							|  |  |  |  |             missing_track_ids = set(map(compat_str, track_ids)) - set(present_track_ids) | 
					
						
							| 
									
										
										
										
											2015-11-21 22:18:17 +06:00
										 |  |  |  |             request = sanitized_Request( | 
					
						
							| 
									
										
										
										
											2015-08-26 00:11:15 +06:00
										 |  |  |  |                 'https://music.yandex.ru/handlers/track-entries.jsx', | 
					
						
							|  |  |  |  |                 compat_urllib_parse.urlencode({ | 
					
						
							|  |  |  |  |                     'entries': ','.join(missing_track_ids), | 
					
						
							|  |  |  |  |                     'lang': mu.get('settings', {}).get('lang', 'en'), | 
					
						
							|  |  |  |  |                     'external-domain': 'music.yandex.ru', | 
					
						
							|  |  |  |  |                     'overembed': 'false', | 
					
						
							|  |  |  |  |                     'sign': mu.get('authData', {}).get('user', {}).get('sign'), | 
					
						
							|  |  |  |  |                     'strict': 'true', | 
					
						
							|  |  |  |  |                 }).encode('utf-8')) | 
					
						
							|  |  |  |  |             request.add_header('Referer', url) | 
					
						
							|  |  |  |  |             request.add_header('X-Requested-With', 'XMLHttpRequest') | 
					
						
							|  |  |  |  | 
 | 
					
						
							|  |  |  |  |             missing_tracks = self._download_json( | 
					
						
							|  |  |  |  |                 request, playlist_id, 'Downloading missing tracks JSON', fatal=False) | 
					
						
							|  |  |  |  |             if missing_tracks: | 
					
						
							|  |  |  |  |                 tracks.extend(missing_tracks) | 
					
						
							| 
									
										
										
										
											2015-03-09 21:43:46 +06:00
										 |  |  |  | 
 | 
					
						
							|  |  |  |  |         return self.playlist_result( | 
					
						
							| 
									
										
										
										
											2015-08-26 00:11:15 +06:00
										 |  |  |  |             self._build_playlist(tracks), | 
					
						
							| 
									
										
										
										
											2015-08-24 00:36:24 +06:00
										 |  |  |  |             compat_str(playlist_id), | 
					
						
							| 
									
										
										
										
											2015-03-09 21:43:46 +06:00
										 |  |  |  |             playlist['title'], playlist.get('description')) |