[thisamericanlife] Add a new extractor

This commit is contained in:
Eric Wong 2015-06-15 01:07:48 -07:00
parent 4b9f9010b0
commit 0283618ac2
2 changed files with 33 additions and 0 deletions

View File

@ -560,6 +560,7 @@ from .tf1 import TF1IE
from .theonion import TheOnionIE
from .theplatform import ThePlatformIE
from .thesixtyone import TheSixtyOneIE
from .thisamericanlife import ThisAmericanLifeIE
from .thisav import ThisAVIE
from .tinypic import TinyPicIE
from .tlc import TlcIE, TlcDeIE

View File

@ -0,0 +1,32 @@
# coding: utf-8
from __future__ import unicode_literals
from .common import InfoExtractor
class ThisAmericanLifeIE(InfoExtractor):
_VALID_URL = r'https?://(?:www\.)?thisamericanlife\.org/radio-archives/episode/(?P<id>\d+)'
_TEST = {
'url': 'http://www.thisamericanlife.org/radio-archives/episode/487/harper-high-school-part-one',
'md5': '5cda28076c9f9d1fd0b0f5cff5959948',
'info_dict': {
'id': '487',
'title': '487: Harper High School, Part One',
'url' : 'http://stream.thisamericanlife.org/487/stream/487_64k.m3u8',
'ext': 'aac',
}
}
def _real_extract(self, url):
video_id = self._match_id(url)
webpage = self._download_webpage(url, video_id)
title = self._html_search_regex(r'<h1[^>]*>(.*?)</h1>', webpage, 'title')
media_url = 'http://stream.thisamericanlife.org/' + video_id + '/stream/' + video_id + '_64k.m3u8'
return {
'id': video_id,
'title': title,
'url': media_url,
'ext': 'aac',
}