fix playpage extraction and username extraction

This commit is contained in:
kjy00302 2016-05-14 17:19:27 +09:00
parent f34dc267d4
commit 0b426f926e

View File

@ -107,10 +107,10 @@ class TvpleIE(InfoExtractor):
def _real_extract(self, url): def _real_extract(self, url):
video_id = self._match_id(url) video_id = self._match_id(url)
webpage = self._download_webpage(url, video_id) webpage = self._download_webpage(url, video_id)
playpage = self._download_json(re.search(r'data-meta="(.*)"', webpage).group(1), "playurl_%d" % int(video_id)) playpage = self._download_json(re.search(r'data-meta="(.*?)"', webpage).group(1), "playurl_%d" % int(video_id))
title = re.search("<h2.*title=\"(.*)\"", webpage).group(1) # title title = re.search("<h2.*title=\"(.*)\"", webpage).group(1) # title
uploader = re.search(r'personacon-sm".*/>\s*(.*)\s*</a>', webpage).group(1) # username uploader = re.search(r'personacon-sm".*/>\s*(.*?)\s*<', webpage).group(1) # username
uploader_id = re.search(r'"/ch/(.*)/videos"', webpage).group(1) # userid uploader_id = re.search(r'"/ch/(.*)/videos"', webpage).group(1) # userid
description = re.search(r'collapse-content linkify break-word video-body">\s*(.*)\s*<button type="button" class="collapse-button', webpage, re.DOTALL).group(1).replace(" <br />", "").replace("<br />", "").replace("\n ", "") # description description = re.search(r'collapse-content linkify break-word video-body">\s*(.*)\s*<button type="button" class="collapse-button', webpage, re.DOTALL).group(1).replace(" <br />", "").replace("<br />", "").replace("\n ", "") # description
view_count = int(re.search(r'fa-play"></i></span>\s*(.*)\s*</li>', webpage).group(1).replace(",", "")) # played view_count = int(re.search(r'fa-play"></i></span>\s*(.*)\s*</li>', webpage).group(1).replace(",", "")) # played