diff --git a/youtube_dl/extractor/pornhub.py b/youtube_dl/extractor/pornhub.py index e16c10f97..428324ef0 100644 --- a/youtube_dl/extractor/pornhub.py +++ b/youtube_dl/extractor/pornhub.py @@ -302,14 +302,17 @@ class PornHubIE(PornHubBaseIE): comment_count = self._extract_count( r'All Comments\s*\(([\d,.]+)\)', webpage, 'comment') - def _get_text(class_name, page): - div = re.search( - r'
\s+[^\n]+\s+([^\n]+)\s+[^\n]+\s+
', page) + def _get_items(class_name): + div = self._search_regex( + r'
([\S\s]+?)
', + webpage, class_name, default=None) if div: - return [a for a in re.findall(r']+>([^<]+)', div.group(1))] + return [a for a in re.findall(r']+>([^<]+)', div)] + else: + return None - categories = _get_text('categoriesWrapper', webpage) - tags = _get_text('tagsWrapper', webpage) + categories = _get_items('categoriesWrapper') + tags = _get_items('tagsWrapper') return { 'id': video_id,