46 lines
		
	
	
		
			1.3 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
			
		
		
	
	
			46 lines
		
	
	
		
			1.3 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
import re
 | 
						|
 | 
						|
from .common import InfoExtractor
 | 
						|
from ..utils import (
 | 
						|
    ExtractorError,
 | 
						|
)
 | 
						|
 | 
						|
 | 
						|
class YouJizzIE(InfoExtractor):
    """Information extractor for youjizz.com video pages.

    Handles URLs of the form ``youjizz.com/videos/<videoid>.html`` (with an
    optional scheme and an optional single sub-domain), as described by
    ``_VALID_URL``.
    """

    # The dot before ``html`` is escaped so that only a literal ``.html``
    # suffix is accepted (an unescaped ``.`` would match any character).
    _VALID_URL = r'^(?:https?://)?(?:\w+\.)?youjizz\.com/videos/(?P<videoid>[^.]+)\.html$'

    def _real_extract(self, url):
        """Extract the video information for a youjizz.com video page.

        The video page is downloaded to obtain the title and the URL of the
        embed page; the embed page is then downloaded to obtain the actual
        media URL.

        Args:
            url: Video page URL; expected to match ``_VALID_URL``.

        Returns:
            A list containing a single dict with the keys ``id``, ``url``,
            ``title``, ``ext``, ``format`` and ``player_url``.

        Raises:
            ExtractorError: If no embed page URL is found in the video page.

        NOTE(review): ``_download_webpage``, ``_html_search_regex`` and
        ``_search_regex`` are inherited helpers not visible here; they
        presumably raise on failure as well -- confirm against the base
        class.
        """
        mobj = re.match(self._VALID_URL, url)

        # Provisional id taken from the page URL; it is replaced below by the
        # numeric id found in the embed page URL.
        video_id = mobj.group('videoid')

        # Get webpage content
        webpage = self._download_webpage(url, video_id)

        # Get the video title. The capture is non-greedy so that it stops at
        # the first closing tag even if several ``</title>`` occur on the
        # same line.
        video_title = self._html_search_regex(
            r'<title>(?P<title>.*?)</title>',
            webpage, u'title').strip()

        # Get the embed page. Dots in the host name are escaped so that they
        # only match literal dots.
        result = re.search(
            r'https?://www\.youjizz\.com/videos/embed/(?P<videoid>[0-9]+)',
            webpage)
        if result is None:
            raise ExtractorError(u'ERROR: unable to extract embed page')

        # The pattern cannot match whitespace, so the matched text is used
        # as-is.
        embed_page_url = result.group(0)
        video_id = result.group('videoid')

        webpage = self._download_webpage(embed_page_url, video_id)

        # Get the video URL from the player setup call in the embed page.
        video_url = self._search_regex(
            r'so\.addVariable\("file",encodeURIComponent\("(?P<source>[^"]+)"\)\);',
            webpage, u'video URL')

        info = {
            'id': video_id,
            'url': video_url,
            'title': video_title,
            'ext': 'flv',
            'format': 'flv',
            'player_url': embed_page_url,
        }

        return [info]
 |