mirror of
				https://github.com/yt-dlp/yt-dlp.git
				synced 2025-10-26 04:00:46 +00:00 
			
		
		
		
	 6d6536acb2
			
		
	
	6d6536acb2
	
	
	
		
			
			- skip m3u8 formats (404 error) - skip unavailable test - download embed page only when it's needed - update _VALID_URL regex (joystiq.com redirects to engadget.com)
		
			
				
	
	
		
			152 lines
		
	
	
		
			5.3 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
			
		
		
	
	
			152 lines
		
	
	
		
			5.3 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
| from __future__ import unicode_literals
 | |
| 
 | |
| import re
 | |
| 
 | |
| from .common import InfoExtractor
 | |
| from ..compat import (
 | |
|     compat_urllib_parse,
 | |
|     compat_parse_qs,
 | |
|     compat_urllib_parse_urlparse,
 | |
|     compat_urlparse,
 | |
| )
 | |
| from ..utils import (
 | |
|     ExtractorError,
 | |
|     parse_duration,
 | |
|     replace_extension,
 | |
| )
 | |
| 
 | |
| 
 | |
class FiveMinIE(InfoExtractor):
    # Extractor registered under the name '5min'.  _VALID_URL accepts either
    # the internal '5min:<id>[:<sid>]' form or a PlayerSeed.js script URL
    # whose query string is captured as the 'query' group.
    IE_NAME = '5min'
    _VALID_URL = r'(?:5min:(?P<id>\d+)(?::(?P<sid>\d+))?|https?://[^/]*?5min\.com/Scripts/PlayerSeed\.js\?(?P<query>.*))'

    _TESTS = [
        {
            # From http://www.engadget.com/2013/11/15/ipad-mini-retina-display-review/
            'url': 'http://pshared.5min.com/Scripts/PlayerSeed.js?sid=281&width=560&height=345&playList=518013791',
            'md5': '4f7b0b79bf1a470e5004f7112385941d',
            'info_dict': {
                'id': '518013791',
                'ext': 'mp4',
                'title': 'iPad Mini with Retina Display Review',
                'duration': 177,
            },
        },
        {
            # From http://on.aol.com/video/how-to-make-a-next-level-fruit-salad-518086247
            'url': '5min:518086247',
            'md5': 'e539a9dd682c288ef5a498898009f69e',
            'info_dict': {
                'id': '518086247',
                'ext': 'mp4',
                'title': 'How to Make a Next-Level Fruit Salad',
                'duration': 184,
            },
            'skip': 'no longer available',
        },
    ]

    # Human-readable text for the 'errorMessage' codes returned by the
    # SenseHandler endpoint; unknown codes are reported verbatim.
    _ERRORS = {
        'ErrorVideoNotExist': 'We\'re sorry, but the video you are trying to watch does not exist.',
        'ErrorVideoNoLongerAvailable': 'We\'re sorry, but the video you are trying to watch is no longer available.',
        'ErrorVideoRejected': 'We\'re sorry, but the video you are trying to watch has been removed.',
        'ErrorVideoUserNotGeo': 'We\'re sorry, but the video you are trying to watch cannot be viewed from your current location.',
        'ErrorVideoLibraryRestriction': 'We\'re sorry, but the video you are trying to watch is currently unavailable for viewing at this domain.',
        'ErrorExposurePermission': 'We\'re sorry, but the video you are trying to watch is currently unavailable for viewing at this domain.',
    }

    # Frame size looked up by rendition ID when building the format list.
    _QUALITIES = {
        1: {'width': 640, 'height': 360},
        2: {'width': 854, 'height': 480},
        4: {'width': 1280, 'height': 720},
        8: {'width': 1920, 'height': 1080},
        16: {'width': 640, 'height': 360},
        32: {'width': 854, 'height': 480},
        64: {'width': 1280, 'height': 720},
        128: {'width': 640, 'height': 360},
    }

    def _real_extract(self, url):
        # Resolve the video id and sid from the URL, query the SenseHandler
        # endpoint for metadata, and return the info dict with one format
        # per usable rendition.
        match = re.match(self._VALID_URL, url)
        video_id, sid, query = match.group('id', 'sid', 'query')

        if query:
            # PlayerSeed.js form: the id (and optionally the sid) travel in
            # the query string rather than in the URL itself.
            params = compat_parse_qs(query)
            playlist = params.get('playList')
            if not playlist:
                raise ExtractorError('Invalid URL', expected=True)
            video_id = playlist[0]
            sid_values = params.get('sid')
            if sid_values:
                sid = sid_values[0]

        embed_url = 'https://embed.5min.com/playerseed/?playList=%s' % video_id
        if not sid:
            # Only fetch the embed page when the sid was not supplied.
            embed_page = self._download_webpage(
                embed_url, video_id, 'Downloading embed page')
            sid = self._search_regex(r'sid=(\d+)', embed_page, 'sid')

        api_query = compat_urllib_parse.urlencode({
            'func': 'GetResults',
            'playlist': video_id,
            'sid': sid,
            'isPlayerSeed': 'true',
            'url': embed_url,
        })
        response = self._download_json(
            'https://syn.5min.com/handlers/SenseHandler.ashx?' + api_query,
            video_id)
        if not response['success']:
            error_code = response['errorMessage']
            raise ExtractorError(
                '%s said: %s' % (
                    self.IE_NAME, self._ERRORS.get(error_code, error_code)),
                expected=True)
        info = response['binding'][0]

        # The 'videoUrl' parameter of the embed URL is the template from
        # which every rendition URL is derived.
        embed_query = compat_urllib_parse_urlparse(info['EmbededURL']).query
        base_url = compat_urllib_parse_urlparse(
            compat_parse_qs(embed_query)['videoUrl'][0])

        formats = []
        for rendition in info['Renditions']:
            rendition_type = rendition['RenditionType']
            # aac and m3u8 renditions are skipped.
            if rendition_type in ('aac', 'm3u8'):
                continue
            rendition_id = rendition['ID']
            # Insert the rendition ID where the template path has '//' and
            # switch the extension to the rendition type.
            rendition_path = replace_extension(
                base_url.path.replace('//', '/%s/' % rendition_id),
                rendition_type)
            rendition_url = compat_urlparse.urlunparse(
                base_url._replace(path=rendition_path))
            dimensions = self._QUALITIES.get(rendition_id, {})
            formats.append({
                'format_id': '%s-%d' % (rendition_type, rendition_id),
                'url': rendition_url,
                'width': dimensions.get('width'),
                'height': dimensions.get('height'),
            })
        self._sort_formats(formats)

        return {
            'id': video_id,
            'title': info['Title'],
            'thumbnail': info.get('ThumbURL'),
            'duration': parse_duration(info.get('Duration')),
            'formats': formats,
        }
 |