mirror of
				https://github.com/yt-dlp/yt-dlp.git
				synced 2025-10-24 19:28:42 +00:00 
			
		
		
		
	
		
			
				
	
	
		
			91 lines
		
	
	
		
			2.7 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
			
		
		
	
	
			91 lines
		
	
	
		
			2.7 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
| # coding: utf-8
 | |
| from __future__ import unicode_literals
 | |
| 
 | |
| from .common import InfoExtractor
 | |
| import re
 | |
| 
 | |
| 
 | |
| class ToypicsIE(InfoExtractor):
 | |
|     IE_DESC = 'Toypics video'
 | |
|     _VALID_URL = r'https?://videos\.toypics\.net/view/(?P<id>[0-9]+)'
 | |
|     _TEST = {
 | |
|         'url': 'http://videos.toypics.net/view/514/chancebulged,-2-1/',
 | |
|         'md5': '16e806ad6d6f58079d210fe30985e08b',
 | |
|         'info_dict': {
 | |
|             'id': '514',
 | |
|             'ext': 'mp4',
 | |
|             'title': "Chance-Bulge'd, 2",
 | |
|             'age_limit': 18,
 | |
|             'uploader': 'kidsune',
 | |
|         }
 | |
|     }
 | |
| 
 | |
|     def _real_extract(self, url):
 | |
|         video_id = self._match_id(url)
 | |
| 
 | |
|         webpage = self._download_webpage(url, video_id)
 | |
| 
 | |
|         formats = self._parse_html5_media_entries(
 | |
|             url, webpage, video_id)[0]['formats']
 | |
|         title = self._html_search_regex([
 | |
|             r'<h1[^>]+class=["\']view-video-title[^>]+>([^<]+)</h',
 | |
|             r'<title>([^<]+) - Toypics</title>',
 | |
|         ], webpage, 'title')
 | |
| 
 | |
|         uploader = self._html_search_regex(
 | |
|             r'More videos from <strong>([^<]+)</strong>', webpage, 'uploader',
 | |
|             fatal=False)
 | |
| 
 | |
|         return {
 | |
|             'id': video_id,
 | |
|             'formats': formats,
 | |
|             'title': title,
 | |
|             'uploader': uploader,
 | |
|             'age_limit': 18,
 | |
|         }
 | |
| 
 | |
| 
 | |
| class ToypicsUserIE(InfoExtractor):
 | |
|     IE_DESC = 'Toypics user profile'
 | |
|     _VALID_URL = r'https?://videos\.toypics\.net/(?!view)(?P<id>[^/?#&]+)'
 | |
|     _TEST = {
 | |
|         'url': 'http://videos.toypics.net/Mikey',
 | |
|         'info_dict': {
 | |
|             'id': 'Mikey',
 | |
|         },
 | |
|         'playlist_mincount': 19,
 | |
|     }
 | |
| 
 | |
|     def _real_extract(self, url):
 | |
|         username = self._match_id(url)
 | |
| 
 | |
|         profile_page = self._download_webpage(
 | |
|             url, username, note='Retrieving profile page')
 | |
| 
 | |
|         video_count = int(self._search_regex(
 | |
|             r'public/">Public Videos \(([0-9]+)\)</a></li>', profile_page,
 | |
|             'video count'))
 | |
| 
 | |
|         PAGE_SIZE = 8
 | |
|         urls = []
 | |
|         page_count = (video_count + PAGE_SIZE + 1) // PAGE_SIZE
 | |
|         for n in range(1, page_count + 1):
 | |
|             lpage_url = url + '/public/%d' % n
 | |
|             lpage = self._download_webpage(
 | |
|                 lpage_url, username,
 | |
|                 note='Downloading page %d/%d' % (n, page_count))
 | |
|             urls.extend(
 | |
|                 re.findall(
 | |
|                     r'<div[^>]+class=["\']preview[^>]+>\s*<a[^>]+href="(https?://videos\.toypics\.net/view/[^"]+)"',
 | |
|                     lpage))
 | |
| 
 | |
|         return {
 | |
|             '_type': 'playlist',
 | |
|             'id': username,
 | |
|             'entries': [{
 | |
|                 '_type': 'url',
 | |
|                 'url': eurl,
 | |
|                 'ie_key': 'Toypics',
 | |
|             } for eurl in urls]
 | |
|         }
 | 
