1
0
Fork 0
mirror of https://github.com/yt-dlp/yt-dlp synced 2025-01-18 14:53:04 +01:00
yt-dlp/yt_dlp/extractor/younow.py

195 lines
6.7 KiB
Python
Raw Normal View History

import itertools
2017-03-12 18:19:32 -04:00
from .common import InfoExtractor
from ..utils import (
ExtractorError,
format_field,
int_or_none,
str_or_none,
try_get,
)
2017-03-12 18:19:32 -04:00
# Root of the YouNow API served from cdn.younow.com; the broadcast video-path,
# moment-profile and moment-fetch URLs used in this module are built on top of it.
CDN_API_BASE = 'https://cdn.younow.com/php/api'
# URL template for fetching a single moment. The f-string only fills in the API
# root; the trailing `%s` is deliberately left as a %-placeholder so callers can
# substitute the moment id later with `MOMENT_URL_FORMAT % moment_id`.
MOMENT_URL_FORMAT = f'{CDN_API_BASE}/moment/fetch/id=%s'
2017-03-12 18:19:32 -04:00
class YouNowLiveIE(InfoExtractor):
    """Extractor for a user's live broadcast at ``younow.com/<username>``."""

    _VALID_URL = r'https?://(?:www\.)?younow\.com/(?P<id>[^/?#&]+)'
    _TEST = {
        'url': 'https://www.younow.com/AmandaPadeezy',
        'info_dict': {
            'id': 'AmandaPadeezy',
            'ext': 'mp4',
            'is_live': True,
            'title': 'March 26, 2017',
            'thumbnail': r're:^https?://.*\.jpg$',
            'tags': ['girls'],
            'categories': ['girls'],
            'uploader': 'AmandaPadeezy',
            'uploader_id': '6716501',
            'uploader_url': 'https://www.younow.com/AmandaPadeezy',
            'creator': 'AmandaPadeezy',
        },
        'skip': True,
    }

    @classmethod
    def suitable(cls, url):
        """Return whether this extractor should handle *url*.

        URLs accepted by the channel or moment extractors are always declined
        here (presumably because this class's broad pattern would otherwise
        claim them as well); everything else falls back to the default check.
        """
        if YouNowChannelIE.suitable(url) or YouNowMomentIE.suitable(url):
            return False
        return super().suitable(url)

    def _real_extract(self, url):
        """Fetch broadcast info for the user named in *url* and build the info dict.

        Raises:
            ExtractorError: when the API response does not report
                ``errorCode == 0``; the API's own ``errorMsg`` is used as the
                message when present.
        """
        username = self._match_id(url)
        data = self._download_json(
            f'https://api.younow.com/php/api/broadcast/info/curId=0/user={username}', username)

        if data.get('errorCode') != 0:
            # `errorMsg` is not guaranteed to be present (this branch is also
            # taken when `errorCode` itself is missing), so fall back to a
            # generic message instead of failing with a bare KeyError.
            raise ExtractorError(
                data.get('errorMsg') or 'Unable to retrieve broadcast info',
                expected=True)

        uploader = try_get(
            data, lambda x: x['user']['profileUrlString'], str) or username

        # Both ids are required to build the stream URL, hence the hard lookups.
        stream_url = (
            f'{CDN_API_BASE}/broadcast/videoPath/hls=1'
            f'/broadcastId={data["broadcastId"]}/channelId={data["userId"]}')

        return {
            'id': uploader,
            'is_live': True,
            'title': uploader,
            'thumbnail': data.get('awsUrl'),
            'tags': data.get('tags'),
            'categories': data.get('tags'),
            'uploader': uploader,
            # Normalised to a string, matching the expectation in _TEST and
            # the way _extract_moment reports uploader ids.
            'uploader_id': str_or_none(data.get('userId')),
            'uploader_url': f'https://www.younow.com/{username}',
            'creator': uploader,
            'view_count': int_or_none(data.get('viewers')),
            'like_count': int_or_none(data.get('likes')),
            'formats': [{
                'url': stream_url,
                'ext': 'mp4',
                'protocol': 'm3u8',
            }],
        }
def _extract_moment(item, fatal=True):
moment_id = item.get('momentId')
if not moment_id:
if not fatal:
return
raise ExtractorError('Unable to extract moment id')
moment_id = str(moment_id)
2017-03-12 18:19:32 -04:00
title = item.get('text')
if not title:
title = 'YouNow %s' % (
item.get('momentType') or item.get('titleType') or 'moment')
uploader = try_get(item, lambda x: x['owner']['name'], str)
uploader_id = try_get(item, lambda x: x['owner']['userId'])
uploader_url = format_field(uploader, None, 'https://www.younow.com/%s')
2017-03-12 18:19:32 -04:00
return {
'extractor_key': 'YouNowMoment',
'id': moment_id,
2017-03-12 18:19:32 -04:00
'title': title,
'view_count': int_or_none(item.get('views')),
'like_count': int_or_none(item.get('likes')),
'timestamp': int_or_none(item.get('created')),
'creator': uploader,
'uploader': uploader,
'uploader_id': str_or_none(uploader_id),
'uploader_url': uploader_url,
2017-03-12 18:19:32 -04:00
'formats': [{
'url': f'https://hls.younow.com/momentsplaylists/live/{moment_id}/{moment_id}.m3u8',
2017-03-12 18:19:32 -04:00
'ext': 'mp4',
'protocol': 'm3u8_native',
2017-03-12 18:19:32 -04:00
}],
}
class YouNowChannelIE(InfoExtractor):
    """Playlist extractor for the moments listed at ``younow.com/<username>/channel``."""

    _VALID_URL = r'https?://(?:www\.)?younow\.com/(?P<id>[^/]+)/channel'
    _TEST = {
        'url': 'https://www.younow.com/its_Kateee_/channel',
        'info_dict': {
            'id': '14629760',
            'title': 'its_Kateee_ moments',
        },
        'playlist_mincount': 8,
    }

    def _collection_entries(self, collection, username):
        """Yield info dicts for every moment id listed in a ``collection`` item."""
        moment_ids = collection.get('momentsIds')
        if not isinstance(moment_ids, list):
            return
        for moment_id in moment_ids:
            moment = self._download_json(
                MOMENT_URL_FORMAT % moment_id, username,
                note=f'Downloading {moment_id} moment JSON',
                fatal=False)
            if not (moment and isinstance(moment, dict) and moment.get('item')):
                continue
            # The download above is best-effort, so parsing is as well: one
            # malformed moment must not abort the whole playlist.
            entry = _extract_moment(moment['item'], fatal=False)
            if entry:
                yield entry

    def _entries(self, username, channel_id):
        """Yield info dicts for all moments of the channel, page by page.

        Pages of 20 records are requested from the moment profile endpoint,
        using the ``created`` value of the last processed item as the
        ``createdBefore`` cursor for the next request.
        """
        created_before = 0
        for page_num in itertools.count(1):
            info = self._download_json(
                f'{CDN_API_BASE}/moment/profile/channelId={channel_id}/createdBefore={created_before}/records=20',
                username, note=f'Downloading moments page {page_num}')
            items = info.get('items')
            if not items or not isinstance(items, list):
                break

            previous_cursor = created_before
            for item in items:
                if not isinstance(item, dict):
                    continue
                item_type = item.get('type')
                if item_type == 'moment':
                    entry = _extract_moment(item, fatal=False)
                    if entry:
                        yield entry
                elif item_type == 'collection':
                    yield from self._collection_entries(item, username)
                created_before = int_or_none(item.get('created'))

            # Stop when there is no usable cursor, or when it did not move:
            # requesting the same `createdBefore` again would loop forever.
            if created_before is None or created_before == previous_cursor:
                break

    def _real_extract(self, url):
        """Resolve the username in *url* to its user id and return the moments playlist.

        Raises:
            ExtractorError: if the user information response carries no ``userId``.
        """
        username = self._match_id(url)
        user_info = self._download_json(
            f'https://api.younow.com/php/api/broadcast/info/curId=0/user={username}',
            username, note='Downloading user information')

        user_id = user_info.get('userId')
        if user_id is None:
            # Report the API's own message when it gives one; only then is the
            # failure treated as expected rather than a possible extractor bug.
            error_msg = user_info.get('errorMsg')
            raise ExtractorError(
                error_msg or 'Unable to extract channel id', expected=bool(error_msg))
        channel_id = str(user_id)

        return self.playlist_result(
            self._entries(username, channel_id), channel_id,
            f'{username} moments')
2017-03-12 18:19:32 -04:00
class YouNowMomentIE(InfoExtractor):
    """Extractor for a single moment at ``younow.com/<username>/<moment id>/...``."""

    _VALID_URL = r'https?://(?:www\.)?younow\.com/[^/]+/(?P<id>[^/?#&]+)'
    _TEST = {
        'url': 'https://www.younow.com/GABO.../20712117/36319236/3b316doc/m',
        'md5': 'a30c70eadb9fb39a1aa3c8c0d22a0807',
        'info_dict': {
            'id': '20712117',
            'ext': 'mp4',
            'title': 'YouNow capture',
            'view_count': int,
            'like_count': int,
            'timestamp': 1490432040,
            'upload_date': '20170325',
            'uploader': 'GABO...',
            'uploader_id': '35917228',
        },
    }

    @classmethod
    def suitable(cls, url):
        """Decline URLs the channel extractor accepts; otherwise use the default check."""
        if YouNowChannelIE.suitable(url):
            return False
        return super().suitable(url)

    def _real_extract(self, url):
        """Download the moment's JSON and convert its ``item`` payload into an info dict."""
        moment_id = self._match_id(url)
        response = self._download_json(MOMENT_URL_FORMAT % moment_id, moment_id)
        return _extract_moment(response['item'])