mirror of
https://github.com/yt-dlp/yt-dlp
synced 2025-01-18 14:53:04 +01:00
parent
ed3bb2b0a1
commit
615a84447e
19 changed files with 80 additions and 94 deletions
3
.gitignore
vendored
3
.gitignore
vendored
|
@ -33,6 +33,7 @@ cookies
|
||||||
*.gif
|
*.gif
|
||||||
*.jpeg
|
*.jpeg
|
||||||
*.jpg
|
*.jpg
|
||||||
|
*.lrc
|
||||||
*.m4a
|
*.m4a
|
||||||
*.m4v
|
*.m4v
|
||||||
*.mhtml
|
*.mhtml
|
||||||
|
@ -40,6 +41,7 @@ cookies
|
||||||
*.mov
|
*.mov
|
||||||
*.mp3
|
*.mp3
|
||||||
*.mp4
|
*.mp4
|
||||||
|
*.mpg
|
||||||
*.mpga
|
*.mpga
|
||||||
*.oga
|
*.oga
|
||||||
*.ogg
|
*.ogg
|
||||||
|
@ -47,6 +49,7 @@ cookies
|
||||||
*.png
|
*.png
|
||||||
*.sbv
|
*.sbv
|
||||||
*.srt
|
*.srt
|
||||||
|
*.ssa
|
||||||
*.swf
|
*.swf
|
||||||
*.swp
|
*.swp
|
||||||
*.tt
|
*.tt
|
||||||
|
|
4
Makefile
4
Makefile
|
@ -17,8 +17,8 @@ pypi-files: AUTHORS Changelog.md LICENSE README.md README.txt supportedsites \
|
||||||
clean-test:
|
clean-test:
|
||||||
rm -rf test/testdata/sigs/player-*.js tmp/ *.annotations.xml *.aria2 *.description *.dump *.frag \
|
rm -rf test/testdata/sigs/player-*.js tmp/ *.annotations.xml *.aria2 *.description *.dump *.frag \
|
||||||
*.frag.aria2 *.frag.urls *.info.json *.live_chat.json *.meta *.part* *.tmp *.temp *.unknown_video *.ytdl \
|
*.frag.aria2 *.frag.urls *.info.json *.live_chat.json *.meta *.part* *.tmp *.temp *.unknown_video *.ytdl \
|
||||||
*.3gp *.ape *.ass *.avi *.desktop *.f4v *.flac *.flv *.gif *.jpeg *.jpg *.m4a *.m4v *.mhtml *.mkv *.mov *.mp3 \
|
*.3gp *.ape *.ass *.avi *.desktop *.f4v *.flac *.flv *.gif *.jpeg *.jpg *.lrc *.m4a *.m4v *.mhtml *.mkv *.mov *.mp3 *.mp4 \
|
||||||
*.mp4 *.mpga *.oga *.ogg *.opus *.png *.sbv *.srt *.swf *.swp *.tt *.ttml *.url *.vtt *.wav *.webloc *.webm *.webp
|
*.mpg *.mpga *.oga *.ogg *.opus *.png *.sbv *.srt *.ssa *.swf *.swp *.tt *.ttml *.url *.vtt *.wav *.webloc *.webm *.webp
|
||||||
clean-dist:
|
clean-dist:
|
||||||
rm -rf yt-dlp.1.temp.md yt-dlp.1 README.txt MANIFEST build/ dist/ .coverage cover/ yt-dlp.tar.gz completions/ \
|
rm -rf yt-dlp.1.temp.md yt-dlp.1 README.txt MANIFEST build/ dist/ .coverage cover/ yt-dlp.tar.gz completions/ \
|
||||||
yt_dlp/extractor/lazy_extractors.py *.spec CONTRIBUTING.md.tmp yt-dlp yt-dlp.exe yt_dlp.egg-info/ AUTHORS
|
yt_dlp/extractor/lazy_extractors.py *.spec CONTRIBUTING.md.tmp yt-dlp yt-dlp.exe yt_dlp.egg-info/ AUTHORS
|
||||||
|
|
|
@ -1 +0,0 @@
|
||||||
# Empty file
|
|
|
@ -20,7 +20,7 @@ def main():
|
||||||
'py2exe builds do not support pycryptodomex and needs VC++14 to run. '
|
'py2exe builds do not support pycryptodomex and needs VC++14 to run. '
|
||||||
'It is recommended to run "pyinst.py" to build using pyinstaller instead')
|
'It is recommended to run "pyinst.py" to build using pyinstaller instead')
|
||||||
|
|
||||||
return freeze(
|
freeze(
|
||||||
console=[{
|
console=[{
|
||||||
'script': './yt_dlp/__main__.py',
|
'script': './yt_dlp/__main__.py',
|
||||||
'dest_base': 'yt-dlp',
|
'dest_base': 'yt-dlp',
|
||||||
|
|
|
@ -1 +0,0 @@
|
||||||
# Empty file needed to make devscripts.utils properly importable from outside
|
|
|
@ -120,5 +120,11 @@
|
||||||
"when": "15f22b4880b6b3f71f350c64d70976ae65b9f1ca",
|
"when": "15f22b4880b6b3f71f350c64d70976ae65b9f1ca",
|
||||||
"short": "[webvtt] Allow spaces before newlines for CueBlock (#7681)",
|
"short": "[webvtt] Allow spaces before newlines for CueBlock (#7681)",
|
||||||
"authors": ["TSRBerry"]
|
"authors": ["TSRBerry"]
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"action": "change",
|
||||||
|
"when": "4ce57d3b873c2887814cbec03d029533e82f7db5",
|
||||||
|
"short": "[ie] Support multi-period MPD streams (#6654)",
|
||||||
|
"authors": ["alard", "pukkandan"]
|
||||||
}
|
}
|
||||||
]
|
]
|
||||||
|
|
|
@ -253,7 +253,7 @@ class CommitRange:
|
||||||
''', re.VERBOSE | re.DOTALL)
|
''', re.VERBOSE | re.DOTALL)
|
||||||
EXTRACTOR_INDICATOR_RE = re.compile(r'(?:Fix|Add)\s+Extractors?', re.IGNORECASE)
|
EXTRACTOR_INDICATOR_RE = re.compile(r'(?:Fix|Add)\s+Extractors?', re.IGNORECASE)
|
||||||
REVERT_RE = re.compile(r'(?:\[[^\]]+\]\s+)?(?i:Revert)\s+([\da-f]{40})')
|
REVERT_RE = re.compile(r'(?:\[[^\]]+\]\s+)?(?i:Revert)\s+([\da-f]{40})')
|
||||||
FIXES_RE = re.compile(r'(?i:Fix(?:es)?(?:\s+bugs?)?(?:\s+in|\s+for)?|Revert)\s+([\da-f]{40})')
|
FIXES_RE = re.compile(r'(?i:Fix(?:es)?(?:\s+bugs?)?(?:\s+in|\s+for)?|Revert|Improve)\s+([\da-f]{40})')
|
||||||
UPSTREAM_MERGE_RE = re.compile(r'Update to ytdl-commit-([\da-f]+)')
|
UPSTREAM_MERGE_RE = re.compile(r'Update to ytdl-commit-([\da-f]+)')
|
||||||
|
|
||||||
def __init__(self, start, end, default_author=None):
|
def __init__(self, start, end, default_author=None):
|
||||||
|
|
|
@ -69,7 +69,7 @@ def _build_proxy_handler(name):
|
||||||
self.send_response(200)
|
self.send_response(200)
|
||||||
self.send_header('Content-Type', 'text/plain; charset=utf-8')
|
self.send_header('Content-Type', 'text/plain; charset=utf-8')
|
||||||
self.end_headers()
|
self.end_headers()
|
||||||
self.wfile.write('{self.proxy_name}: {self.path}'.format(self=self).encode())
|
self.wfile.write(f'{self.proxy_name}: {self.path}'.encode())
|
||||||
return HTTPTestRequestHandler
|
return HTTPTestRequestHandler
|
||||||
|
|
||||||
|
|
||||||
|
|
|
@ -575,7 +575,7 @@ class YoutubeDL:
|
||||||
'url', 'manifest_url', 'manifest_stream_number', 'ext', 'format', 'format_id', 'format_note',
|
'url', 'manifest_url', 'manifest_stream_number', 'ext', 'format', 'format_id', 'format_note',
|
||||||
'width', 'height', 'aspect_ratio', 'resolution', 'dynamic_range', 'tbr', 'abr', 'acodec', 'asr', 'audio_channels',
|
'width', 'height', 'aspect_ratio', 'resolution', 'dynamic_range', 'tbr', 'abr', 'acodec', 'asr', 'audio_channels',
|
||||||
'vbr', 'fps', 'vcodec', 'container', 'filesize', 'filesize_approx', 'rows', 'columns',
|
'vbr', 'fps', 'vcodec', 'container', 'filesize', 'filesize_approx', 'rows', 'columns',
|
||||||
'player_url', 'protocol', 'fragment_base_url', 'fragments', 'is_from_start',
|
'player_url', 'protocol', 'fragment_base_url', 'fragments', 'is_from_start', 'is_dash_periods', 'request_data',
|
||||||
'preference', 'language', 'language_preference', 'quality', 'source_preference', 'cookies',
|
'preference', 'language', 'language_preference', 'quality', 'source_preference', 'cookies',
|
||||||
'http_headers', 'stretched_ratio', 'no_resume', 'has_drm', 'extra_param_to_segment_url', 'hls_aes', 'downloader_options',
|
'http_headers', 'stretched_ratio', 'no_resume', 'has_drm', 'extra_param_to_segment_url', 'hls_aes', 'downloader_options',
|
||||||
'page_url', 'app', 'play_path', 'tc_url', 'flash_version', 'rtmp_live', 'rtmp_conn', 'rtmp_protocol', 'rtmp_real_time'
|
'page_url', 'app', 'play_path', 'tc_url', 'flash_version', 'rtmp_live', 'rtmp_conn', 'rtmp_protocol', 'rtmp_real_time'
|
||||||
|
|
|
@ -4,6 +4,7 @@ from .archiveorg import ArchiveOrgIE
|
||||||
from .common import InfoExtractor
|
from .common import InfoExtractor
|
||||||
from ..utils import (
|
from ..utils import (
|
||||||
InAdvancePagedList,
|
InAdvancePagedList,
|
||||||
|
clean_html,
|
||||||
int_or_none,
|
int_or_none,
|
||||||
orderedSet,
|
orderedSet,
|
||||||
str_to_int,
|
str_to_int,
|
||||||
|
@ -32,13 +33,15 @@ class AltCensoredIE(InfoExtractor):
|
||||||
'duration': 926.09,
|
'duration': 926.09,
|
||||||
'thumbnail': 'https://archive.org/download/youtube-k0srjLSkga8/youtube-k0srjLSkga8.thumbs/k0srjLSkga8_000925.jpg',
|
'thumbnail': 'https://archive.org/download/youtube-k0srjLSkga8/youtube-k0srjLSkga8.thumbs/k0srjLSkga8_000925.jpg',
|
||||||
'view_count': int,
|
'view_count': int,
|
||||||
'categories': ['News & Politics'], # FIXME
|
'categories': ['News & Politics'],
|
||||||
}
|
}
|
||||||
}]
|
}]
|
||||||
|
|
||||||
def _real_extract(self, url):
|
def _real_extract(self, url):
|
||||||
video_id = self._match_id(url)
|
video_id = self._match_id(url)
|
||||||
webpage = self._download_webpage(url, video_id)
|
webpage = self._download_webpage(url, video_id)
|
||||||
|
category = clean_html(self._html_search_regex(
|
||||||
|
r'<a href="/category/\d+">([^<]+)</a>', webpage, 'category', default=None))
|
||||||
|
|
||||||
return {
|
return {
|
||||||
'_type': 'url_transparent',
|
'_type': 'url_transparent',
|
||||||
|
@ -46,9 +49,7 @@ class AltCensoredIE(InfoExtractor):
|
||||||
'ie_key': ArchiveOrgIE.ie_key(),
|
'ie_key': ArchiveOrgIE.ie_key(),
|
||||||
'view_count': str_to_int(self._html_search_regex(
|
'view_count': str_to_int(self._html_search_regex(
|
||||||
r'YouTube Views:(?:\s| )*([\d,]+)', webpage, 'view count', default=None)),
|
r'YouTube Views:(?:\s| )*([\d,]+)', webpage, 'view count', default=None)),
|
||||||
'categories': self._html_search_regex(
|
'categories': [category] if category else None,
|
||||||
r'<a href="/category/\d+">\s*\n?\s*([^<]+)</a>',
|
|
||||||
webpage, 'category', default='').split() or None,
|
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
||||||
|
|
|
@ -142,10 +142,10 @@ class ArteTVIE(ArteTVBaseIE):
|
||||||
def _fix_accessible_subs_locale(subs):
|
def _fix_accessible_subs_locale(subs):
|
||||||
updated_subs = {}
|
updated_subs = {}
|
||||||
for lang, sub_formats in subs.items():
|
for lang, sub_formats in subs.items():
|
||||||
for format in sub_formats:
|
for fmt in sub_formats:
|
||||||
if format.get('url', '').endswith('-MAL.m3u8'):
|
if fmt.get('url', '').endswith('-MAL.m3u8'):
|
||||||
lang += '-acc'
|
lang += '-acc'
|
||||||
updated_subs.setdefault(lang, []).append(format)
|
updated_subs.setdefault(lang, []).append(fmt)
|
||||||
return updated_subs
|
return updated_subs
|
||||||
|
|
||||||
def _real_extract(self, url):
|
def _real_extract(self, url):
|
||||||
|
|
|
@ -160,9 +160,8 @@ class GetCourseRuIE(InfoExtractor):
|
||||||
self._login(hostname, username, password)
|
self._login(hostname, username, password)
|
||||||
|
|
||||||
display_id = self._match_id(url)
|
display_id = self._match_id(url)
|
||||||
# NB: 404 is returned due to yt-dlp not properly following redirects #9020
|
webpage, urlh = self._download_webpage_handle(url, display_id)
|
||||||
webpage, urlh = self._download_webpage_handle(url, display_id, expected_status=404)
|
if self._LOGIN_URL_PATH in urlh.url:
|
||||||
if self._LOGIN_URL_PATH in urlh.url or urlh.status == 404:
|
|
||||||
raise ExtractorError(
|
raise ExtractorError(
|
||||||
f'This video is only available for registered users. {self._login_hint("any", netrc=hostname)}',
|
f'This video is only available for registered users. {self._login_hint("any", netrc=hostname)}',
|
||||||
expected=True)
|
expected=True)
|
||||||
|
|
|
@ -9,7 +9,6 @@ from ..utils import (
|
||||||
int_or_none,
|
int_or_none,
|
||||||
str_or_none,
|
str_or_none,
|
||||||
traverse_obj,
|
traverse_obj,
|
||||||
update_url_query,
|
|
||||||
)
|
)
|
||||||
|
|
||||||
|
|
||||||
|
@ -82,7 +81,7 @@ class MedalTVIE(InfoExtractor):
|
||||||
def _real_extract(self, url):
|
def _real_extract(self, url):
|
||||||
video_id = self._match_id(url)
|
video_id = self._match_id(url)
|
||||||
|
|
||||||
webpage = self._download_webpage(update_url_query(url, {'mobilebypass': 'true'}), video_id)
|
webpage = self._download_webpage(url, video_id, query={'mobilebypass': 'true'})
|
||||||
|
|
||||||
hydration_data = self._search_json(
|
hydration_data = self._search_json(
|
||||||
r'<script[^>]*>[^<]*\bhydrationData\s*=', webpage,
|
r'<script[^>]*>[^<]*\bhydrationData\s*=', webpage,
|
||||||
|
|
|
@ -162,10 +162,8 @@ class RadikoBaseIE(InfoExtractor):
|
||||||
return formats
|
return formats
|
||||||
|
|
||||||
def _extract_performers(self, prog):
|
def _extract_performers(self, prog):
|
||||||
performers = traverse_obj(prog, (
|
return traverse_obj(prog, (
|
||||||
'pfm/text()', ..., {lambda x: re.split(r'[//、 ,,]', x)}, ..., {str.strip}))
|
'pfm/text()', ..., {lambda x: re.split(r'[//、 ,,]', x)}, ..., {str.strip})) or None
|
||||||
# TODO: change 'artist' fields to 'artists' and return traversal list instead of str
|
|
||||||
return ', '.join(performers) or None
|
|
||||||
|
|
||||||
|
|
||||||
class RadikoIE(RadikoBaseIE):
|
class RadikoIE(RadikoBaseIE):
|
||||||
|
@ -194,7 +192,7 @@ class RadikoIE(RadikoBaseIE):
|
||||||
return {
|
return {
|
||||||
'id': video_id,
|
'id': video_id,
|
||||||
'title': try_call(lambda: prog.find('title').text),
|
'title': try_call(lambda: prog.find('title').text),
|
||||||
'artist': self._extract_performers(prog),
|
'cast': self._extract_performers(prog),
|
||||||
'description': clean_html(try_call(lambda: prog.find('info').text)),
|
'description': clean_html(try_call(lambda: prog.find('info').text)),
|
||||||
'uploader': try_call(lambda: station_program.find('.//name').text),
|
'uploader': try_call(lambda: station_program.find('.//name').text),
|
||||||
'uploader_id': station,
|
'uploader_id': station,
|
||||||
|
@ -253,7 +251,7 @@ class RadikoRadioIE(RadikoBaseIE):
|
||||||
return {
|
return {
|
||||||
'id': station,
|
'id': station,
|
||||||
'title': title,
|
'title': title,
|
||||||
'artist': self._extract_performers(prog),
|
'cast': self._extract_performers(prog),
|
||||||
'description': description,
|
'description': description,
|
||||||
'uploader': station_name,
|
'uploader': station_name,
|
||||||
'uploader_id': station,
|
'uploader_id': station,
|
||||||
|
|
|
@ -25,8 +25,8 @@ class SlidesLiveIE(InfoExtractor):
|
||||||
'id': '38902413',
|
'id': '38902413',
|
||||||
'ext': 'mp4',
|
'ext': 'mp4',
|
||||||
'title': 'GCC IA16 backend',
|
'title': 'GCC IA16 backend',
|
||||||
'timestamp': 1648189972,
|
'timestamp': 1697793372,
|
||||||
'upload_date': '20220325',
|
'upload_date': '20231020',
|
||||||
'thumbnail': r're:^https?://.*\.jpg',
|
'thumbnail': r're:^https?://.*\.jpg',
|
||||||
'thumbnails': 'count:42',
|
'thumbnails': 'count:42',
|
||||||
'chapters': 'count:41',
|
'chapters': 'count:41',
|
||||||
|
@ -42,8 +42,8 @@ class SlidesLiveIE(InfoExtractor):
|
||||||
'id': '38935785',
|
'id': '38935785',
|
||||||
'ext': 'mp4',
|
'ext': 'mp4',
|
||||||
'title': 'Offline Reinforcement Learning: From Algorithms to Practical Challenges',
|
'title': 'Offline Reinforcement Learning: From Algorithms to Practical Challenges',
|
||||||
'upload_date': '20211115',
|
'upload_date': '20231020',
|
||||||
'timestamp': 1636996003,
|
'timestamp': 1697807002,
|
||||||
'thumbnail': r're:^https?://.*\.(?:jpg|png)',
|
'thumbnail': r're:^https?://.*\.(?:jpg|png)',
|
||||||
'thumbnails': 'count:640',
|
'thumbnails': 'count:640',
|
||||||
'chapters': 'count:639',
|
'chapters': 'count:639',
|
||||||
|
@ -59,9 +59,9 @@ class SlidesLiveIE(InfoExtractor):
|
||||||
'id': '38973182',
|
'id': '38973182',
|
||||||
'ext': 'mp4',
|
'ext': 'mp4',
|
||||||
'title': 'How Should a Machine Learning Researcher Think About AI Ethics?',
|
'title': 'How Should a Machine Learning Researcher Think About AI Ethics?',
|
||||||
'upload_date': '20220201',
|
'upload_date': '20231020',
|
||||||
'thumbnail': r're:^https?://.*\.jpg',
|
'thumbnail': r're:^https?://.*\.jpg',
|
||||||
'timestamp': 1643728135,
|
'timestamp': 1697822521,
|
||||||
'thumbnails': 'count:3',
|
'thumbnails': 'count:3',
|
||||||
'chapters': 'count:2',
|
'chapters': 'count:2',
|
||||||
'duration': 5889,
|
'duration': 5889,
|
||||||
|
@ -70,37 +70,22 @@ class SlidesLiveIE(InfoExtractor):
|
||||||
'skip_download': 'm3u8',
|
'skip_download': 'm3u8',
|
||||||
},
|
},
|
||||||
}, {
|
}, {
|
||||||
# service_name = youtube, only XML slides info
|
# formerly youtube, converted to native
|
||||||
'url': 'https://slideslive.com/38897546/special-metaprednaska-petra-ludwiga-hodnoty-pro-lepsi-spolecnost',
|
'url': 'https://slideslive.com/38897546/special-metaprednaska-petra-ludwiga-hodnoty-pro-lepsi-spolecnost',
|
||||||
'md5': '8a79b5e3d700837f40bd2afca3c8fa01',
|
'md5': '8a79b5e3d700837f40bd2afca3c8fa01',
|
||||||
'info_dict': {
|
'info_dict': {
|
||||||
'id': 'jmg02wCJD5M',
|
'id': '38897546',
|
||||||
'display_id': '38897546',
|
|
||||||
'ext': 'mp4',
|
'ext': 'mp4',
|
||||||
'title': 'SPECIÁL: Meta-přednáška Petra Ludwiga - Hodnoty pro lepší společnost',
|
'title': 'SPECIÁL: Meta-přednáška Petra Ludwiga - Hodnoty pro lepší společnost',
|
||||||
'description': 'Watch full version of this video at https://slideslive.com/38897546.',
|
'thumbnail': r're:^https?://.*\.jpg',
|
||||||
'channel_url': 'https://www.youtube.com/channel/UCZWdAkNYFncuX0khyvhqnxw',
|
'upload_date': '20231029',
|
||||||
'channel': 'SlidesLive Videos - G1',
|
'timestamp': 1698588144,
|
||||||
'channel_id': 'UCZWdAkNYFncuX0khyvhqnxw',
|
|
||||||
'uploader_id': 'UCZWdAkNYFncuX0khyvhqnxw',
|
|
||||||
'uploader': 'SlidesLive Videos - G1',
|
|
||||||
'uploader_url': 'http://www.youtube.com/channel/UCZWdAkNYFncuX0khyvhqnxw',
|
|
||||||
'live_status': 'not_live',
|
|
||||||
'upload_date': '20160710',
|
|
||||||
'timestamp': 1618786715,
|
|
||||||
'duration': 6827,
|
|
||||||
'like_count': int,
|
|
||||||
'view_count': int,
|
|
||||||
'comment_count': int,
|
|
||||||
'channel_follower_count': int,
|
|
||||||
'age_limit': 0,
|
|
||||||
'thumbnail': r're:^https?://.*\.(?:jpg|webp)',
|
|
||||||
'thumbnails': 'count:169',
|
'thumbnails': 'count:169',
|
||||||
'playable_in_embed': True,
|
|
||||||
'availability': 'unlisted',
|
|
||||||
'tags': [],
|
|
||||||
'categories': ['People & Blogs'],
|
|
||||||
'chapters': 'count:168',
|
'chapters': 'count:168',
|
||||||
|
'duration': 6827,
|
||||||
|
},
|
||||||
|
'params': {
|
||||||
|
'skip_download': 'm3u8',
|
||||||
},
|
},
|
||||||
}, {
|
}, {
|
||||||
# embed-only presentation, only XML slides info
|
# embed-only presentation, only XML slides info
|
||||||
|
@ -111,8 +96,8 @@ class SlidesLiveIE(InfoExtractor):
|
||||||
'title': 'Towards a Deep Network Architecture for Structured Smoothness',
|
'title': 'Towards a Deep Network Architecture for Structured Smoothness',
|
||||||
'thumbnail': r're:^https?://.*\.jpg',
|
'thumbnail': r're:^https?://.*\.jpg',
|
||||||
'thumbnails': 'count:8',
|
'thumbnails': 'count:8',
|
||||||
'timestamp': 1629671508,
|
'timestamp': 1697803109,
|
||||||
'upload_date': '20210822',
|
'upload_date': '20231020',
|
||||||
'chapters': 'count:7',
|
'chapters': 'count:7',
|
||||||
'duration': 326,
|
'duration': 326,
|
||||||
},
|
},
|
||||||
|
@ -128,8 +113,8 @@ class SlidesLiveIE(InfoExtractor):
|
||||||
'title': 'MoReL: Multi-omics Relational Learning',
|
'title': 'MoReL: Multi-omics Relational Learning',
|
||||||
'thumbnail': r're:^https?://.*\.(?:jpg|png)',
|
'thumbnail': r're:^https?://.*\.(?:jpg|png)',
|
||||||
'thumbnails': 'count:7',
|
'thumbnails': 'count:7',
|
||||||
'timestamp': 1654714970,
|
'timestamp': 1697824939,
|
||||||
'upload_date': '20220608',
|
'upload_date': '20231020',
|
||||||
'chapters': 'count:6',
|
'chapters': 'count:6',
|
||||||
'duration': 171,
|
'duration': 171,
|
||||||
},
|
},
|
||||||
|
@ -145,8 +130,8 @@ class SlidesLiveIE(InfoExtractor):
|
||||||
'title': 'Decentralized Attribution of Generative Models',
|
'title': 'Decentralized Attribution of Generative Models',
|
||||||
'thumbnail': r're:^https?://.*\.jpg',
|
'thumbnail': r're:^https?://.*\.jpg',
|
||||||
'thumbnails': 'count:16',
|
'thumbnails': 'count:16',
|
||||||
'timestamp': 1622806321,
|
'timestamp': 1697814901,
|
||||||
'upload_date': '20210604',
|
'upload_date': '20231020',
|
||||||
'chapters': 'count:15',
|
'chapters': 'count:15',
|
||||||
'duration': 306,
|
'duration': 306,
|
||||||
},
|
},
|
||||||
|
@ -162,8 +147,8 @@ class SlidesLiveIE(InfoExtractor):
|
||||||
'title': 'Efficient Active Search for Combinatorial Optimization Problems',
|
'title': 'Efficient Active Search for Combinatorial Optimization Problems',
|
||||||
'thumbnail': r're:^https?://.*\.(?:jpg|png)',
|
'thumbnail': r're:^https?://.*\.(?:jpg|png)',
|
||||||
'thumbnails': 'count:9',
|
'thumbnails': 'count:9',
|
||||||
'timestamp': 1654714896,
|
'timestamp': 1697824757,
|
||||||
'upload_date': '20220608',
|
'upload_date': '20231020',
|
||||||
'chapters': 'count:8',
|
'chapters': 'count:8',
|
||||||
'duration': 295,
|
'duration': 295,
|
||||||
},
|
},
|
||||||
|
@ -177,10 +162,10 @@ class SlidesLiveIE(InfoExtractor):
|
||||||
'id': '38979880',
|
'id': '38979880',
|
||||||
'ext': 'mp4',
|
'ext': 'mp4',
|
||||||
'title': 'The Representation Power of Neural Networks',
|
'title': 'The Representation Power of Neural Networks',
|
||||||
'timestamp': 1654714962,
|
'timestamp': 1697824919,
|
||||||
'thumbnail': r're:^https?://.*\.(?:jpg|png)',
|
'thumbnail': r're:^https?://.*\.(?:jpg|png)',
|
||||||
'thumbnails': 'count:22',
|
'thumbnails': 'count:22',
|
||||||
'upload_date': '20220608',
|
'upload_date': '20231020',
|
||||||
'chapters': 'count:21',
|
'chapters': 'count:21',
|
||||||
'duration': 294,
|
'duration': 294,
|
||||||
},
|
},
|
||||||
|
@ -200,10 +185,10 @@ class SlidesLiveIE(InfoExtractor):
|
||||||
'id': '38979682',
|
'id': '38979682',
|
||||||
'ext': 'mp4',
|
'ext': 'mp4',
|
||||||
'title': 'LoRA: Low-Rank Adaptation of Large Language Models',
|
'title': 'LoRA: Low-Rank Adaptation of Large Language Models',
|
||||||
'timestamp': 1654714920,
|
'timestamp': 1697824815,
|
||||||
'thumbnail': r're:^https?://.*\.(?:jpg|png)',
|
'thumbnail': r're:^https?://.*\.(?:jpg|png)',
|
||||||
'thumbnails': 'count:30',
|
'thumbnails': 'count:30',
|
||||||
'upload_date': '20220608',
|
'upload_date': '20231020',
|
||||||
'chapters': 'count:31',
|
'chapters': 'count:31',
|
||||||
'duration': 272,
|
'duration': 272,
|
||||||
},
|
},
|
||||||
|
@ -213,8 +198,8 @@ class SlidesLiveIE(InfoExtractor):
|
||||||
'ext': 'mp4',
|
'ext': 'mp4',
|
||||||
'title': 'LoRA: Low-Rank Adaptation of Large Language Models - Slide 021',
|
'title': 'LoRA: Low-Rank Adaptation of Large Language Models - Slide 021',
|
||||||
'duration': 3,
|
'duration': 3,
|
||||||
'timestamp': 1654714920,
|
'timestamp': 1697824815,
|
||||||
'upload_date': '20220608',
|
'upload_date': '20231020',
|
||||||
},
|
},
|
||||||
}, {
|
}, {
|
||||||
'info_dict': {
|
'info_dict': {
|
||||||
|
@ -222,8 +207,8 @@ class SlidesLiveIE(InfoExtractor):
|
||||||
'ext': 'mp4',
|
'ext': 'mp4',
|
||||||
'title': 'LoRA: Low-Rank Adaptation of Large Language Models - Slide 024',
|
'title': 'LoRA: Low-Rank Adaptation of Large Language Models - Slide 024',
|
||||||
'duration': 4,
|
'duration': 4,
|
||||||
'timestamp': 1654714920,
|
'timestamp': 1697824815,
|
||||||
'upload_date': '20220608',
|
'upload_date': '20231020',
|
||||||
},
|
},
|
||||||
}],
|
}],
|
||||||
'params': {
|
'params': {
|
||||||
|
@ -242,10 +227,10 @@ class SlidesLiveIE(InfoExtractor):
|
||||||
'id': '38979481',
|
'id': '38979481',
|
||||||
'ext': 'mp4',
|
'ext': 'mp4',
|
||||||
'title': 'How to Train Your MAML to Excel in Few-Shot Classification',
|
'title': 'How to Train Your MAML to Excel in Few-Shot Classification',
|
||||||
'timestamp': 1654714877,
|
'timestamp': 1697824716,
|
||||||
'thumbnail': r're:^https?://.*\.(?:jpg|png)',
|
'thumbnail': r're:^https?://.*\.(?:jpg|png)',
|
||||||
'thumbnails': 'count:43',
|
'thumbnails': 'count:43',
|
||||||
'upload_date': '20220608',
|
'upload_date': '20231020',
|
||||||
'chapters': 'count:43',
|
'chapters': 'count:43',
|
||||||
'duration': 315,
|
'duration': 315,
|
||||||
},
|
},
|
||||||
|
@ -255,8 +240,8 @@ class SlidesLiveIE(InfoExtractor):
|
||||||
'ext': 'mp4',
|
'ext': 'mp4',
|
||||||
'title': 'How to Train Your MAML to Excel in Few-Shot Classification - Slide 013',
|
'title': 'How to Train Your MAML to Excel in Few-Shot Classification - Slide 013',
|
||||||
'duration': 3,
|
'duration': 3,
|
||||||
'timestamp': 1654714877,
|
'timestamp': 1697824716,
|
||||||
'upload_date': '20220608',
|
'upload_date': '20231020',
|
||||||
},
|
},
|
||||||
}],
|
}],
|
||||||
'params': {
|
'params': {
|
||||||
|
@ -275,10 +260,10 @@ class SlidesLiveIE(InfoExtractor):
|
||||||
'channel_id': 'UC62SdArr41t_-_fX40QCLRw',
|
'channel_id': 'UC62SdArr41t_-_fX40QCLRw',
|
||||||
'channel_url': 'https://www.youtube.com/channel/UC62SdArr41t_-_fX40QCLRw',
|
'channel_url': 'https://www.youtube.com/channel/UC62SdArr41t_-_fX40QCLRw',
|
||||||
'uploader': 'SlidesLive Videos - A',
|
'uploader': 'SlidesLive Videos - A',
|
||||||
'uploader_id': 'UC62SdArr41t_-_fX40QCLRw',
|
'uploader_id': '@slideslivevideos-a6075',
|
||||||
'uploader_url': 'http://www.youtube.com/channel/UC62SdArr41t_-_fX40QCLRw',
|
'uploader_url': 'https://www.youtube.com/@slideslivevideos-a6075',
|
||||||
'upload_date': '20200903',
|
'upload_date': '20200903',
|
||||||
'timestamp': 1602599092,
|
'timestamp': 1697805922,
|
||||||
'duration': 942,
|
'duration': 942,
|
||||||
'age_limit': 0,
|
'age_limit': 0,
|
||||||
'live_status': 'not_live',
|
'live_status': 'not_live',
|
||||||
|
@ -303,8 +288,8 @@ class SlidesLiveIE(InfoExtractor):
|
||||||
'id': '38983994',
|
'id': '38983994',
|
||||||
'ext': 'mp4',
|
'ext': 'mp4',
|
||||||
'title': 'Zero-Shot AutoML with Pretrained Models',
|
'title': 'Zero-Shot AutoML with Pretrained Models',
|
||||||
'timestamp': 1662384834,
|
'timestamp': 1697826708,
|
||||||
'upload_date': '20220905',
|
'upload_date': '20231020',
|
||||||
'thumbnail': r're:^https?://.*\.(?:jpg|png)',
|
'thumbnail': r're:^https?://.*\.(?:jpg|png)',
|
||||||
'thumbnails': 'count:23',
|
'thumbnails': 'count:23',
|
||||||
'chapters': 'count:22',
|
'chapters': 'count:22',
|
||||||
|
@ -336,8 +321,8 @@ class SlidesLiveIE(InfoExtractor):
|
||||||
'title': 'Towards a Deep Network Architecture for Structured Smoothness',
|
'title': 'Towards a Deep Network Architecture for Structured Smoothness',
|
||||||
'thumbnail': r're:^https?://.*\.jpg',
|
'thumbnail': r're:^https?://.*\.jpg',
|
||||||
'thumbnails': 'count:8',
|
'thumbnails': 'count:8',
|
||||||
'timestamp': 1629671508,
|
'timestamp': 1697803109,
|
||||||
'upload_date': '20210822',
|
'upload_date': '20231020',
|
||||||
'chapters': 'count:7',
|
'chapters': 'count:7',
|
||||||
'duration': 326,
|
'duration': 326,
|
||||||
},
|
},
|
||||||
|
|
|
@ -190,10 +190,9 @@ class TwitchBaseIE(InfoExtractor):
|
||||||
'url': thumbnail,
|
'url': thumbnail,
|
||||||
}] if thumbnail else None
|
}] if thumbnail else None
|
||||||
|
|
||||||
def _extract_twitch_m3u8_formats(self, video_id, token, signature):
|
def _extract_twitch_m3u8_formats(self, path, video_id, token, signature):
|
||||||
"""Subclasses must define _M3U8_PATH"""
|
|
||||||
return self._extract_m3u8_formats(
|
return self._extract_m3u8_formats(
|
||||||
f'{self._USHER_BASE}/{self._M3U8_PATH}/{video_id}.m3u8', video_id, 'mp4', query={
|
f'{self._USHER_BASE}/{path}/{video_id}.m3u8', video_id, 'mp4', query={
|
||||||
'allow_source': 'true',
|
'allow_source': 'true',
|
||||||
'allow_audio_only': 'true',
|
'allow_audio_only': 'true',
|
||||||
'allow_spectre': 'true',
|
'allow_spectre': 'true',
|
||||||
|
@ -216,7 +215,6 @@ class TwitchVodIE(TwitchBaseIE):
|
||||||
)
|
)
|
||||||
(?P<id>\d+)
|
(?P<id>\d+)
|
||||||
'''
|
'''
|
||||||
_M3U8_PATH = 'vod'
|
|
||||||
|
|
||||||
_TESTS = [{
|
_TESTS = [{
|
||||||
'url': 'http://www.twitch.tv/riotgames/v/6528877?t=5m10s',
|
'url': 'http://www.twitch.tv/riotgames/v/6528877?t=5m10s',
|
||||||
|
@ -547,7 +545,7 @@ class TwitchVodIE(TwitchBaseIE):
|
||||||
access_token = self._download_access_token(vod_id, 'video', 'id')
|
access_token = self._download_access_token(vod_id, 'video', 'id')
|
||||||
|
|
||||||
formats = self._extract_twitch_m3u8_formats(
|
formats = self._extract_twitch_m3u8_formats(
|
||||||
vod_id, access_token['value'], access_token['signature'])
|
'vod', vod_id, access_token['value'], access_token['signature'])
|
||||||
formats.extend(self._extract_storyboard(vod_id, video.get('storyboard'), info.get('duration')))
|
formats.extend(self._extract_storyboard(vod_id, video.get('storyboard'), info.get('duration')))
|
||||||
|
|
||||||
self._prefer_source(formats)
|
self._prefer_source(formats)
|
||||||
|
@ -926,7 +924,6 @@ class TwitchStreamIE(TwitchBaseIE):
|
||||||
)
|
)
|
||||||
(?P<id>[^/#?]+)
|
(?P<id>[^/#?]+)
|
||||||
'''
|
'''
|
||||||
_M3U8_PATH = 'api/channel/hls'
|
|
||||||
|
|
||||||
_TESTS = [{
|
_TESTS = [{
|
||||||
'url': 'http://www.twitch.tv/shroomztv',
|
'url': 'http://www.twitch.tv/shroomztv',
|
||||||
|
@ -1032,7 +1029,7 @@ class TwitchStreamIE(TwitchBaseIE):
|
||||||
|
|
||||||
stream_id = stream.get('id') or channel_name
|
stream_id = stream.get('id') or channel_name
|
||||||
formats = self._extract_twitch_m3u8_formats(
|
formats = self._extract_twitch_m3u8_formats(
|
||||||
channel_name, access_token['value'], access_token['signature'])
|
'api/channel/hls', channel_name, access_token['value'], access_token['signature'])
|
||||||
self._prefer_source(formats)
|
self._prefer_source(formats)
|
||||||
|
|
||||||
view_count = stream.get('viewers')
|
view_count = stream.get('viewers')
|
||||||
|
|
|
@ -43,7 +43,7 @@ class Vbox7IE(InfoExtractor):
|
||||||
'uploader': 'svideteliat_ot_varshava',
|
'uploader': 'svideteliat_ot_varshava',
|
||||||
'view_count': int,
|
'view_count': int,
|
||||||
'timestamp': 1360215023,
|
'timestamp': 1360215023,
|
||||||
'thumbnail': 'https://i49.vbox7.com/design/iconci/png/noimg6.png',
|
'thumbnail': 'https://i49.vbox7.com/o/249/249bb972c20.jpg',
|
||||||
'description': 'Смях! Чудо - чист за секунди - Скрита камера',
|
'description': 'Смях! Чудо - чист за секунди - Скрита камера',
|
||||||
'upload_date': '20130207',
|
'upload_date': '20130207',
|
||||||
'duration': 83,
|
'duration': 83,
|
||||||
|
|
|
@ -10,14 +10,14 @@ import urllib.request
|
||||||
import zlib
|
import zlib
|
||||||
|
|
||||||
from ._utils import Popen, decode_base_n, preferredencoding
|
from ._utils import Popen, decode_base_n, preferredencoding
|
||||||
from .networking import escape_rfc3986 # noqa: F401
|
|
||||||
from .networking import normalize_url as escape_url # noqa: F401
|
|
||||||
from .traversal import traverse_obj
|
from .traversal import traverse_obj
|
||||||
from ..dependencies import certifi, websockets
|
from ..dependencies import certifi, websockets
|
||||||
from ..networking._helper import make_ssl_context
|
from ..networking._helper import make_ssl_context
|
||||||
from ..networking._urllib import HTTPHandler
|
from ..networking._urllib import HTTPHandler
|
||||||
|
|
||||||
# isort: split
|
# isort: split
|
||||||
|
from .networking import escape_rfc3986 # noqa: F401
|
||||||
|
from .networking import normalize_url as escape_url # noqa: F401
|
||||||
from .networking import random_user_agent, std_headers # noqa: F401
|
from .networking import random_user_agent, std_headers # noqa: F401
|
||||||
from ..cookies import YoutubeDLCookieJar # noqa: F401
|
from ..cookies import YoutubeDLCookieJar # noqa: F401
|
||||||
from ..networking._urllib import PUTRequest # noqa: F401
|
from ..networking._urllib import PUTRequest # noqa: F401
|
||||||
|
|
|
@ -78,7 +78,7 @@ class _MatchChildParser(_MatchParser):
|
||||||
class ParseError(Exception):
|
class ParseError(Exception):
|
||||||
def __init__(self, parser):
|
def __init__(self, parser):
|
||||||
super().__init__("Parse error at position %u (near %r)" % (
|
super().__init__("Parse error at position %u (near %r)" % (
|
||||||
parser._pos, parser._data[parser._pos:parser._pos + 20]
|
parser._pos, parser._data[parser._pos:parser._pos + 100]
|
||||||
))
|
))
|
||||||
|
|
||||||
|
|
||||||
|
|
Loading…
Add table
Reference in a new issue