import asyncio from typing import OrderedDict import m3u8 import os import re import requests import shutil import subprocess import tempfile from os import path from pathlib import Path from urllib.parse import urlparse, urlencode from twitchdl import twitch, utils from twitchdl.download import download_file from twitchdl.exceptions import ConsoleError from twitchdl.http import download_all from twitchdl.output import print_out def _parse_playlists(playlists_m3u8): playlists = m3u8.loads(playlists_m3u8) for p in sorted(playlists.playlists, key=lambda p: p.stream_info.resolution is None): if p.stream_info.resolution: name = p.media[0].name description = "x".join(str(r) for r in p.stream_info.resolution) else: name = p.media[0].group_id description = None yield name, description, p.uri def _get_playlist_by_name(playlists, quality): if quality == "source": _, _, uri = playlists[0] return uri for name, _, uri in playlists: if name == quality: return uri available = ", ".join([name for (name, _, _) in playlists]) msg = "Quality '{}' not found. Available qualities are: {}".format(quality, available) raise ConsoleError(msg) def _select_playlist_interactive(playlists): print_out("\nAvailable qualities:") for n, (name, resolution, uri) in enumerate(playlists): if resolution: print_out("{}) {} [{}]".format(n + 1, name, resolution)) else: print_out("{}) {}".format(n + 1, name)) no = utils.read_int("Choose quality", min=1, max=len(playlists) + 1, default=1) _, _, uri = playlists[no - 1] return uri def _join_vods(playlist_path, target, overwrite, video): command = [ "ffmpeg", "-i", playlist_path, "-c", "copy", "-metadata", "artist={}".format(video["creator"]["displayName"]), "-metadata", "title={}".format(video["title"]), "-metadata", "encoded_by=twitch-dl", "-stats", "-loglevel", "warning", "file:{}".format(target), ] if overwrite: command.append("-y") print_out("{}".format(" ".join(command))) result = subprocess.run(command) if result.returncode != 0: raise ConsoleError("Joining files failed") def _video_target_filename(video, args): date, time = video['publishedAt'].split("T") game = video["game"]["name"] if video["game"] else "Unknown" subs = { "channel": video["creator"]["displayName"], "channel_login": video["creator"]["login"], "date": date, "datetime": video["publishedAt"], "format": args.format, "game": game, "game_slug": utils.slugify(game), "id": video["id"], "time": time, "title": utils.titlify(video["title"]), "title_slug": utils.slugify(video["title"]), } try: return args.output.format(**subs) except KeyError as e: supported = ", ".join(subs.keys()) raise ConsoleError("Invalid key {} used in --output. Supported keys are: {}".format(e, supported)) def _clip_target_filename(clip, args): date, time = clip["createdAt"].split("T") game = clip["game"]["name"] if clip["game"] else "Unknown" url = clip["videoQualities"][0]["sourceURL"] _, ext = path.splitext(url) ext = ext.lstrip(".") subs = { "channel": clip["broadcaster"]["displayName"], "channel_login": clip["broadcaster"]["login"], "date": date, "datetime": clip["createdAt"], "format": ext, "game": game, "game_slug": utils.slugify(game), "id": clip["id"], "slug": clip["slug"], "time": time, "title": utils.titlify(clip["title"]), "title_slug": utils.slugify(clip["title"]), } try: return args.output.format(**subs) except KeyError as e: supported = ", ".join(subs.keys()) raise ConsoleError("Invalid key {} used in --output. Supported keys are: {}".format(e, supported)) def _get_vod_paths(playlist, start, end): """Extract unique VOD paths for download from playlist.""" files = [] vod_start = 0 for segment in playlist.segments: vod_end = vod_start + segment.duration # `vod_end > start` is used here becuase it's better to download a bit # more than a bit less, similar for the end condition start_condition = not start or vod_end > start end_condition = not end or vod_start < end if start_condition and end_condition and segment.uri not in files: files.append(segment.uri) vod_start = vod_end return files def _crete_temp_dir(base_uri): """Create a temp dir to store downloads if it doesn't exist.""" path = urlparse(base_uri).path.lstrip("/") temp_dir = Path(tempfile.gettempdir(), "twitch-dl", path) temp_dir.mkdir(parents=True, exist_ok=True) return str(temp_dir) def download(args): video_id = utils.parse_video_identifier(args.video) if video_id: return _download_video(video_id, args) clip_slug = utils.parse_clip_identifier(args.video) if clip_slug: return _download_clip(clip_slug, args) raise ConsoleError("Invalid input: {}".format(args.video)) def _get_clip_url(clip, quality): qualities = clip["videoQualities"] # Quality given as an argument if quality: if quality == "source": return qualities[0]["sourceURL"] selected_quality = quality.rstrip("p") # allow 720p as well as 720 for q in qualities: if q["quality"] == selected_quality: return q["sourceURL"] available = ", ".join([str(q["quality"]) for q in qualities]) msg = "Quality '{}' not found. Available qualities are: {}".format(quality, available) raise ConsoleError(msg) # Ask user to select quality print_out("\nAvailable qualities:") for n, q in enumerate(qualities): print_out("{}) {} [{} fps]".format(n + 1, q["quality"], q["frameRate"])) print_out() no = utils.read_int("Choose quality", min=1, max=len(qualities), default=1) selected_quality = qualities[no - 1] return selected_quality["sourceURL"] def get_clip_authenticated_url(slug, quality): print_out("Fetching access token...") access_token = twitch.get_clip_access_token(slug) if not access_token: raise ConsoleError("Access token not found for slug '{}'".format(slug)) url = _get_clip_url(access_token, quality) query = urlencode({ "sig": access_token["playbackAccessToken"]["signature"], "token": access_token["playbackAccessToken"]["value"], }) return "{}?{}".format(url, query) def _download_clip(slug, args): print_out("Looking up clip...") clip = twitch.get_clip(slug) game = clip["game"]["name"] if clip["game"] else "Unknown" if not clip: raise ConsoleError("Clip '{}' not found".format(slug)) print_out("Found: {} by {}, playing {} ({})".format( clip["title"], clip["broadcaster"]["displayName"], game, utils.format_duration(clip["durationSeconds"]) )) target = _clip_target_filename(clip, args) print_out("Target: {}".format(target)) if not args.overwrite and path.exists(target): response = input("File exists. Overwrite? [Y/n]: ") if response.lower().strip() not in ["", "y"]: raise ConsoleError("Aborted") args.overwrite = True url = get_clip_authenticated_url(slug, args.quality) print_out("Selected URL: {}".format(url)) print_out("Downloading clip...") download_file(url, target) print_out("Downloaded: {}".format(target)) def _download_video(video_id, args): if args.start and args.end and args.end <= args.start: raise ConsoleError("End time must be greater than start time") print_out("Looking up video...") video = twitch.get_video(video_id) if not video: raise ConsoleError("Video {} not found".format(video_id)) print_out("Found: {} by {}".format( video['title'], video['creator']['displayName'])) target = _video_target_filename(video, args) print_out("Output: {}".format(target)) if not args.overwrite and path.exists(target): response = input("File exists. Overwrite? [Y/n]: ") if response.lower().strip() not in ["", "y"]: raise ConsoleError("Aborted") args.overwrite = True print_out("Fetching access token...") access_token = twitch.get_access_token(video_id, auth_token=args.auth_token) print_out("Fetching playlists...") playlists_m3u8 = twitch.get_playlists(video_id, access_token) playlists = list(_parse_playlists(playlists_m3u8)) playlist_uri = (_get_playlist_by_name(playlists, args.quality) if args.quality else _select_playlist_interactive(playlists)) print_out("Fetching playlist...") response = requests.get(playlist_uri) response.raise_for_status() playlist = m3u8.loads(response.text) base_uri = re.sub("/[^/]+$", "/", playlist_uri) target_dir = _crete_temp_dir(base_uri) vod_paths = _get_vod_paths(playlist, args.start, args.end) # Save playlists for debugging purposes with open(path.join(target_dir, "playlists.m3u8"), "w") as f: f.write(playlists_m3u8) with open(path.join(target_dir, "playlist.m3u8"), "w") as f: f.write(response.text) print_out("\nDownloading {} VODs using {} workers to {}".format( len(vod_paths), args.max_workers, target_dir)) sources = [base_uri + path for path in vod_paths] targets = [os.path.join(target_dir, "{:05d}.ts".format(k)) for k, _ in enumerate(vod_paths)] asyncio.run(download_all(sources, targets, args.max_workers, rate_limit=args.rate_limit)) # Make a modified playlist which references downloaded VODs # Keep only the downloaded segments and skip the rest org_segments = playlist.segments.copy() path_map = OrderedDict(zip(vod_paths, targets)) playlist.segments.clear() for segment in org_segments: if segment.uri in path_map: segment.uri = path_map[segment.uri] playlist.segments.append(segment) playlist_path = path.join(target_dir, "playlist_downloaded.m3u8") playlist.dump(playlist_path) if args.no_join: print_out("\n\nSkipping joining files...") print_out("VODs downloaded to:\n{}".format(target_dir)) return print_out("\n\nJoining files...") _join_vods(playlist_path, target, args.overwrite, video) if args.keep: print_out("\nTemporary files not deleted: {}".format(target_dir)) else: print_out("\nDeleting temporary files...") shutil.rmtree(target_dir) print_out("\nDownloaded: {}".format(target))