import os
import shutil
import subprocess
import sys
import threading
import time
import shlex
from xml.dom.minidom import parse, parseString

from instagram_private_api import ClientConnectionError
from instagram_private_api import ClientError
from instagram_private_api import ClientThrottledError
from instagram_private_api_extensions import live
from instagram_private_api_extensions import replay

from .comments import CommentsDownloader
from .logger import log
from .logger import seperator


def main(instagram_api_arg, download_arg, settings_arg):
    """Store the shared state in module globals and start the user lookup.

    Args:
        instagram_api_arg: API client; stored as the global ``instagram_api``.
        download_arg: Username to download from; stored as ``user_to_download``.
        settings_arg: Settings object; stored as the global ``settings``.
    """
    global instagram_api
    global user_to_download
    global broadcast
    global settings
    settings = settings_arg
    instagram_api = instagram_api_arg
    user_to_download = download_arg
    get_user_info(user_to_download)


def _is_enabled(value):
    """Return True when a settings value spells "true" in any letter case."""
    return str(value).title() == "True"


def _remove_lock_file(folder):
    """Delete ``folder.lock`` inside *folder*; best effort, failures are ignored."""
    if not folder:
        return
    try:
        os.remove(os.path.join(folder, 'folder.lock'))
    except OSError:
        pass


def _start_hook_command(command):
    """Run a configured hook command on a daemon thread, if one is configured.

    The settings value "None" (a string) means no command is configured, so
    it is compared by equality; an identity test against a literal does not
    reliably detect it.
    """
    if not command or command == "None":
        return
    try:
        thread = threading.Thread(target=run_command, args=(command,))
        thread.daemon = True
        thread.start()
        log("[I] Command executed: \033[94m{:s}".format(command), "GREEN")
    except Exception as e:
        log('[W] Could not execute command: {:s}'.format(str(e)), "YELLOW")


def _log_download_summary(headline, broadcast):
    """Log *headline* followed by the download, stream and missing durations."""
    download_started = int(settings.current_time)
    log('{}\n[I] Download duration : {}\n[I] Stream duration : {}\n[I] Missing (approx.) : {}'.format(
        headline,
        get_stream_duration(download_started),
        get_stream_duration(broadcast.get('published_time')),
        get_stream_duration(download_started, broadcast)), "YELLOW")


def _log_comment_save_result(is_single, total_comments, comment_errors):
    """Log the outcome of writing the comments logfile, then a separator."""
    if is_single:
        log("[I] Successfully saved 1 comment to logfile.", "GREEN")
    elif comment_errors:
        log("[W] Successfully saved {:s} comments to logfile but {:s} comments are (partially) missing.".format(
            str(total_comments), str(comment_errors)), "YELLOW")
    else:
        log("[I] Successfully saved {:s} comments to logfile.".format(str(total_comments)), "GREEN")
    seperator("GREEN")


def run_command(command):
    """Start *command* as a detached subprocess with its output discarded.

    The command string is split with ``shlex.split`` and started without
    waiting for it to finish. Failures are logged as a warning rather than
    raised, because this runs on a background thread.
    """
    try:
        # The child keeps its own copy of the handle, so ours can be closed
        # as soon as Popen returns.
        with open(os.devnull, 'w') as devnull:
            subprocess.Popen(shlex.split(command), stdout=devnull, stderr=subprocess.STDOUT)
    except Exception as e:
        log('[W] Could not execute command: {:s}'.format(str(e)), "YELLOW")


def get_stream_duration(compare_time, broadcast=None):
    """Return a human-readable duration measured from *compare_time* until now.

    Args:
        compare_time: Start timestamp in seconds (anything ``int()`` accepts).
        broadcast: Optional broadcast dict. When given, the result is the time
            between the broadcast's ``published_time`` and *compare_time*,
            i.e. the stream time minus the time elapsed since *compare_time*.

    Returns:
        A string such as ``"3 minutes and 12 seconds"``. " (corrected)" is
        appended when *compare_time* lies in the future and was shifted back
        by 5 seconds. ``"Not available"`` is returned on any error.
    """
    try:
        # Read the clock once so every term refers to the same instant.
        now = int(time.time())
        reference = int(compare_time)
        had_wrong_time = now < reference
        if had_wrong_time:
            reference -= 5
        elapsed = now - reference
        if broadcast:
            stream_time = now - int(broadcast.get('published_time'))
            elapsed = stream_time - elapsed
        minutes, seconds = divmod(elapsed, 60)
        stream_duration_str = '%d minutes' % minutes
        if seconds:
            stream_duration_str += ' and %d seconds' % seconds
        if had_wrong_time:
            return "{:s} (corrected)".format(stream_duration_str)
        return stream_duration_str
    except Exception:
        return "Not available"


def download_livestream(broadcast):
    """Download a running livestream and stitch it into a video afterwards.

    Exits the process with status 1 when the downloader cannot be created.
    CTRL+C stops the download and stitches whatever was downloaded so far.

    Args:
        broadcast: Broadcast dict of the livestream to download.
    """
    def print_status(sep=True):
        """Log viewers, airing time and status; return True once the stream is over."""
        heartbeat_info = instagram_api.broadcast_heartbeat_and_viewercount(broadcast.get('id'))
        viewers = broadcast.get('viewer_count', 0)
        if sep:
            seperator("GREEN")
        log('[I] Viewers : {:s} watching'.format(str(int(viewers))), "GREEN")
        log('[I] Airing time : {:s}'.format(get_stream_duration(broadcast.get('published_time'))), "GREEN")
        log('[I] Status : {:s}'.format(heartbeat_info.get('broadcast_status').title()), "GREEN")
        return heartbeat_info.get('broadcast_status') not in ['active', 'interrupted']

    try:
        mpd_url = (broadcast.get('dash_manifest')
                   or broadcast.get('dash_abr_playback_url')
                   or broadcast.get('dash_playback_url'))
        output_dir = '{}{}_{}_{}_{}_live_downloads'.format(
            settings.save_path, settings.current_date, user_to_download,
            broadcast.get('id'), settings.current_time)
        broadcast_downloader = live.Downloader(
            mpd=mpd_url,
            output_dir=output_dir,
            user_agent=instagram_api.user_agent,
            max_connection_error_retry=3,
            duplicate_etag_retry=30,
            callback_check=print_status,
            mpd_download_timeout=3,
            download_timeout=3)
    except Exception as e:
        log('[E] Could not start downloading livestream: {:s}'.format(str(e)), "RED")
        seperator("GREEN")
        sys.exit(1)

    # Bound before the try so the CTRL+C handler can always reference it,
    # even when the interrupt arrives before the comment thread is created.
    comment_thread_worker = None
    try:
        log('[I] Livestream found, beginning download...', "GREEN")
        broadcast_owner = (broadcast.get('broadcast_owner') or {}).get('username')
        try:
            broadcast_guest = (broadcast.get('cobroadcasters') or [])[0].get('username')
        except (IndexError, KeyError, TypeError, AttributeError):
            broadcast_guest = None
        if broadcast_owner != user_to_download:
            log('[I] This livestream is a dual-live, the owner is "{}".'.format(broadcast_owner), "BLUE")
            broadcast_guest = None
        if broadcast_guest:
            log('[I] This livestream is a dual-live, the current guest is "{}".'.format(broadcast_guest), "BLUE")
        seperator("GREEN")
        log('[I] Username : {:s}'.format(user_to_download), "GREEN")
        print_status(False)
        log('[I] MPD URL : {:s}'.format(mpd_url), "GREEN")
        seperator("GREEN")
        open(os.path.join(output_dir, 'folder.lock'), 'a').close()
        log('[I] Downloading livestream... press [CTRL+C] to abort.', "GREEN")

        _start_hook_command(settings.run_at_start)

        if _is_enabled(settings.save_comments):
            try:
                comments_json_file = os.path.join(
                    output_dir,
                    '{}_{}_{}_{}_live_comments.json'.format(
                        settings.current_date, user_to_download,
                        broadcast.get('id'), settings.current_time))
                comment_thread_worker = threading.Thread(
                    target=get_live_comments,
                    args=(instagram_api, broadcast, comments_json_file, broadcast_downloader,))
                comment_thread_worker.start()
            except Exception as e:
                log('[E] An error occurred while downloading comments: {:s}'.format(str(e)), "RED")

        broadcast_downloader.run()
        seperator("GREEN")
        _log_download_summary('[I] The livestream has ended.', broadcast)
        seperator("GREEN")
        stitch_video(broadcast_downloader, broadcast, comment_thread_worker)
    except KeyboardInterrupt:
        seperator("GREEN")
        _log_download_summary('[I] The download has been aborted by the user.', broadcast)
        seperator("GREEN")
        if not broadcast_downloader.is_aborted:
            broadcast_downloader.stop()
            stitch_video(broadcast_downloader, broadcast, comment_thread_worker)
    except Exception as e:
        log("[E] Could not download livestream: {:s}".format(str(e)), "RED")
        _remove_lock_file(output_dir)


def stitch_video(broadcast_downloader, broadcast, comment_thread_worker):
    """Stitch the downloaded livestream segments into one mp4 and exit.

    Waits for the comment thread (if still alive), runs the configured
    ``run_at_finish`` command, stitches the video, removes the lock file and
    optionally the temp folder. Always ends the process: status 0 on success
    or CTRL+C, status 1 when stitching fails.

    Args:
        broadcast_downloader: The live downloader whose ``stitch`` is called.
        broadcast: Broadcast dict; its ``id`` is part of the output file name.
        comment_thread_worker: Comment download thread, or None.
    """
    # Derive both paths from one base name rather than splitting the video
    # path on '.mp4', which breaks when the save path itself contains '.mp4'.
    live_base_name = '{}{}_{}_{}_{}_live'.format(
        settings.save_path, settings.current_date, user_to_download,
        broadcast.get('id'), settings.current_time)
    live_mp4_file = live_base_name + '.mp4'
    live_folder_path = live_base_name + '_downloads'
    try:
        if comment_thread_worker and comment_thread_worker.is_alive():
            log("[I] Waiting for comment downloader to end cycle...", "GREEN")
            comment_thread_worker.join()

        _start_hook_command(settings.run_at_finish)

        log('[I] Stitching downloaded files into video...', "GREEN")
        clear_temp_files = _is_enabled(settings.clear_temp_files)
        try:
            broadcast_downloader.stitch(live_mp4_file, cleartempfiles=clear_temp_files)
        except ValueError as e:
            log('[E] Could not stitch downloaded files: {:s}\n[E] Likely the download duration was too short and no temp files were saved.'.format(str(e)), "RED")
            seperator("GREEN")
            _remove_lock_file(live_folder_path)
            sys.exit(1)
        except Exception as e:
            log('[E] Could not stitch downloaded files: {:s}'.format(str(e)), "RED")
            seperator("GREEN")
            _remove_lock_file(live_folder_path)
            sys.exit(1)
        else:
            log('[I] Successfully stitched downloaded files into video.', "GREEN")
            _remove_lock_file(live_folder_path)
            if clear_temp_files:
                try:
                    shutil.rmtree(live_folder_path)
                except Exception as e:
                    log("[E] Could not remove temp folder: {:s}".format(str(e)), "RED")
            seperator("GREEN")
            sys.exit(0)
    except KeyboardInterrupt:
        log('[I] Aborted stitching process, no video was created.', "YELLOW")
        seperator("GREEN")
        _remove_lock_file(live_folder_path)
        sys.exit(0)


def get_user_info(user_to_download):
    """Resolve *user_to_download* to a user id and check it for broadcasts.

    Any failure is logged and ends the process (status 1 on errors, status 0
    on CTRL+C).

    Args:
        user_to_download: Username to look up.
    """
    try:
        user_res = instagram_api.username_info(user_to_download)
        user_id = user_res.get('user', {}).get('pk')
    except ClientConnectionError as cce:
        log('[E] Could not get user info for "{:s}": {:d} {:s}'.format(user_to_download, cce.code, str(cce)), "RED")
        if "getaddrinfo failed" in str(cce):
            log('[E] Could not resolve host, check your internet connection.', "RED")
        if "timed out" in str(cce):
            log('[E] The connection timed out, check your internet connection.', "RED")
        seperator("GREEN")
        sys.exit(1)
    except ClientThrottledError as cte:
        log('[E] Could not get user info for "{:s}": {:d} {:s}\n[E] You are making too many requests at this time.'.format(user_to_download, cte.code, str(cte)), "RED")
        seperator("GREEN")
        sys.exit(1)
    except ClientError as ce:
        log('[E] Could not get user info for "{:s}": {:d} {:s}'.format(user_to_download, ce.code, str(ce)), "RED")
        if "Not Found" in str(ce):
            log('[E] The specified user does not exist.', "RED")
        seperator("GREEN")
        sys.exit(1)
    except Exception as e:
        log('[E] Could not get user info for "{:s}": {:s}'.format(user_to_download, str(e)), "RED")
        seperator("GREEN")
        sys.exit(1)
    except KeyboardInterrupt:
        log('[W] Aborted getting user info for "{:s}", exiting...'.format(user_to_download), "YELLOW")
        seperator("GREEN")
        sys.exit(0)
    log('[I] Getting info for "{:s}" successful.'.format(user_to_download), "GREEN")
    get_broadcasts_info(user_id)


def get_broadcasts_info(user_id):
    """Fetch the user's story feed and download its livestream and replays.

    Replays are only downloaded when ``settings.save_replays`` is enabled.
    Errors and CTRL+C are logged and end the process with status 1.

    Args:
        user_id: Id of the user whose story feed is requested.
    """
    seperator("GREEN")
    try:
        log('[I] Checking for livestreams and replays...', "GREEN")
        seperator("GREEN")
        broadcasts = instagram_api.user_story_feed(user_id)
        livestream = broadcasts.get('broadcast')
        replays = (broadcasts.get('post_live_item') or {}).get('broadcasts', [])

        if livestream:
            download_livestream(livestream)
        else:
            log('[I] There are no available livestreams.', "YELLOW")

        if _is_enabled(settings.save_replays):
            if replays:
                seperator("GREEN")
                log('[I] Replays found, beginning download...', "GREEN")
                seperator("GREEN")
                download_replays(replays)
            else:
                log('[I] There are no available replays.', "YELLOW")
        else:
            log("[I] Replay saving is disabled either with an argument or in the config file.", "BLUE")
        seperator("GREEN")
    except ClientThrottledError:
        # Must precede the generic handler, otherwise it can never be reached.
        log('[E] Could not check because you are making too many requests at this time.', "RED")
        seperator("GREEN")
        sys.exit(1)
    except Exception as e:
        log('[E] Could not finish checking: {:s}'.format(str(e)), "RED")
        if "timed out" in str(e):
            log('[E] The connection timed out, check your internet connection.', "RED")
        seperator("GREEN")
        sys.exit(1)
    except KeyboardInterrupt:
        log('[W] Aborted checking for livestreams and replays, exiting...', "YELLOW")
        seperator("GREEN")
        sys.exit(1)


def _log_replay_durations(broadcasts):
    """Log the replay count and each replay's duration from its DASH manifest."""
    try:
        log('[I] Amount of replays : {:s}'.format(str(len(broadcasts))), "GREEN")
        for replay_index, broadcast in enumerate(broadcasts):
            periods = parseString(broadcast.get('dash_manifest')).getElementsByTagName('Period')
            bc_duration_raw = periods[0].getAttribute("duration")
            # Picks the text between "H" and "M", and between "M" and "S",
            # out of the duration attribute.
            bc_minutes = bc_duration_raw.split("H")[1].split("M")[0]
            bc_seconds = bc_duration_raw.split("M")[1].split("S")[0].split('.')[0]
            log('[I] Replay {:s} duration : {:s} minutes and {:s} seconds'.format(
                str(replay_index + 1), bc_minutes, bc_seconds), "GREEN")
    except Exception as e:
        log("[W] An error occurred while getting replay duration information: {:s}".format(str(e)), "YELLOW")


def _replay_already_downloaded(broadcast_id):
    """Return True when a non-live folder in the save path contains *broadcast_id*."""
    directories = next(os.walk(settings.save_path))[1]
    return any(broadcast_id in directory and "_live_" not in directory
               for directory in directories)


def download_replays(broadcasts):
    """Download every replay in *broadcasts* that is not already on disk.

    Always ends the process: status 0 when finished or aborted with CTRL+C,
    status 1 on errors.

    Args:
        broadcasts: List of replay broadcast dicts.
    """
    # Folder of the replay currently being downloaded; None while no download
    # is in progress so the handlers below never touch a stale or unset path.
    output_dir = None
    try:
        _log_replay_durations(broadcasts)
        seperator("GREEN")
        log("[I] Downloading replays... press [CTRL+C] to abort.", "GREEN")
        seperator("GREEN")
        total = len(broadcasts)
        for replay_index, broadcast in enumerate(broadcasts):
            output_dir = None
            broadcast_id = str(broadcast.get('id'))
            if _replay_already_downloaded(broadcast_id):
                log("[W] Already downloaded a replay with ID '{:s}'.".format(broadcast_id), "YELLOW")
                continue

            current = replay_index + 1
            log("[I] Downloading replay {:s} of {:s} with ID '{:s}'...".format(
                str(current), str(total), broadcast_id), "GREEN")
            output_dir = '{}{}_{}_{}_{}_replay_downloads'.format(
                settings.save_path, settings.current_date, user_to_download,
                broadcast.get('id'), settings.current_time)
            broadcast_downloader = replay.Downloader(
                mpd=broadcast.get('dash_manifest'),
                output_dir=output_dir,
                user_agent=instagram_api.user_agent)
            open(os.path.join(output_dir, 'folder.lock'), 'a').close()
            replay_mp4_file = '{}{}_{}_{}_{}_replay.mp4'.format(
                settings.save_path, settings.current_date, user_to_download,
                broadcast.get('id'), settings.current_time)
            replay_json_file = os.path.join(
                output_dir,
                '{}_{}_{}_{}_replay_comments.json'.format(
                    settings.current_date, user_to_download,
                    broadcast.get('id'), settings.current_time))

            replay_saved = broadcast_downloader.download(
                replay_mp4_file, cleartempfiles=_is_enabled(settings.clear_temp_files))

            if _is_enabled(settings.save_comments):
                log("[I] Downloading replay comments...", "GREEN")
                try:
                    get_replay_comments(instagram_api, broadcast, replay_json_file, broadcast_downloader)
                except Exception as e:
                    log('[E] An error occurred while downloading comments: {:s}'.format(str(e)), "RED")

            if len(replay_saved) == 1:
                log("[I] Finished downloading replay {:s} of {:s}.".format(str(current), str(total)), "GREEN")
                _remove_lock_file(output_dir)
                if current != total:
                    seperator("GREEN")
            else:
                log("[W] No output video file was made, please merge the files manually if possible.", "YELLOW")
                log("[W] Check if ffmpeg is available by running ffmpeg in your terminal/cmd prompt.", "YELLOW")
                log("", "GREEN")

        seperator("GREEN")
        log("[I] Finished downloading all available replays.", "GREEN")
        seperator("GREEN")
        sys.exit(0)
    except Exception as e:
        log('[E] Could not save replay: {:s}'.format(str(e)), "RED")
        seperator("GREEN")
        _remove_lock_file(output_dir)
        sys.exit(1)
    except KeyboardInterrupt:
        seperator("GREEN")
        log('[I] The download has been aborted by the user.', "YELLOW")
        seperator("GREEN")
        if output_dir:
            try:
                shutil.rmtree(output_dir)
            except Exception as e:
                log("[E] Could not remove temp folder: {:s}".format(str(e)), "RED")
                sys.exit(1)
        sys.exit(0)


def get_replay_comments(instagram_api, broadcast, comments_json_file, broadcast_downloader):
    """Download a replay's comments and write them to a logfile.

    Args:
        instagram_api: API client handed to ``CommentsDownloader``.
        broadcast: Replay broadcast dict.
        comments_json_file: Destination path of the comments JSON file; the
            logfile uses the same path with ``.json`` replaced by ``.log``.
        broadcast_downloader: Unused here; kept for a signature parallel to
            ``get_live_comments``.

    Returns:
        True when comments were written to the logfile, False otherwise
        (no comments, an error, or CTRL+C).
    """
    try:
        comments_downloader = CommentsDownloader(
            api=instagram_api, broadcast=broadcast, destination_file=comments_json_file)
        comments_downloader.get_replay()
        try:
            if not comments_downloader.comments:
                log("[I] There are no available comments to save.", "GREEN")
                return False
            comments_log_file = comments_json_file.replace('.json', '.log')
            comment_errors, total_comments = CommentsDownloader.generate_log(
                comments_downloader.comments, broadcast.get('published_time'),
                comments_log_file, comments_delay=0)
            _log_comment_save_result(total_comments == 1, total_comments, comment_errors)
            return True
        except Exception as e:
            log('[E] Could not save comments to logfile: {:s}'.format(str(e)), "RED")
            return False
    except KeyboardInterrupt:
        log("[W] Downloading replay comments has been aborted.", "YELLOW")
        return False


def get_live_comments(instagram_api, broadcast, comments_json_file, broadcast_downloader):
    """Collect livestream comments until the download stops, then save them.

    Polls ``CommentsDownloader.get_live`` while the downloader is not aborted,
    then saves the comments and writes a logfile next to the JSON file.

    Args:
        instagram_api: API client handed to ``CommentsDownloader``.
        broadcast: Livestream broadcast dict; ``initial_buffered_duration`` is
            added to it once the downloader reports a value.
        comments_json_file: Destination path of the comments JSON file; the
            logfile uses the same path with ``.json`` replaced by ``.log``.
        broadcast_downloader: Live downloader; its ``is_aborted`` and
            ``initial_buffered_duration`` attributes are read.

    Returns:
        True when comments were written to the logfile, False otherwise
        (no comments, an error, or CTRL+C).
    """
    try:
        comments_downloader = CommentsDownloader(
            api=instagram_api, broadcast=broadcast, destination_file=comments_json_file)
        first_comment_created_at = 0

        try:
            while not broadcast_downloader.is_aborted:
                if ('initial_buffered_duration' not in broadcast
                        and broadcast_downloader.initial_buffered_duration):
                    broadcast['initial_buffered_duration'] = broadcast_downloader.initial_buffered_duration
                    comments_downloader.broadcast = broadcast
                first_comment_created_at = comments_downloader.get_live(first_comment_created_at)
        except ClientError as e:
            if 'media has been deleted' not in e.error_response:
                log("[W] Comment collection ClientError: %d %s" % (e.code, e.error_response), "YELLOW")

        try:
            if not comments_downloader.comments:
                log("[I] There are no available comments to save.", "GREEN")
                return False
            comments_downloader.save()
            comments_log_file = comments_json_file.replace('.json', '.log')
            comment_errors, total_comments = CommentsDownloader.generate_log(
                comments_downloader.comments, settings.current_time, comments_log_file,
                comments_delay=broadcast_downloader.initial_buffered_duration)
            _log_comment_save_result(
                len(comments_downloader.comments) == 1, total_comments, comment_errors)
            return True
        except Exception as e:
            log('[E] Could not save comments to logfile: {:s}'.format(str(e)), "RED")
            return False
    except KeyboardInterrupt:
        log("[W] Downloading livestream comments has been aborted.", "YELLOW")
        return False