sudoalx · October 29, 2023 20:16 · sudoalx · Oct 29, 2023
diff --git a/gotodownloader.py b/gotodownloader.py
 import time
 import requests
 from tqdm import tqdm
 from selenium import webdriver
 from selenium.webdriver.common.by import By
 from selenium.webdriver.support.ui import WebDriverWait
 from selenium.webdriver.support import expected_conditions as EC
 from selenium.webdriver.common.action_chains import ActionChains

 def download_video(link, destination_directory):
    """Download the video embedded in a web page to a local ``.mp4`` file.

    Opens ``link`` in headless Chrome, waits for a ``<video>`` element, reads
    the page title and the "Date" field, then streams the video's ``src`` URL
    to ``<destination_directory>/<title> - <date>.mp4`` while showing a
    progress bar.

    Args:
        link: URL of the page that hosts the video.
        destination_directory: Directory the file is written to. It is
            created when it does not exist yet.

    Raises:
        selenium.common.exceptions.TimeoutException: No ``<video>`` element
            appeared within 10 seconds.
        selenium.common.exceptions.NoSuchElementException: The date or title
            element could not be found.
        ValueError: The ``<video>`` element exposes no ``src`` URL.
        requests.HTTPError: The video URL answered with an error status.
    """
    import os  # local import: nothing else in this block's view needs it

    # Path separators and characters that common file systems reject; the
    # scraped title/date may contain any of them (e.g. "10/29/2023 8:16 PM").
    unsafe_chars = str.maketrans({char: "_" for char in '<>:"/\\|?*\r\n\t'})

    # Headless Chrome; the extra flags are the ones the original author
    # marked as required for headless runs.
    chrome_options = webdriver.ChromeOptions()
    chrome_options.add_argument('--headless')
    chrome_options.add_argument('--disable-gpu')
    chrome_options.add_argument('--no-sandbox')

    driver = webdriver.Chrome(options=chrome_options)
    try:
        driver.get(link)

        # Wait for up to 10 seconds for the <video> tag to be present.
        wait = WebDriverWait(driver, 10)
        video_element = wait.until(EC.presence_of_element_located((By.TAG_NAME, 'video')))

        # The date is the styled <p> that sits next to the "Date" label.
        date_element = driver.find_element(By.XPATH, '//div[p[text()="Date"]]/p[contains(@class, "src-components-Info-MeetingStats-MeetingStats--text")]')
        date_text = date_element.text

        # <title> is not rendered, so read textContent rather than .text.
        title_element = driver.find_element(By.TAG_NAME, 'title')
        title_text = title_element.get_attribute('textContent')

        # Fixed delay kept from the original (adjust as needed); presumably
        # it gives the page time to fill in the video source.
        time.sleep(5)
        video_url = video_element.get_attribute("src")
    finally:
        # Always shut the browser down, even when a lookup above fails.
        # The download below goes through requests and does not need it.
        driver.quit()

    if not video_url:
        raise ValueError(f"No video source URL found on {link}")

    base_name = f"{title_text} - {date_text}".translate(unsafe_chars).strip()
    if destination_directory:
        os.makedirs(destination_directory, exist_ok=True)
    full_filename = os.path.join(destination_directory, f"{base_name}.mp4")

    # Stream the body so the whole video is never held in memory.
    with requests.get(video_url, stream=True, timeout=30) as response:
        # Fail loudly instead of saving an HTML error page as an .mp4.
        response.raise_for_status()
        total_size = int(response.headers.get('content-length', 0))

        with open(full_filename, "wb") as video_file:
            # total=None lets tqdm count bytes when the size is unknown.
            with tqdm(total=total_size or None, unit='B', unit_scale=True, unit_divisor=1024) as pbar:
                for data in response.iter_content(chunk_size=64 * 1024):
                    video_file.write(data)
                    pbar.update(len(data))

 if __name__ == "__main__":
    # Command-line entry point: read a list of page links from a text file
    # and download the video behind each one into the given directory.
    import argparse

    parser = argparse.ArgumentParser(description="Download videos from a list of links.")
    parser.add_argument("-f", "--links-file", required=True, help="Path to the text file containing comma-separated links.")
    parser.add_argument("-d", "--destination-directory", required=True, help="Directory where downloaded videos will be saved.")

    args = parser.parse_args()

    with open(args.links_file, "r") as file:
        raw_links = file.read()

    # Links are comma-separated; line breaks are accepted as separators too.
    # Surrounding whitespace is dropped and empty entries (trailing comma,
    # blank line) are skipped so no empty URL reaches the browser.
    links = [
        entry.strip()
        for entry in raw_links.replace("\n", ",").split(",")
        if entry.strip()
    ]

    for link in links:
        download_video(link, args.destination_directory)
	import time
	import requests
	from tqdm import tqdm
	from selenium import webdriver
	from selenium.webdriver.common.by import By
	from selenium.webdriver.support.ui import WebDriverWait
	from selenium.webdriver.support import expected_conditions as EC
	from selenium.webdriver.common.action_chains import ActionChains

	def download_video(link, destination_directory):
	    """Download the video embedded in a web page to a local ``.mp4`` file.

	    Opens ``link`` in headless Chrome, waits for a ``<video>`` element,
	    reads the page title and the "Date" field, then streams the video's
	    ``src`` URL to ``<destination_directory>/<title> - <date>.mp4`` while
	    showing a progress bar.

	    Args:
	        link: URL of the page that hosts the video.
	        destination_directory: Directory the file is written to. It is
	            created when it does not exist yet.

	    Raises:
	        selenium.common.exceptions.TimeoutException: No ``<video>``
	            element appeared within 10 seconds.
	        selenium.common.exceptions.NoSuchElementException: The date or
	            title element could not be found.
	        ValueError: The ``<video>`` element exposes no ``src`` URL.
	        requests.HTTPError: The video URL answered with an error status.
	    """
	    import os  # local import: nothing else in this block's view needs it

	    # Path separators and characters that common file systems reject; the
	    # scraped title/date may contain any of them.
	    unsafe_chars = str.maketrans({char: "_" for char in '<>:"/\\|?*\r\n\t'})

	    # Headless Chrome; the extra flags are the ones the original author
	    # marked as required for headless runs.
	    chrome_options = webdriver.ChromeOptions()
	    chrome_options.add_argument('--headless')
	    chrome_options.add_argument('--disable-gpu')
	    chrome_options.add_argument('--no-sandbox')

	    driver = webdriver.Chrome(options=chrome_options)
	    try:
	        driver.get(link)

	        # Wait for up to 10 seconds for the <video> tag to be present.
	        wait = WebDriverWait(driver, 10)
	        video_element = wait.until(EC.presence_of_element_located((By.TAG_NAME, 'video')))

	        # The date is the styled <p> that sits next to the "Date" label.
	        date_element = driver.find_element(By.XPATH, '//div[p[text()="Date"]]/p[contains(@class, "src-components-Info-MeetingStats-MeetingStats--text")]')
	        date_text = date_element.text

	        # <title> is not rendered, so read textContent rather than .text.
	        title_element = driver.find_element(By.TAG_NAME, 'title')
	        title_text = title_element.get_attribute('textContent')

	        # Fixed delay kept from the original (adjust as needed); presumably
	        # it gives the page time to fill in the video source.
	        time.sleep(5)
	        video_url = video_element.get_attribute("src")
	    finally:
	        # Always shut the browser down, even when a lookup above fails.
	        # The download below goes through requests and does not need it.
	        driver.quit()

	    if not video_url:
	        raise ValueError(f"No video source URL found on {link}")

	    base_name = f"{title_text} - {date_text}".translate(unsafe_chars).strip()
	    if destination_directory:
	        os.makedirs(destination_directory, exist_ok=True)
	    full_filename = os.path.join(destination_directory, f"{base_name}.mp4")

	    # Stream the body so the whole video is never held in memory.
	    with requests.get(video_url, stream=True, timeout=30) as response:
	        # Fail loudly instead of saving an HTML error page as an .mp4.
	        response.raise_for_status()
	        total_size = int(response.headers.get('content-length', 0))

	        with open(full_filename, "wb") as video_file:
	            # total=None lets tqdm count bytes when the size is unknown.
	            with tqdm(total=total_size or None, unit='B', unit_scale=True, unit_divisor=1024) as pbar:
	                for data in response.iter_content(chunk_size=64 * 1024):
	                    video_file.write(data)
	                    pbar.update(len(data))

	if __name__ == "__main__":
	    # Command-line entry point: read a list of page links from a text file
	    # and download the video behind each one into the given directory.
	    import argparse

	    parser = argparse.ArgumentParser(description="Download videos from a list of links.")
	    parser.add_argument("-f", "--links-file", required=True, help="Path to the text file containing comma-separated links.")
	    parser.add_argument("-d", "--destination-directory", required=True, help="Directory where downloaded videos will be saved.")

	    args = parser.parse_args()

	    with open(args.links_file, "r") as file:
	        raw_links = file.read()

	    # Links are comma-separated; line breaks are accepted as separators
	    # too. Surrounding whitespace is dropped and empty entries (trailing
	    # comma, blank line) are skipped so no empty URL reaches the browser.
	    links = [
	        entry.strip()
	        for entry in raw_links.replace("\n", ",").split(",")
	        if entry.strip()
	    ]

	    for link in links:
	        download_video(link, args.destination_directory)