Add median time statistics, log levels, print successful and failed album titles, update README

This commit is contained in:
csd4ni3l
2025-06-17 11:08:07 +02:00
parent efd60fd633
commit 301956a954
5 changed files with 71 additions and 60 deletions

View File

@@ -4,38 +4,37 @@
This tool automates the process of downloading photos from Google Photos albums by simulating user interaction with the web interface. It uses Selenium to open shared album links, click the "Download all" button, and extract the images to your local system. This tool automates the process of downloading photos from Google Photos albums by simulating user interaction with the web interface. It uses Selenium to open shared album links, click the "Download all" button, and extract the images to your local system.
## Features ## Features
* 🔗 Accepts public/shared Google Photos album URLs * Accepts link-shared Google Photos album URLs
* 🖱️ Simulates browser behavior to download photos via the "Download all" option * Accepts your own Google Photos album URLs if you supply the profile directory.
* 🗃️ Automatically extracts downloaded `.zip` files into organized folders * Automatically extracts downloaded `.zip` files into organized folders
* 🛠️ Works without needing any API keys or OAuth setup * Works without needing any API keys or OAuth setup
* 📂 Supports batch downloading of multiple album links * Supports batch downloading of multiple album links
## 🛑 Why not use the Google Photos API? ## Why not use the Google Photos API?
As of recent updates, **the original Google Photos API is deprecated**. While the **Google Picker API** is still available, it comes with several major limitations: **The original Google Photos API is deprecated**. While the **Google Picker API** is still available, it comes with several major limitations:
* 🚫 You must select each photo manually — no "select all" option * You must select each photo manually; there is no "select all" option, so it cannot be automated.
* 📉 Limited to a maximum number of items (up to 100 photos per interaction) * Limited to a maximum number of items
* 🔐 Requires setting up a Google Cloud project and API credentials * It requires setting up a Google Cloud project and API credentials, which is pretty hard.
Due to these restrictions, this Selenium-based solution is one of the few remaining ways to fully automate bulk downloads from Google Photos albums. ## Disclaimer
## ⚠️ Disclaimer
* The project was not made by AI, just the README.
* It automates actions that a human user would normally perform in a browser.
* Be aware of Google's Terms of Service before using this tool. * Be aware of Google's Terms of Service before using this tool.
* It simulates human actions, but Google might not be happy about someone using this.
## 🧰 Requirements ## Requirements
* Python 3.11+ * Python 3.11+
* Selenium * Selenium
* Chrome or Chromium + WebDriver * Chrome or Chromium + WebDriver (Auto-installed by Selenium if not found)
## 💡 Usage ## Installation
```bash `pip install gp-dl`
python main.py --album-urls YOUR_ALBUM_LINK_HERE --output-dir test_images
``` ## Usage
`gp-dl --album-urls ALBUM_URL ALBUM_URL2 --output-dir test --log-level info`

View File

@@ -1 +1 @@
__version__ = "0.1.0" __version__ = "0.2.0"

View File

@@ -1,10 +1,11 @@
import os, time, argparse, re, sys, logging import os, time, argparse, logging, sys
from selenium.webdriver import Chrome, ChromeService from selenium.webdriver import Chrome, ChromeService
from selenium.webdriver.common.by import By from selenium.webdriver.common.by import By
from selenium.webdriver.chrome.options import Options from selenium.webdriver.chrome.options import Options
from selenium.common.exceptions import TimeoutException from selenium.common.exceptions import TimeoutException
from selenium.webdriver.support.ui import WebDriverWait from selenium.webdriver.support.ui import WebDriverWait
from selenium.webdriver.support import expected_conditions as EC from selenium.webdriver.support import expected_conditions as EC
from statistics import median
from zipfile import ZipFile from zipfile import ZipFile
BANNER = """ BANNER = """
@@ -15,18 +16,27 @@ BANNER = """
██████ ██ ██████ ███████ ██████ ██ ██████ ███████
gp-dl — Google Photos Downloader gp-dl — Google Photos Downloader
Download full-res albums using Selenium Download full-resolution albums from Google Photos using Selenium
Author: csd4ni3l | GitHub: https://github.com/csd4ni3l Author: csd4ni3l | GitHub: https://github.com/csd4ni3l
""" """
LOG_LEVELS = {
"DEBUG": logging.DEBUG,
"INFO": logging.INFO,
"ERROR": logging.ERROR,
"FATAL": logging.FATAL,
"QUIET": 999999999
}
def parse_args(): def parse_args():
parser = argparse.ArgumentParser(description="Download full-res images from a Google Photos album using Selenium.") parser = argparse.ArgumentParser(description="Download full-res images from a Google Photos album using Selenium.")
parser.add_argument("--album-urls", nargs="+", required=True, help="Google Photos album URL(s)") parser.add_argument("--album-urls", nargs="+", required=True, help="Google Photos album URL(s)")
parser.add_argument("--output-dir", required=True, help="Directory to save downloaded albums") parser.add_argument("--output-dir", required=True, help="The directory to save downloaded albums")
parser.add_argument("--driver-path", default=None, help="Custom Chrome driver path") parser.add_argument("--driver-path", default=None, help="Custom Chrome driver path")
parser.add_argument("--profile-dir", default=None, help="Chrome user data directory for session reuse") parser.add_argument("--profile-dir", default=None, help="A Chrome user data directory for sessions, set this if you want to open non-shared links.")
parser.add_argument("--headless", action="store_true", help="Run Chrome headlessly") parser.add_argument("--headless", action="store_true", help="Run Chrome headlessly")
parser.add_argument("--log-level", default="INFO", help="Specifies what to include in log output. Available levels: debug, info, error, fatal")
return parser.parse_args() return parser.parse_args()
def setup_driver(driver_path=None, profile_dir=None, headless=True): def setup_driver(driver_path=None, profile_dir=None, headless=True):
@@ -62,14 +72,23 @@ def find_crdownload_file():
if file.endswith(".crdownload"): if file.endswith(".crdownload"):
return file return file
def configure_logging(): def configure_logging(log_level: str):
logging.basicConfig(format='%(asctime)s %(levelname)s: %(message)s', level=logging.DEBUG) if not log_level.upper() in LOG_LEVELS:
print(f"Invalid logging level: {log_level}")
sys.exit(1)
logging.basicConfig(format='%(asctime)s %(levelname)s: %(message)s', level=LOG_LEVELS[log_level.upper()])
for logger_to_disable in ["selenium", "urllib3"]: for logger_to_disable in ["selenium", "urllib3"]:
logging.getLogger(logger_to_disable).propagate = False logging.getLogger(logger_to_disable).propagate = False
logging.getLogger(logger_to_disable).disabled = True logging.getLogger(logger_to_disable).disabled = True
def main(): def run_cli():
args = parse_args() args = parse_args()
if not args.log_level.upper() == "QUIET":
print(BANNER)
configure_logging(args.log_level)
driver = setup_driver(profile_dir=args.profile_dir, headless=args.headless) driver = setup_driver(profile_dir=args.profile_dir, headless=args.headless)
if not os.path.exists("gp_temp") or not os.path.isdir("gp_temp"): if not os.path.exists("gp_temp") or not os.path.isdir("gp_temp"):
@@ -80,8 +99,8 @@ def main():
logging.fatal("Invalid output directory. Please supply a valid and existing directory.") logging.fatal("Invalid output directory. Please supply a valid and existing directory.")
return return
failed_album_count = 0 failed_albums = []
successful_album_count = 0 successful_albums = []
total_albums = len(args.album_urls) total_albums = len(args.album_urls)
all_start = time.perf_counter() all_start = time.perf_counter()
album_times = [] album_times = []
@@ -89,23 +108,19 @@ def main():
for album_url in args.album_urls: for album_url in args.album_urls:
album_start = time.perf_counter() album_start = time.perf_counter()
if re.match(r'^https?://photos\.app\.goo\.gl/[A-Za-z0-9]+$', album_url) is None:
logging.error(f"Invalid album URL: {album_url}")
logging.info("Continuing with next album URL.")
failed_album_count += 1
continue
logging.info(f"Now downloading {album_url}")
driver.get(album_url) driver.get(album_url)
album_title = driver.title.split(" -")[0]
logging.info(f"Now downloading {album_title} ({album_url})")
logging.debug("Waiting for menu button...") logging.debug("Waiting for menu button...")
try: try:
menu_button = WebDriverWait(driver, 10).until(EC.presence_of_element_located((By.XPATH, '//*[@aria-label="More options"]'))) menu_button = WebDriverWait(driver, 10).until(EC.presence_of_element_located((By.XPATH, '//*[@aria-label="More options"]')))
except TimeoutException: except TimeoutException:
logging.error("Could not find more options button in time.") logging.error("Could not find the 'more options' button in time.")
logging.info("Continuing with next album URL.") logging.info("Continuing with next album URL.")
failed_album_count += 1 failed_albums.append(album_title)
continue continue
logging.debug("Clicking menu button...") logging.debug("Clicking menu button...")
@@ -115,9 +130,9 @@ def main():
try: try:
download_all_button = WebDriverWait(driver, 10).until(EC.presence_of_element_located((By.XPATH, '//*[@aria-label="Download all"]'))) download_all_button = WebDriverWait(driver, 10).until(EC.presence_of_element_located((By.XPATH, '//*[@aria-label="Download all"]')))
except TimeoutException: except TimeoutException:
logging.error("Could not find download all button in time.") logging.error("Could not find the 'download all' button in time.")
logging.info("Continuing with next album.") logging.info("Continuing with next album.")
failed_album_count += 1 failed_albums.append(album_title)
continue continue
logging.debug("Clicking the download all button...") logging.debug("Clicking the download all button...")
@@ -145,23 +160,20 @@ def main():
logging.info(f"Succesfully extracted zip file to {args.output_dir}") logging.info(f"Succesfully extracted zip file to {args.output_dir}")
successful_album_count += 1 successful_albums.append(album_title)
album_times.append(time.perf_counter() - album_start) album_times.append(time.perf_counter() - album_start)
logging.debug("Removing temporary gp_temp directory.") logging.debug("Removing temporary gp_temp directory.")
os.removedirs("gp_temp") os.removedirs("gp_temp")
print("\n===== DOWNLOAD STATISTICS =====") logging.info("")
print(f"Total albums given: {total_albums}") logging.info("===== DOWNLOAD STATISTICS =====")
print(f"Successfully downloaded: {successful_album_count}") logging.info(f"Total albums given: {total_albums}")
print(f"Failed downloads: {failed_album_count}") logging.info(f"Successful albums ({len(successful_albums)}): {', '.join(successful_albums) or None}")
print(f"Average time taken per album: {sum(album_times) / len(album_times):.2f} seconds") logging.info(f"Failed albums ({len(failed_albums)}): {', '.join(failed_albums) or 'None'}")
print(f"Total time taken: {time.perf_counter() - all_start:.2f} seconds") logging.info(f"Median time taken per album: {median(album_times or [0]):.2f} seconds")
print("================================") logging.info(f"Average time taken per album: {sum(album_times or [0]) / len(album_times or [0]):.2f} seconds")
logging.info(f"Total time taken: {time.perf_counter() - all_start:.2f} seconds")
logging.info("================================")
driver.quit() driver.quit()
def run_cli():
print(BANNER)
configure_logging()
main()

View File

@@ -1,6 +1,6 @@
[project] [project]
name = "gp-dl" name = "gp-dl"
version = "0.1.0" version = "0.2.0"
description = "A Python-based Google Photos downloader built with Selenium." description = "A Python-based Google Photos downloader built with Selenium."
readme = "README.md" readme = "README.md"
requires-python = ">=3.11" requires-python = ">=3.11"

2
uv.lock generated
View File

@@ -39,7 +39,7 @@ wheels = [
[[package]] [[package]]
name = "gp-dl" name = "gp-dl"
version = "0.1.0" version = "0.2.0"
source = { editable = "." } source = { editable = "." }
dependencies = [ dependencies = [
{ name = "selenium" }, { name = "selenium" },