Overview
This Python script is designed to process image files by converting them to the WebP format, organizing them into specific folders, and preserving their metadata. It also handles the renaming of files to remove spaces and ensures that the original metadata is preserved in the converted files.
Usage
To use this script, run it from the command line and provide the following arguments:
input_dir
: The path to the directory containing the images you want to process.output_dir
: The path to the directory where the converted images will be saved.--ext
: (Optional) A list of image extensions to process. Default is["all"]
.--subdir
: (Optional) A flag to indicate whether to search for images recursively in subdirectories. Default isFalse
.
Example command:
python image_processing_script.py /path/to/input /path/to/output --ext jpg png --subdir
Features
- Converts images to WebP format using the
cwebp
command. - Organizes converted images into folders based on conversion options.
- Renames files to remove spaces.
- Preserves metadata from the original images in the converted files using
exiftool
. - Provides logging information with timestamps and log levels.
Functions
process_single_image
: Converts a single image and writes the markdown link to a file.process_images
: Processes all image files in the input directory with the specified extensions.expand_image_extensions
: Expands a list of image extensions to include common variants.find_image_files
: Finds all image files in the given directory with the specified extensions.create_output_directories
: Creates the necessary output directories within the base directory.convert_image_with_cwebp
: Converts an image usingcwebp
and saves it to the output directory.build_converted_path
: Builds the path for the converted image file.
Requirements
- Python 3.x
- The
cwebp
command-line tool must be installed and available in the system’s PATH. - The
exiftool
command-line tool must be installed and available in the system’s PATH.
Notes
- Ensure that you have the necessary permissions to read and write files in the specified directories.
- Always backup your original images before running the script to prevent data loss.
- The script assumes that the
cwebp
andexiftool
tools are correctly installed and configured on your system.
Code
import argparse
import subprocess
from pathlib import Path
import logging
# Enable logger, print to console with timestamp and log level
logging.basicConfig(
level=logging.INFO, format="\n%(asctime)s - %(levelname)s - %(message)s"
)
logger = logging.getLogger(__name__)
def process_single_image(
image_path: Path,
output_dir: Path,
) -> None:
"""
Processes a single image file: converts it, uploads it, and writes the markdown link to a file.
Args:
image_path (Path): The path to the input image file.
output_dir (Path): The directory where the converted images will be saved.
Returns:
None
"""
folder_options = [
# ("Lossless", ["-z", "8", "-mt"]),
# ("6MB", ["-size", "6291456", "-pass", "10", "-qrange", "80", "100", "-mt"]),
("Web", ["-resize", "1280", "0", "-mt"]),
]
for folder_name, options in folder_options:
folder_path = output_dir / folder_name
create_output_directories(output_dir, folder_name)
convert_image_with_cwebp(image_path, folder_path, options)
def process_images(
input_dir: Path,
output_dir: Path,
extensions: list[str],
subdir: bool,
) -> None:
"""
Processes all image files in the input directory with the specified extensions.
Args:
input_dir (Path): The directory containing the input image files.
output_dir (Path): The directory where the converted images and markdown links will be saved.
extensions (list[str]): A space-separated list of image extensions.
subdir (bool): Whether to search recursively in subdirectories.
md_links_file_name (str): The name of the file where the markdown links will be written.
"""
image_files = find_image_files(input_dir, extensions, subdir)
for image_path in image_files:
image_path.rename(image_path.parent / image_path.name.replace(" ", "-"))
process_single_image(image_path, output_dir)
def expand_image_extensions(extensions: list[str]) -> list[str]:
"""
Expands a comma-separated list of image extensions to include common variants.
Args:
extensions (list[str]): A list of image extensions.
Returns:
list[str]: A list of expanded image extensions.
"""
supported_extensions = ["jpg", "jpeg", "png", "tif", "tiff", "webp"]
expanded_extensions = []
for ext in [s.lower() for s in extensions]:
if ext == "all":
expanded_extensions = supported_extensions
break
elif ext in ["jpg", "jpeg"]:
expanded_extensions.extend(["jpg", "jpeg"])
elif ext in ["tif", "tiff"]:
expanded_extensions.extend(["tif", "tiff"])
else:
expanded_extensions.append(ext)
return [s.lower() for s in expanded_extensions] + [
s.upper() for s in expanded_extensions
]
def find_image_files(
directory: Path, extensions: list[str], subdir: bool
) -> list[Path]:
"""
Finds all image files in the given directory with the specified extensions.
Args:
directory (Path): The directory to search for image files.
extensions (list[str]): A list of image file extensions.
subdir (bool): Whether to search recursively in subdirectories.
Returns:
list[Path]: A list of paths to the found image files.
"""
return sorted(
[
file
for ext in extensions
for file in directory.rglob(f"*.{ext}")
if not file.name.startswith(".")
]
if subdir
else [
file
for ext in extensions
for file in directory.glob(f"*.{ext}")
if not file.name.startswith(".")
]
)
def create_output_directories(base_dir: Path, *folder_names: str) -> None:
"""
Creates the necessary output directories within the base directory.
Args:
base_dir (Path): The base directory where the output directories will be created.
*folder_names (str): Variable number of folder names to create.
"""
for folder_name in folder_names:
Path(base_dir, folder_name).mkdir(parents=True, exist_ok=True)
def convert_image_with_cwebp(input_path: Path, output_dir: Path, options: list) -> None:
"""
Converts an image using cwebp and saves it to the output directory.
Args:
input_path (Path): The path to the input image file.
output_dir (Path): The directory where the converted image will be saved.
options (list): A list of options to pass to the cwebp command.
"""
output_path = build_converted_path(input_path, output_dir)
cweb_cmd = [
"cwebp",
*options,
"-metadata",
"all",
str(input_path),
"-o",
str(output_path),
]
try:
subprocess.run(cweb_cmd, check=True)
subprocess.run(
[
"exiftool",
"-TagsFromFile",
str(input_path),
"-overwrite_original",
str(output_path),
],
check=True,
)
except subprocess.CalledProcessError as e:
logger.error(f"Failed to convert {input_path}: {e}")
def build_converted_path(input_path: Path, output_dir: Path) -> Path:
"""
Builds the path for the converted image file.
Args:
input_path (Path): The path to the input image file.
output_dir (Path): The directory where the converted image will be saved.
Returns:
Path: The path to the converted image file.
"""
return output_dir / (input_path.stem + ".webp")
def main() -> None:
"""
The main function that parses command line arguments and processes images.
"""
parser = argparse.ArgumentParser(description="Convert and upload images.")
parser.add_argument("input_dir", type=str, help="Input directory path")
parser.add_argument("output_dir", type=str, help="Output directory path")
parser.add_argument(
"--ext",
nargs="+",
default=["all"],
help="List of input image extensions",
)
parser.add_argument(
"--subdir",
action="store_false",
help="Search for images recursively in subdirectories",
)
args = parser.parse_args()
input_dir = Path(args.input_dir)
output_dir = Path(args.output_dir)
process_images(
input_dir, output_dir, expand_image_extensions(args.ext), args.subdir
)
if __name__ == "__main__":
main()