Last active
May 8, 2023 20:43
-
-
Save pklaus/4271012 to your computer and use it in GitHub Desktop.
Do you own a DSLR? If so, do you transfer your images to your computer, then look at the JPEGs and delete the crappy ones? If you do, your RAW images may be leftover. This Python script helps you cleaning up your image folders after deleting unwanted JPEGs. See http://blog.philippklaus.de/2012/12/cleaning-leftover-raw-images-after-selecting-imag…
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
#!/usr/bin/env python2.7 | |
# -*- coding: utf-8 -*- | |
""" | |
This script was moved to | |
https://github.com/pklaus/pklaus/blob/master/pklaus/images/orphans/remove.py | |
Here's the original content left for you as a reference: | |
Do you own a DSLR? If so, do you transfer your images to your computer, | |
then look at the JPEGs and delete the crappy ones? If you do, your RAW | |
mages may be leftover. This Python script helps you cleaning up your image | |
folders after deleting unwanted JPEGs. See | |
http://blog.philippklaus.de/2012/12/cleaning-leftover-raw-images-after-selecting-images-based-on-jpegs/ | |
for more information. | |
Started on 2012-12-12 by Philipp Klaus <philipp.l.klaus →AT→ web.de>. | |
""" | |
import argparse, os, errno, re, shutil, sys | |
def stderr(line): | |
sys.stderr.write(line + '\n') | |
sys.stderr.flush() | |
def delete(files, backup_folder=None, verbose=True, dry=True): | |
if len(files) == 0: return | |
if backup_folder: | |
try: | |
os.mkdir(backup_folder) | |
except OSError, e: | |
if not e.errno == errno.EEXIST: | |
raise | |
for filename in files: | |
if verbose: print "Moving %s to %s." % (filename, backup_folder) | |
if not dry: shutil.move(filename, os.path.join(backup_folder)) | |
else: | |
for filename in files: | |
if verbose: print "Deleting %s." % (filename,) | |
if not dry: os.remove(filename) | |
if __name__ == '__main__': | |
parser = argparse.ArgumentParser(description='Cleanup of leftover raw image files (*.CR2).') | |
parser.add_argument('--no-backup', '-n', action='store_true', | |
help='Don\'t backup orphaned raw images - delete them immediately.') | |
parser.add_argument('--backup-folder', '-b', default='raw_orphans', | |
help='Folder to move orphaned raw images to.') | |
parser.add_argument('--tolerant', '-t', action='store_true', | |
help='Accept JPEGs that just start with the name of the raw image as a match too.') | |
parser.add_argument('--quiet', '-q', action='store_true', | |
help='Silence the less important output of this tool.') | |
parser.add_argument('--dry', '-d', action='store_true', | |
help='Dry run: Only show what the tool would do without actually executing.') | |
parser.add_argument('folder', metavar='CHECK_FOLDER', default='./', nargs='?', | |
help='Folder to check for raw images. Defaults to the current working directory') | |
args = parser.parse_args() | |
verbose = not args.quiet | |
raw_images, jpeg_images_bare_names = [], [] | |
all_files = list(os.listdir(args.folder)) | |
# sort files into raw and jpeg files | |
for filename in all_files: | |
# The file name of raw image ends with .CR2 for Canon EOS cameras | |
if re.match(r'(.*)\.[cC][rR]2$', filename): | |
raw_images.append(filename) | |
if re.match(r'(.*)\.[jJ][pP][eE]?[gG]$', filename): | |
jpeg_images_bare_names.append(os.path.splitext(filename)[0]) | |
# Check if there is a jpeg for each raw image | |
orphans = [] | |
for raw_image in raw_images: | |
if args.tolerant: | |
is_orphan = True | |
for jpg in jpeg_images_bare_names: | |
if jpg.startswith(os.path.splitext(raw_image)[0]): | |
is_orphan = False | |
if is_orphan: | |
orphans.append(raw_image) | |
elif os.path.splitext(raw_image)[0] not in jpeg_images_bare_names: | |
orphans.append(raw_image) | |
if len(raw_images) + len(jpeg_images_bare_names) == 0: | |
if verbose: stderr("No images found. Are you sure you wanted to check '%s' for orphaned RAW images?" % | |
(args.folder,)) | |
sys.exit(2) | |
elif len(raw_images) == 0: | |
if verbose: print "No RAW images found, but %i JPEGs. Won't do anything now." % ( | |
len(jpeg_images_bare_names),) | |
sys.exit(0) | |
elif len(orphans) == 0: | |
if verbose: print "%i RAW images found, and %i JPEGs but no orphans. Won't do anything now." % ( | |
len(raw_images), len(jpeg_images_bare_names)) | |
sys.exit(0) | |
else: | |
print "Found %i JPEGs and %i .CR2s. Of those RAW images, %i are orphans and will be removed." % ( | |
len(jpeg_images_bare_names), len(raw_images), len(orphans)) | |
backup_folder = None if args.no_backup else os.path.join(args.folder,args.backup_folder) | |
delete([os.path.join(args.folder,orphan) for orphan in orphans], backup_folder=backup_folder, verbose=verbose, dry=args.dry) | |
Install Instructions:
download the .py file
put the .py file in the folder with your images
Open terminal
navigate to the folder where your images are
type python
double click on the .py file
copy the text in the file
paste the text in terminal
done!
Hi!
Thanks! i just lookinf for something like this.
One question. How i apply this with many folders and sub folders?
Thanks! Regards!
For NEF files, same script as before but one line changed:
#!/usr/bin/env python2.7
# -*- coding: utf-8 -*-
"""
Written on 2012-12-12 by Philipp Klaus <philipp.l.klaus →AT→ web.de>.
Check <https://gist.github.com/4271012> for newer versions.
Also check <https://gist.github.com/3155743> for a tool to
rename JPEGs according to their EXIF shot time.
"""
import argparse, os, errno, re, shutil, sys
def stderr(line):
sys.stderr.write(line + '\n')
sys.stderr.flush()
def delete(files, backup_folder=None, verbose=True, dry=True):
if len(files) == 0: return
if backup_folder:
try:
os.mkdir(backup_folder)
except OSError, e:
if not e.errno == errno.EEXIST:
raise
for filename in files:
if verbose: print "Moving %s to %s." % (filename, backup_folder)
if not dry: shutil.move(filename, os.path.join(backup_folder))
else:
for filename in files:
if verbose: print "Deleting %s." % (filename,)
if not dry: os.remove(filename)
if __name__ == '__main__':
parser = argparse.ArgumentParser(description='Cleanup of leftover raw image files (*.CR2).')
parser.add_argument('--no-backup', '-n', action='store_true',
help='Don\'t backup orphaned raw images - delete them immediately.')
parser.add_argument('--backup-folder', '-b', default='raw_orphans',
help='Folder to move orphaned raw images to.')
parser.add_argument('--tolerant', '-t', action='store_true',
help='Accept JPEGs that just start with the name of the raw image as a match too.')
parser.add_argument('--quiet', '-q', action='store_true',
help='Silence the less important output of this tool.')
parser.add_argument('--dry', '-d', action='store_true',
help='Dry run: Only show what the tool would do without actually executing.')
parser.add_argument('folder', metavar='CHECK_FOLDER', default='./', nargs='?',
help='Folder to check for raw images. Defaults to the current working directory')
args = parser.parse_args()
verbose = not args.quiet
raw_images, jpeg_images_bare_names = [], []
all_files = list(os.listdir(args.folder))
# sort files into raw and jpeg files
for filename in all_files:
# The file name of raw image ends with .CR2 for Canon EOS cameras
if re.match(r'(.*)\.[nN][eE][fF]$', filename):
raw_images.append(filename)
if re.match(r'(.*)\.[jJ][pP][eE]?[gG]$', filename):
jpeg_images_bare_names.append(os.path.splitext(filename)[0])
# Check if there is a jpeg for each raw image
orphans = []
for raw_image in raw_images:
if args.tolerant:
is_orphan = True
for jpg in jpeg_images_bare_names:
if jpg.startswith(os.path.splitext(raw_image)[0]):
is_orphan = False
if is_orphan:
orphans.append(raw_image)
elif os.path.splitext(raw_image)[0] not in jpeg_images_bare_names:
orphans.append(raw_image)
if len(raw_images) + len(jpeg_images_bare_names) == 0:
if verbose: stderr("No images found. Are you sure you wanted to check '%s' for orphaned RAW images?" %
(args.folder,))
sys.exit(2)
elif len(raw_images) == 0:
if verbose: print "No RAW images found, but %i JPEGs. Won't do anything now." % (
len(jpeg_images_bare_names),)
sys.exit(0)
elif len(orphans) == 0:
if verbose: print "%i RAW images found, and %i JPEGs but no orphans. Won't do anything now." % (
len(raw_images), len(jpeg_images_bare_names))
sys.exit(0)
else:
print "Found %i JPEGs and %i .CR2s. Of those RAW images, %i are orphans and will be removed." % (
len(jpeg_images_bare_names), len(raw_images), len(orphans))
backup_folder = None if args.no_backup else os.path.join(args.folder,args.backup_folder)
delete([os.path.join(args.folder,orphan) for orphan in orphans], backup_folder=backup_folder, verbose=verbose, dry=args.dry)
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment
I want to do something similar on my Mac. I want to remove RAW files but keep Orphaned RAW files. I have no idea how to run this script. Do I need to install Github?