Create a gist now

Instantly share code, notes, and snippets.

What would you like to do?
Do you own a DSLR? If so, do you transfer your images to your computer, then look at the JPEGs and delete the crappy ones? If you do, your RAW images may be leftover. This Python script helps you cleaning up your image folders after deleting unwanted JPEGs. See…
#!/usr/bin/env python2.7
# -*- coding: utf-8 -*-
Written on 2012-12-12 by Philipp Klaus <philipp.l.klaus →AT→>.
Check <> for newer versions.
Also check <> for a tool to
rename JPEGs according to their EXIF shot time.
import argparse, os, errno, re, shutil, sys
def stderr(line):
sys.stderr.write(line + '\n')
def delete(files, backup_folder=None, verbose=True, dry=True):
if len(files) == 0: return
if backup_folder:
except OSError, e:
if not e.errno == errno.EEXIST:
for filename in files:
if verbose: print "Moving %s to %s." % (filename, backup_folder)
if not dry: shutil.move(filename, os.path.join(backup_folder))
for filename in files:
if verbose: print "Deleting %s." % (filename,)
if not dry: os.remove(filename)
if __name__ == '__main__':
parser = argparse.ArgumentParser(description='Cleanup of leftover raw image files (*.CR2).')
parser.add_argument('--no-backup', '-n', action='store_true',
help='Don\'t backup orphaned raw images - delete them immediately.')
parser.add_argument('--backup-folder', '-b', default='raw_orphans',
help='Folder to move orphaned raw images to.')
parser.add_argument('--tolerant', '-t', action='store_true',
help='Accept JPEGs that just start with the name of the raw image as a match too.')
parser.add_argument('--quiet', '-q', action='store_true',
help='Silence the less important output of this tool.')
parser.add_argument('--dry', '-d', action='store_true',
help='Dry run: Only show what the tool would do without actually executing.')
parser.add_argument('folder', metavar='CHECK_FOLDER', default='./', nargs='?',
help='Folder to check for raw images. Defaults to the current working directory')
args = parser.parse_args()
verbose = not args.quiet
raw_images, jpeg_images_bare_names = [], []
all_files = list(os.listdir(args.folder))
# sort files into raw and jpeg files
for filename in all_files:
# The file name of raw image ends with .CR2 for Canon EOS cameras
if re.match(r'(.*)\.[cC][rR]2$', filename):
if re.match(r'(.*)\.[jJ][pP][eE]?[gG]$', filename):
# Check if there is a jpeg for each raw image
orphans = []
for raw_image in raw_images:
if args.tolerant:
is_orphan = True
for jpg in jpeg_images_bare_names:
if jpg.startswith(os.path.splitext(raw_image)[0]):
is_orphan = False
if is_orphan:
elif os.path.splitext(raw_image)[0] not in jpeg_images_bare_names:
if len(raw_images) + len(jpeg_images_bare_names) == 0:
if verbose: stderr("No images found. Are you sure you wanted to check '%s' for orphaned RAW images?" %
elif len(raw_images) == 0:
if verbose: print "No RAW images found, but %i JPEGs. Won't do anything now." % (
elif len(orphans) == 0:
if verbose: print "%i RAW images found, and %i JPEGs but no orphans. Won't do anything now." % (
len(raw_images), len(jpeg_images_bare_names))
print "Found %i JPEGs and %i .CR2s. Of those RAW images, %i are orphans and will be removed." % (
len(jpeg_images_bare_names), len(raw_images), len(orphans))
backup_folder = None if args.no_backup else os.path.join(args.folder,args.backup_folder)
delete([os.path.join(args.folder,orphan) for orphan in orphans], backup_folder=backup_folder, verbose=verbose, dry=args.dry)

sirdavy commented Nov 20, 2014

I want to do something similar on my Mac. I want to remove RAW files but keep Orphaned RAW files. I have no idea how to run this script. Do I need to install Github?

Install Instructions:
download the .py file
put the .py file in the folder with your images
Open terminal
navigate to the folder where your images are
type python
double click on the .py file
copy the text in the file
paste the text in terminal

Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment