## AntumDeluge/cleanwhitespace.py

## cleanwhitespace.py
#!/usr/bin/env python

## The MIT License (MIT)
#
#  Copyright © 2022 Jordan Irwin (AntumDeluge)
#
#  Permission is hereby granted, free of charge, to any person obtaining a copy of
#  this software and associated documentation files (the "Software"), to deal in
#  the Software without restriction, including without limitation the rights to
#  use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies
#  of the Software, and to permit persons to whom the Software is furnished to do
#  so, subject to the following conditions:
#
#    The above copyright notice and this permission notice shall be included in
#    all copies or substantial portions of the Software.
#
#  THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
#  IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
#  FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
#  AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
#  LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
#  OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
## SOFTWARE.

import os, sys, errno, platform, codecs, traceback
from enum import Enum


## Converts a value to its string representation.
#
#  Tuples & lists are rendered element by element, any other value is
#  passed through <code>str</code>.
#
#  @param t
#      Value to be converted.
#  @param[opt] delim
#      If set, the elements of a tuple/list are joined with this delimiter
#      & no enclosing brackets are added. Otherwise elements are separated
#      by a comma & wrapped in "()" (tuple) or "[]" (list).
#  @return
#      String representation of <code>t</code>.
def toString(t, delim=None):
	if not isinstance(t, (tuple, list)):
		# always hand back a string so callers can safely concatenate the result
		return str(t)

	items = [str(v) for v in t]
	if delim is not None:
		return delim.join(items)

	if isinstance(t, list):
		return "[" + ",".join(items) + "]"

	return "(" + ",".join(items) + ")"

## Debugging output level.
#
#  Members are ordered from least (0) to most (5) verbose, their integer
#  values are what gets compared when deciding if a message is shown.
class Level(Enum):
	SILENT = 0
	ERROR = 1
	WARN = 2
	INFO = 3
	DEBUG = 4
	VERBOSE = 5

## Message printing/logging.
#
#  Nothing is written when either the message level or the configured
#  level ("level" entry of the global options) is SILENT, or when the
#  message level is higher than the configured level.
#
#  @param msg
#      Message to be printed to console. A single newline is written if
#      omitted, values other than strings are converted with toString.
#  @param lvl
#      Debugging level as Level member or integer (default: INFO).
def log(msg=None, lvl=Level.INFO):
	# levels may be given as Level members or as plain integers
	msg_level = lvl if type(lvl) is int else lvl.value
	if msg_level == Level.SILENT.value:
		return

	threshold = options["level"]
	if type(threshold) is not int:
		threshold = threshold.value

	if threshold == Level.SILENT.value or msg_level > threshold:
		return

	# write newline for empty messages
	if msg is None:
		sys.stdout.write("\n")
		return

	text = msg if type(msg) is str else toString(msg)

	# errors are the only messages sent to stderr
	if msg_level == Level.ERROR.value:
		stream, prefix = sys.stderr, "ERROR: "
	elif msg_level == Level.WARN.value:
		stream, prefix = sys.stdout, "WARNING: "
	else:
		stream, prefix = sys.stdout, ""

	stream.write(prefix + text + "\n")

# oldest Python version this script supports
ver_py_min = (3, 0, 0)
# sys.version_info always holds integers, unlike platform.python_version_tuple
# whose last item can carry a release suffix (e.g. "0rc1") that int() rejects
ver_py = tuple(sys.version_info[:3])

if ver_py < ver_py_min:
	# written directly to stderr: log() reads the global options which are
	# not defined yet at this point
	sys.stderr.write("\nERROR: incompatible Python version " + toString(ver_py, ".")
		+ "\n  requires version " + toString(ver_py_min, ".") + " or later\n")
	sys.exit(1)

# file name of this script & the directory it is located in
file_exe = os.path.basename(__file__)
dir_tools = os.path.normpath(os.path.dirname(__file__))
# directory the script was executed from
dir_root = os.getcwd()

# values used when "scount" & "level" are not set on the command line
scount_default = 4
level_default = Level.INFO

# flag type options (all disabled unless given on the command line)
flags = dict.fromkeys(("help", "fake", "convert-le", "notrail", "nolead"), False)

# all available parameters ("None" denotes parameter is required)
options = {
	"dirs": None,
	"filetypes": None,
	"scount": scount_default,
	"level": level_default.value,
}

# add flags to all parameters
options.update(flags)

# alternative shorthands for parameters
short_options = dict(
	h="help",
	d="dirs",
	f="filetypes",
	s="scount",
	x="fake",
	l="level",
)

## Types of values a command line option can hold.
#
#  Each member is defined by a tuple of (identifier, description). The
#  identifier is what gets compared against the name of a builtin type or
#  against the identifier of another member.
class OptType(Enum):
	NONE = ("none", "")
	FLAG = ("flag", "")
	BOOL = ("bool", "")
	STRING = ("string", "")
	LIST = ("list", "")
	INT = ("int", "")

	## Stores identifier & description of the member.
	#
	#  @param identifier
	#      Short name identifying the type.
	#  @param description
	#      Descriptive text of the type.
	def __init__(self, identifier, description):
		# kept in "__name__" so members & builtin types expose their name
		# through the same attribute
		self.__name__ = identifier
		self.desc = description

	## Makes the "==" operator behave like "equals".
	#
	#  Objects that have no name cannot be matched, Python's default
	#  comparison is used for those.
	def __eq__(self, other):
		if getattr(other, "__name__", None) is None:
			return NotImplemented

		return self.equals(other)

	# a class that defines __eq__ loses the inherited hash, this restores it
	# so members can still be used in sets & as dictionary keys
	def __hash__(self):
		return hash(self.__name__)

	## Checks if a type or another member denotes the same option type.
	#
	#  @param other
	#      Builtin type (e.g. <code>int</code>) or OptType member.
	#  @return
	#      <code>True</code> if the names match.
	def equals(self, other):
		if other is tuple or other is list:
			# treat tuples & lists the same
			other_id = "list"
		elif other is str:
			# name of the builtin ("str") differs from the identifier used here
			other_id = "string"
		else:
			other_id = getattr(other, "__name__", None)

		return other_id == self.__name__

	## Retrieves the identifier of the member.
	def getId(self):
		return self.__name__

	## Retrieves the description of the member.
	def getDescription(self):
		return self.desc

	## Determines the type of a command line option.
	#
	#  @param opt
	#      Long name of the option.
	#  @return
	#      NONE for unknown options, FLAG for options listed in the global
	#      flags, otherwise the member that matches the type of the option's
	#      current value (LIST if the option has no value).
	@staticmethod
	def getOptionType(opt):
		if opt not in options:
			return OptType.NONE

		if opt in flags:
			return OptType.FLAG

		val = options[opt]

		# default to list
		if val is None:
			return OptType.LIST

		for t in OptType:
			if t.equals(type(val)):
				return t

		return OptType.NONE

	## Converts a value to boolean.
	#
	#  @param val
	#      Boolean (returned unchanged) or text to be interpreted.
	#  @return
	#      <code>True</code> for "y", "yes" or "true" (case-insensitive).
	@staticmethod
	def toBoolean(val):
		if isinstance(val, bool):
			return val

		# str() keeps values that are not text from raising AttributeError
		return str(val).lower() in ("y", "yes", "true")

	## Converts a value to integer (raises ValueError for non-numeric text).
	@staticmethod
	def toInt(val):
		return int(val)


## Names of options that must be supplied by the user.
#
#  Taken from the defaults in the global options, where "None" denotes a
#  required parameter. This has to be evaluated before any command line
#  arguments are stored in the options.
req_options = tuple(name for name in options if options[name] is None)

## Checks if an option must be supplied on the command line.
#
#  @param opt
#      Long name of the option.
#  @return
#      <code>True</code> if the option has no default value.
def optionIsRequired(opt):
	return opt in req_options

## Stores the value of an option in the global options.
#
#  @param opt
#      Long name of the option.
#  @param value
#      Value to be stored.
def setOption(opt, value):
	options.update({opt: value})

## Displays usage help text.
#
#  The text is written with log at the default level.
def showUsage():
	usage = (
		"",
		"Usage:",
		# "dirs" has no default value so it is always required
		"  {} -d <dirs>[ -f <filetypes>][ <flags>]".format(file_exe),
		"  {} -h".format(file_exe),
		"",
		"Options:",
		"  -f|--filetypes:\tComma-separated list of filename extensions to parse"
			+ " (required unless -d is a single file).",
		"  -d|--dirs:\t\tComma-separated list of directories to search (or a single file).",
		"  -s|--scount:\t\tNumber of leading spaces to replace with tab"
			+ " (default: {}).".format(scount_default),
		"  -l|--level:\t\tLogging level (default: {}).".format(level_default.value),
		"",
		"Flags:",
		"  -h|--help:\t\tShow usage information.",
		"  -x|--fake:\t\tSimulate (don't apply changes).",
		"  --convert-le:\t\tConvert CR/CRLF line endings to LF.",
		"  --nolead:\t\tDon't replace leading spaces with tabs.",
		"  --notrail:\t\tDon't clean trailing whitespace.",
	)

	log("\n".join(usage))

## Displays an error message & exits the process.
#
#  @param code
#      Exit code to use.
#  @param msg
#      Message to display.
#  @param[opt] usage
#      If <code>True</code>, shows usage information before exiting.
def exitWithError(code, msg, usage=True):
	# a call without message writes a single newline
	log()
	log(msg, Level.ERROR)

	if usage:
		showUsage()

	# same effect as sys.exit(code)
	raise SystemExit(code)

## Compatibility function for case matching in different Python versions.
#
#  @param match
#      The statement to be compared.
#  @param cases
#      Cases to be checked.
#  @param[opt] default
#      Value to use if no case matches.
#  @return
#      Value of the matching case. Without a matching case the default is
#      returned or, if there is no default, the compared statement itself.
def switch(match, cases, default=None):
	if match not in cases:
		return match if default is None else default

	return cases[match]

## Converts the raw text of an option value to the type the option expects.
#
#  @param otype
#      Type of the option (OptType member).
#  @param raw
#      Text taken from the command line.
#  @return
#      Converted value, text for any other type is returned unchanged.
def _convertOptionValue(otype, raw):
	if otype is OptType.BOOL:
		return OptType.toBoolean(raw)

	if otype is OptType.INT:
		# raises ValueError for non-numeric text, handled by the caller
		return OptType.toInt(raw)

	if otype is OptType.LIST:
		# drop empty entries left behind by stray commas (e.g. "py,,txt")
		return tuple(item for item in raw.split(",") if item)

	return raw

## Parses command line arguments & sets up file & directory options.
#
#  Recognized values are stored in the global options. The process exits
#  with an error message for malformed, unknown or incomplete arguments.
#
#  @param args
#      List of args to parse.
#  @param[opt] flags
#      <code>True</code> while parsing the members of a group of short
#      arguments (e.g. "-xh"), only flag type arguments are accepted then.
def parseArgs(args, flags=False):
	idx = 0
	while idx < len(args):
		raw_arg = args[idx]
		cur_arg = raw_arg.lstrip("-")
		lead = len(raw_arg) - len(cur_arg)

		# short form has exactly one dash in total, long form has exactly
		# two leading dashes (more dashes may follow within the name)
		s_arg = lead == 1 and raw_arg.count("-") == 1
		l_arg = lead == 2

		# all accepted arguments use a switch ("-"), this also rejects empty text
		if not (s_arg or l_arg):
			exitWithError(errno.EINVAL, "malformatted argument: {}".format(raw_arg))

		if s_arg:
			if len(cur_arg) > 1:
				# parse individual short args that are grouped together
				parseArgs(["-" + c for c in cur_arg], True)
				idx = idx + 1
				continue

			cur_arg = switch(cur_arg, short_options)

		if cur_arg not in options:
			exitWithError(errno.EINVAL, "unknown argument: {}".format(cur_arg))

		otype = OptType.getOptionType(cur_arg)

		if otype is OptType.FLAG:
			options[cur_arg] = True
			idx = idx + 1
			continue

		if flags:
			exitWithError(1, "argument \"{}\" is not a flag type & cannot be grouped".format(cur_arg))

		# the value is located at the next index & must not be another switch
		if idx + 1 >= len(args) or args[idx + 1].startswith("-"):
			exitWithError(1, "argument \"{}\" requires a value".format(cur_arg))

		raw_val = args[idx + 1]
		try:
			val = _convertOptionValue(otype, raw_val)
		except ValueError:
			exitWithError(1, "invalid value for argument \"{}\": {}".format(cur_arg, raw_val))

		# a list made up of nothing but commas holds no usable value
		if otype is OptType.LIST and not val:
			exitWithError(1, "argument \"{}\" requires a value".format(cur_arg))

		options[cur_arg] = val
		# skip the option & its value
		idx = idx + 2

# the script cannot do anything without arguments
if len(sys.argv) == 1:
	exitWithError(1, "missing parameters")

parseArgs(sys.argv[1:])

if options["help"]:
	showUsage()
	sys.exit(0)

in_paths = options["dirs"]
# a lone path that points to a regular file is cleaned directly
single_file = bool(in_paths) and len(in_paths) == 1 and os.path.isfile(in_paths[0])

# options that still hold "None" were required but not supplied
for opt, value in options.items():
	# file types are only needed to filter the contents of directories
	if value is None and not (single_file and opt == "filetypes"):
		exitWithError(1, "missing required argument: {}".format(opt))


# the actual work

apply_changes = not options["fake"]
if not apply_changes:
	log("\nsimulation run, changes will not be applied\n")

scount = options["scount"]
# a count below 1 results in an empty prefix which cannot be searched for
if scount < 1:
	exitWithError(1, "scount must be a positive number: {}".format(scount))

# run of spaces that gets replaced by a single tab
spaces_prefix = " " * scount

## Replaces runs of spaces in the leading whitespace of a line with tabs.
#
#  Whitespace that follows the first visible character is left untouched.
#
#  @param line
#      Line of text (without line ending).
#  @param[opt] prefix
#      Run of spaces that is replaced by one tab (default: the global
#      spaces prefix built from the "scount" option).
#  @return
#      Line with its leading whitespace converted.
def replaceLeadingSpaces(line, prefix=None):
	if prefix is None:
		prefix = spaces_prefix

	content = line.lstrip()
	indent = line[:len(line) - len(content)]

	# an empty prefix matches nothing useful (str.split would raise ValueError)
	if prefix:
		indent = indent.replace(prefix, "\t")

	return indent + content


# number of files whose contents differ after cleaning (counted in
# simulation runs as well)
cleaned_count = 0

## Cleans the whitespace of a single file.
#
#  Trailing whitespace is removed & leading spaces are replaced with tabs
#  unless disabled by the "notrail"/"nolead" options. Line endings are
#  preserved unless the "convert-le" option is set. The file is only
#  rewritten if its contents changed & this is not a simulation run. The
#  process exits if the file cannot be read, decoded as UTF-8 or written.
#
#  @param f
#      Path to the file.
def checkFile(f):
	# assigning to the module level counter requires the "global" declaration
	global cleaned_count

	try:
		# newline="" disables newline translation so the original line
		# endings can be detected & preserved
		with open(f, "r", encoding="utf-8", newline="") as buffer:
			st_orig = buffer.read()
	except UnicodeDecodeError:
		exitWithError(1,
			"could not read file {}, please check that it is a text file".format(f),
			False)
	except OSError:
		exitWithError(1, "could not open file for reading: {}".format(f), False)

	# line endings to be written to output
	le = "\n"
	le_name = "LF"
	preserve_le = not options["convert-le"]

	# ensure we are working with LF line endings
	contents = st_orig
	if "\r\n" in contents:
		contents = contents.replace("\r\n", "\n")
		if preserve_le:
			le, le_name = "\r\n", "CRLF"
	# any carriage return left at this point is a bare CR line ending
	if "\r" in contents:
		contents = contents.replace("\r", "\n")
		if preserve_le:
			le, le_name = "\r", "CR"

	strip_trailing = not options["notrail"]
	replace_leading = not options["nolead"]

	contents_new = []
	for num, line_orig in enumerate(contents.split("\n"), 1):
		line = line_orig

		if strip_trailing:
			# clean trailing whitespace
			line = line.rstrip()

		if replace_leading:
			# replace leading spaces with tabs
			line = replaceLeadingSpaces(line)

		if line != line_orig:
			log("cleaned line {} ({})".format(num, f), Level.DEBUG)

		contents_new.append(line)

	if le != "\n":
		log("preserving line endings \"{}\" in file: {}".format(le_name, f), Level.DEBUG)
	st_new = le.join(contents_new)

	if st_new == st_orig:
		return

	if apply_changes:
		try:
			with open(f, "w", encoding="utf-8", newline="") as buffer:
				buffer.write(st_new)
		except (OSError, UnicodeError):
			exitWithError(1, "error while opening file for writing: {}\n{}"
				.format(f, traceback.format_exc()), False)

	cleaned_count = cleaned_count + 1
	log("updated file: {}".format(f))


if single_file:
	checkFile(in_paths[0])
else:
	# check that all directories exist before doing anything
	for d in in_paths:
		if not os.path.isdir(d):
			exitWithError(errno.ENOENT, "file or directory not found: {}".format(d))

	# file types are accepted with or without leading dot (".py" or "py")
	filetypes = set(ft.lstrip(".") for ft in options["filetypes"] if ft.lstrip("."))

	for d in in_paths:
		for ROOT, DIRS, FILES in os.walk(d):
			for FILE in FILES:
				# only the file name is examined so dots in directory names
				# cannot be mistaken for the start of an extension
				if "." not in FILE:
					continue

				if FILE.rpartition(".")[2] in filetypes:
					checkFile(os.path.join(ROOT, FILE))


log("\ncleaned {} files".format(cleaned_count))
	#!/usr/bin/env python

	## The MIT License (MIT)
	#
	# Copyright © 2022 Jordan Irwin (AntumDeluge)
	#
	# Permission is hereby granted, free of charge, to any person obtaining a copy of
	# this software and associated documentation files (the "Software"), to deal in
	# the Software without restriction, including without limitation the rights to
	# use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies
	# of the Software, and to permit persons to whom the Software is furnished to do
	# so, subject to the following conditions:
	#
	# The above copyright notice and this permission notice shall be included in
	# all copies or substantial portions of the Software.
	#
	# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
	# IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
	# FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
	# AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
	# LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
	# OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
	## SOFTWARE.

	import os, sys, errno, platform, codecs, traceback
	from enum import Enum


	## Converts a value to its string representation.
	#
	#  Tuples & lists are rendered element by element, any other value is
	#  passed through <code>str</code>.
	#
	#  @param t
	#      Value to be converted.
	#  @param[opt] delim
	#      If set, the elements of a tuple/list are joined with this delimiter
	#      & no enclosing brackets are added. Otherwise elements are separated
	#      by a comma & wrapped in "()" (tuple) or "[]" (list).
	#  @return
	#      String representation of <code>t</code>.
	def toString(t, delim=None):
		if not isinstance(t, (tuple, list)):
			# always hand back a string so callers can safely concatenate the result
			return str(t)

		items = [str(v) for v in t]
		if delim is not None:
			return delim.join(items)

		if isinstance(t, list):
			return "[" + ",".join(items) + "]"

		return "(" + ",".join(items) + ")"

	## Debugging output level.
	#
	#  Members are ordered from least (0) to most (5) verbose, their integer
	#  values are what gets compared when deciding if a message is shown.
	class Level(Enum):
		SILENT = 0
		ERROR = 1
		WARN = 2
		INFO = 3
		DEBUG = 4
		VERBOSE = 5

	## Message printing/logging.
	#
	#  Nothing is written when either the message level or the configured
	#  level ("level" entry of the global options) is SILENT, or when the
	#  message level is higher than the configured level.
	#
	#  @param msg
	#      Message to be printed to console. A single newline is written if
	#      omitted, values other than strings are converted with toString.
	#  @param lvl
	#      Debugging level as Level member or integer (default: INFO).
	def log(msg=None, lvl=Level.INFO):
		# levels may be given as Level members or as plain integers
		msg_level = lvl if type(lvl) is int else lvl.value
		if msg_level == Level.SILENT.value:
			return

		threshold = options["level"]
		if type(threshold) is not int:
			threshold = threshold.value

		if threshold == Level.SILENT.value or msg_level > threshold:
			return

		# write newline for empty messages
		if msg is None:
			sys.stdout.write("\n")
			return

		text = msg if type(msg) is str else toString(msg)

		# errors are the only messages sent to stderr
		if msg_level == Level.ERROR.value:
			stream, prefix = sys.stderr, "ERROR: "
		elif msg_level == Level.WARN.value:
			stream, prefix = sys.stdout, "WARNING: "
		else:
			stream, prefix = sys.stdout, ""

		stream.write(prefix + text + "\n")

	# oldest Python version this script supports
	ver_py_min = (3, 0, 0)
	# sys.version_info always holds integers, unlike platform.python_version_tuple
	# whose last item can carry a release suffix (e.g. "0rc1") that int() rejects
	ver_py = tuple(sys.version_info[:3])

	if ver_py < ver_py_min:
		# written directly to stderr: log() reads the global options which are
		# not defined yet at this point
		sys.stderr.write("\nERROR: incompatible Python version " + toString(ver_py, ".")
			+ "\n  requires version " + toString(ver_py_min, ".") + " or later\n")
		sys.exit(1)

	# file name of this script & the directory it is located in
	file_exe = os.path.basename(__file__)
	dir_tools = os.path.normpath(os.path.dirname(__file__))
	# directory the script was executed from
	dir_root = os.getcwd()

	# values used when "scount" & "level" are not set on the command line
	scount_default = 4
	level_default = Level.INFO

	# flag type options (all disabled unless given on the command line)
	flags = {
		"help": False,
		"fake": False,
		"convert-le": False,
		"notrail": False,
		"nolead": False,
	}

	# all available parameters ("None" denotes parameter is required)
	options = {
		"dirs": None,
		"filetypes": None,
		"scount": scount_default,
		"level": level_default.value,
	}

	# add flags to all parameters
	options.update(flags)

	# alternative shorthands for parameters
	short_options = {
		"h": "help",
		"d": "dirs",
		"f": "filetypes",
		"s": "scount",
		"x": "fake",
		"l": "level",
	}

	## Types of values a command line option can hold.
	#
	#  Each member is defined by a tuple of (identifier, description). The
	#  identifier is what gets compared against the name of a builtin type or
	#  against the identifier of another member.
	class OptType(Enum):
		NONE = ("none", "")
		FLAG = ("flag", "")
		BOOL = ("bool", "")
		STRING = ("string", "")
		LIST = ("list", "")
		INT = ("int", "")

		## Stores identifier & description of the member.
		#
		#  @param identifier
		#      Short name identifying the type.
		#  @param description
		#      Descriptive text of the type.
		def __init__(self, identifier, description):
			# kept in "__name__" so members & builtin types expose their name
			# through the same attribute
			self.__name__ = identifier
			self.desc = description

		## Makes the "==" operator behave like "equals".
		#
		#  Objects that have no name cannot be matched, Python's default
		#  comparison is used for those.
		def __eq__(self, other):
			if getattr(other, "__name__", None) is None:
				return NotImplemented

			return self.equals(other)

		# a class that defines __eq__ loses the inherited hash, this restores it
		# so members can still be used in sets & as dictionary keys
		def __hash__(self):
			return hash(self.__name__)

		## Checks if a type or another member denotes the same option type.
		#
		#  @param other
		#      Builtin type (e.g. <code>int</code>) or OptType member.
		#  @return
		#      <code>True</code> if the names match.
		def equals(self, other):
			if other is tuple or other is list:
				# treat tuples & lists the same
				other_id = "list"
			elif other is str:
				# name of the builtin ("str") differs from the identifier used here
				other_id = "string"
			else:
				other_id = getattr(other, "__name__", None)

			return other_id == self.__name__

		## Retrieves the identifier of the member.
		def getId(self):
			return self.__name__

		## Retrieves the description of the member.
		def getDescription(self):
			return self.desc

		## Determines the type of a command line option.
		#
		#  @param opt
		#      Long name of the option.
		#  @return
		#      NONE for unknown options, FLAG for options listed in the global
		#      flags, otherwise the member that matches the type of the option's
		#      current value (LIST if the option has no value).
		@staticmethod
		def getOptionType(opt):
			if opt not in options:
				return OptType.NONE

			if opt in flags:
				return OptType.FLAG

			val = options[opt]

			# default to list
			if val is None:
				return OptType.LIST

			for t in OptType:
				if t.equals(type(val)):
					return t

			return OptType.NONE

		## Converts a value to boolean.
		#
		#  @param val
		#      Boolean (returned unchanged) or text to be interpreted.
		#  @return
		#      <code>True</code> for "y", "yes" or "true" (case-insensitive).
		@staticmethod
		def toBoolean(val):
			if isinstance(val, bool):
				return val

			# str() keeps values that are not text from raising AttributeError
			return str(val).lower() in ("y", "yes", "true")

		## Converts a value to integer (raises ValueError for non-numeric text).
		@staticmethod
		def toInt(val):
			return int(val)


	## Names of options that must be supplied by the user.
	#
	#  Taken from the defaults in the global options, where "None" denotes a
	#  required parameter. This has to be evaluated before any command line
	#  arguments are stored in the options.
	req_options = tuple(name for name in options if options[name] is None)

	## Checks if an option must be supplied on the command line.
	#
	#  @param opt
	#      Long name of the option.
	#  @return
	#      <code>True</code> if the option has no default value.
	def optionIsRequired(opt):
		return opt in req_options

	## Stores the value of an option in the global options.
	#
	#  @param opt
	#      Long name of the option.
	#  @param value
	#      Value to be stored.
	def setOption(opt, value):
		options[opt] = value

	## Displays usage help text.
	#
	#  The text is written with log at the default level.
	def showUsage():
		usage = (
			"",
			"Usage:",
			# "dirs" has no default value so it is always required
			"  {} -d <dirs>[ -f <filetypes>][ <flags>]".format(file_exe),
			"  {} -h".format(file_exe),
			"",
			"Options:",
			"  -f|--filetypes:\tComma-separated list of filename extensions to parse"
				+ " (required unless -d is a single file).",
			"  -d|--dirs:\t\tComma-separated list of directories to search (or a single file).",
			"  -s|--scount:\t\tNumber of leading spaces to replace with tab"
				+ " (default: {}).".format(scount_default),
			"  -l|--level:\t\tLogging level (default: {}).".format(level_default.value),
			"",
			"Flags:",
			"  -h|--help:\t\tShow usage information.",
			"  -x|--fake:\t\tSimulate (don't apply changes).",
			"  --convert-le:\t\tConvert CR/CRLF line endings to LF.",
			"  --nolead:\t\tDon't replace leading spaces with tabs.",
			"  --notrail:\t\tDon't clean trailing whitespace.",
		)

		log("\n".join(usage))

	## Displays an error message & exits the process.
	#
	#  @param code
	#      Exit code to use.
	#  @param msg
	#      Message to display.
	#  @param[opt] usage
	#      If <code>True</code>, shows usage information before exiting.
	def exitWithError(code, msg, usage=True):
		# a call without message writes a single newline
		log()
		log(msg, Level.ERROR)

		if usage:
			showUsage()

		sys.exit(code)

	## Compatibility function for case matching in different Python versions.
	#
	#  @param match
	#      The statement to be compared.
	#  @param cases
	#      Cases to be checked.
	#  @param[opt] default
	#      Value to use if no case matches.
	#  @return
	#      Value of the matching case. Without a matching case the default is
	#      returned or, if there is no default, the compared statement itself.
	def switch(match, cases, default=None):
		if match in cases:
			return cases[match]

		if default is not None:
			return default

		return match

	## Converts the raw text of an option value to the type the option expects.
	#
	#  @param otype
	#      Type of the option (OptType member).
	#  @param raw
	#      Text taken from the command line.
	#  @return
	#      Converted value, text for any other type is returned unchanged.
	def _convertOptionValue(otype, raw):
		if otype is OptType.BOOL:
			return OptType.toBoolean(raw)

		if otype is OptType.INT:
			# raises ValueError for non-numeric text, handled by the caller
			return OptType.toInt(raw)

		if otype is OptType.LIST:
			# drop empty entries left behind by stray commas (e.g. "py,,txt")
			return tuple(item for item in raw.split(",") if item)

		return raw

	## Parses command line arguments & sets up file & directory options.
	#
	#  Recognized values are stored in the global options. The process exits
	#  with an error message for malformed, unknown or incomplete arguments.
	#
	#  @param args
	#      List of args to parse.
	#  @param[opt] flags
	#      <code>True</code> while parsing the members of a group of short
	#      arguments (e.g. "-xh"), only flag type arguments are accepted then.
	def parseArgs(args, flags=False):
		idx = 0
		while idx < len(args):
			raw_arg = args[idx]
			cur_arg = raw_arg.lstrip("-")
			lead = len(raw_arg) - len(cur_arg)

			# short form has exactly one dash in total, long form has exactly
			# two leading dashes (more dashes may follow within the name)
			s_arg = lead == 1 and raw_arg.count("-") == 1
			l_arg = lead == 2

			# all accepted arguments use a switch ("-"), this also rejects empty text
			if not (s_arg or l_arg):
				exitWithError(errno.EINVAL, "malformatted argument: {}".format(raw_arg))

			if s_arg:
				if len(cur_arg) > 1:
					# parse individual short args that are grouped together
					parseArgs(["-" + c for c in cur_arg], True)
					idx = idx + 1
					continue

				cur_arg = switch(cur_arg, short_options)

			if cur_arg not in options:
				exitWithError(errno.EINVAL, "unknown argument: {}".format(cur_arg))

			otype = OptType.getOptionType(cur_arg)

			if otype is OptType.FLAG:
				options[cur_arg] = True
				idx = idx + 1
				continue

			if flags:
				exitWithError(1, "argument \"{}\" is not a flag type & cannot be grouped".format(cur_arg))

			# the value is located at the next index & must not be another switch
			if idx + 1 >= len(args) or args[idx + 1].startswith("-"):
				exitWithError(1, "argument \"{}\" requires a value".format(cur_arg))

			raw_val = args[idx + 1]
			try:
				val = _convertOptionValue(otype, raw_val)
			except ValueError:
				exitWithError(1, "invalid value for argument \"{}\": {}".format(cur_arg, raw_val))

			# a list made up of nothing but commas holds no usable value
			if otype is OptType.LIST and not val:
				exitWithError(1, "argument \"{}\" requires a value".format(cur_arg))

			options[cur_arg] = val
			# skip the option & its value
			idx = idx + 2

	# the script cannot do anything without arguments
	if len(sys.argv) == 1:
		exitWithError(1, "missing parameters")

	parseArgs(sys.argv[1:])

	if options["help"]:
		showUsage()
		sys.exit(0)

	single_file = False
	in_paths = options["dirs"]

	# a lone path that points to a regular file is cleaned directly
	if in_paths and len(in_paths) == 1 and os.path.isfile(in_paths[0]):
		single_file = True

	# options that still hold "None" were required but not supplied
	for opt in options:
		# file types are only needed to filter the contents of directories
		if opt == "filetypes" and single_file:
			continue

		if options[opt] is None:
			exitWithError(1, "missing required argument: {}".format(opt))


	# the actual work

	apply_changes = not options["fake"]
	if not apply_changes:
		log("\nsimulation run, changes will not be applied\n")

	scount = options["scount"]
	# a count below 1 results in an empty prefix which cannot be searched for
	if scount < 1:
		exitWithError(1, "scount must be a positive number: {}".format(scount))

	# run of spaces that gets replaced by a single tab
	spaces_prefix = " " * scount

	## Replaces runs of spaces in the leading whitespace of a line with tabs.
	#
	#  Whitespace that follows the first visible character is left untouched.
	#
	#  @param line
	#      Line of text (without line ending).
	#  @param[opt] prefix
	#      Run of spaces that is replaced by one tab (default: the global
	#      spaces prefix built from the "scount" option).
	#  @return
	#      Line with its leading whitespace converted.
	def replaceLeadingSpaces(line, prefix=None):
		if prefix is None:
			prefix = spaces_prefix

		content = line.lstrip()
		indent = line[:len(line) - len(content)]

		# an empty prefix matches nothing useful (str.split would raise ValueError)
		if prefix:
			indent = indent.replace(prefix, "\t")

		return indent + content


	# number of files whose contents differ after cleaning (counted in
	# simulation runs as well)
	cleaned_count = 0

	## Cleans the whitespace of a single file.
	#
	#  Trailing whitespace is removed & leading spaces are replaced with tabs
	#  unless disabled by the "notrail"/"nolead" options. Line endings are
	#  preserved unless the "convert-le" option is set. The file is only
	#  rewritten if its contents changed & this is not a simulation run. The
	#  process exits if the file cannot be read, decoded as UTF-8 or written.
	#
	#  @param f
	#      Path to the file.
	def checkFile(f):
		# assigning to the module level counter requires the "global" declaration
		global cleaned_count

		try:
			# newline="" disables newline translation so the original line
			# endings can be detected & preserved
			with open(f, "r", encoding="utf-8", newline="") as buffer:
				st_orig = buffer.read()
		except UnicodeDecodeError:
			exitWithError(1,
				"could not read file {}, please check that it is a text file".format(f),
				False)
		except OSError:
			exitWithError(1, "could not open file for reading: {}".format(f), False)

		# line endings to be written to output
		le = "\n"
		le_name = "LF"
		preserve_le = not options["convert-le"]

		# ensure we are working with LF line endings
		contents = st_orig
		if "\r\n" in contents:
			contents = contents.replace("\r\n", "\n")
			if preserve_le:
				le, le_name = "\r\n", "CRLF"
		# any carriage return left at this point is a bare CR line ending
		if "\r" in contents:
			contents = contents.replace("\r", "\n")
			if preserve_le:
				le, le_name = "\r", "CR"

		strip_trailing = not options["notrail"]
		replace_leading = not options["nolead"]

		contents_new = []
		for num, line_orig in enumerate(contents.split("\n"), 1):
			line = line_orig

			if strip_trailing:
				# clean trailing whitespace
				line = line.rstrip()

			if replace_leading:
				# replace leading spaces with tabs
				line = replaceLeadingSpaces(line)

			if line != line_orig:
				log("cleaned line {} ({})".format(num, f), Level.DEBUG)

			contents_new.append(line)

		if le != "\n":
			log("preserving line endings \"{}\" in file: {}".format(le_name, f), Level.DEBUG)
		st_new = le.join(contents_new)

		if st_new == st_orig:
			return

		if apply_changes:
			try:
				with open(f, "w", encoding="utf-8", newline="") as buffer:
					buffer.write(st_new)
			except (OSError, UnicodeError):
				exitWithError(1, "error while opening file for writing: {}\n{}"
					.format(f, traceback.format_exc()), False)

		cleaned_count = cleaned_count + 1
		log("updated file: {}".format(f))


	if single_file:
		checkFile(in_paths[0])
	else:
		# check that all directories exist before doing anything
		for d in in_paths:
			if not os.path.isdir(d):
				exitWithError(errno.ENOENT, "file or directory not found: {}".format(d))

		# file types are accepted with or without leading dot (".py" or "py")
		filetypes = set(ft.lstrip(".") for ft in options["filetypes"] if ft.lstrip("."))

		for d in in_paths:
			for ROOT, DIRS, FILES in os.walk(d):
				for FILE in FILES:
					# only the file name is examined so dots in directory names
					# cannot be mistaken for the start of an extension
					if "." not in FILE:
						continue

					if FILE.rpartition(".")[2] in filetypes:
						checkFile(os.path.join(ROOT, FILE))


	log("\ncleaned {} files".format(cleaned_count))