ewels/find_uncompressed_files.pl

## find_uncompressed_files.pl
#!/usr/bin/perl
use warnings;
use strict;
use Cwd;
use File::Find;
####
# FIND UNCOMPRESSED FILES
# Prints the path of every file larger than 50 MB that file(1) reports as ASCII text (i.e. uncompressed)
# One file path per newline, so output can be piped to other tools, eg:
# perl find_uncompressed_files.pl | xargs gzip
# perl find_uncompressed_files.pl | grep sra
####

# Directory to scan: the first command-line argument, or the current
# working directory when no argument was supplied.
my $dir = defined $ARGV[0] ? $ARGV[0] : getcwd();

# Walk the tree below $dir, handing every entry to the callback.
find(\&print_large_uncompressed, $dir);

# Callback for File::Find's find(): prints $File::Find::name, followed by a
# newline, when the current entry is a regular file larger than 50mb whose
# file(1) description contains "ASCII text".
#
# Takes no arguments. The entry to inspect is read from $_, which File::Find
# sets to the entry's name inside the directory it is currently visiting.
sub print_large_uncompressed {
	my $entry = $_;

	# 52428800 bytes = 50 * 1024 * 1024. The -f test keeps directories and
	# other non-regular entries from being handed to file(1); "_" reuses
	# the stat result of that -f test.
	return unless -f $entry && (-s _) > 52428800;

	# List-form pipe open: the name is passed to file(1) as a single argument
	# and never goes through a shell, so spaces, quotes and shell
	# metacharacters in file names are harmless. "--" stops a leading "-"
	# from being read as an option, and "-b" leaves the file name out of the
	# output so a name containing "ASCII text" cannot cause a false match.
	open(my $file_cmd, '-|', 'file', '-b', '--', $entry) or do {
		warn "Could not run file(1) on $File::Find::name: $!\n";
		return;
	};
	my $description = do { local $/; <$file_cmd> };
	close($file_cmd);

	if (defined $description && index($description, "ASCII text") != -1) {
		print $File::Find::name . "\n";
	}
	return;
}
	#/usr/bin/perl
	use warnings;
	use strict;
	use Cwd;
	use File::Find;
	####
	# FIND UNCOMPRESSED FILES
	# Prints the full path of any files larger than 50mb which are uncompressed
	# One file path per newline, so output can be piped to other tools, eg:
	# perl find_uncompressed_files.pl | xargs gzip
	# perl find_uncompressed_files.pl | grep sra
	####

	# Start directory: taken from the first command-line argument; falls
	# back to the current working directory when none was given.
	my ($dir) = @ARGV;
	$dir = getcwd() unless defined $dir;

	# Traverse everything below $dir, invoking the callback per entry.
	find(\&print_large_uncompressed, $dir);

	# Callback for File::Find's find(): prints $File::Find::name, followed by
	# a newline, when the current entry is a regular file larger than 50mb
	# whose file(1) description contains "ASCII text".
	#
	# Takes no arguments. The entry to inspect is read from $_, which
	# File::Find sets to the entry's name inside the directory it is
	# currently visiting.
	sub print_large_uncompressed {
		my $entry = $_;

		# 52428800 bytes = 50 * 1024 * 1024. The -f test keeps directories
		# and other non-regular entries from being handed to file(1); "_"
		# reuses the stat result of that -f test.
		return unless -f $entry && (-s _) > 52428800;

		# List-form pipe open: the name is passed to file(1) as a single
		# argument and never goes through a shell, so spaces, quotes and
		# shell metacharacters in file names are harmless. "--" stops a
		# leading "-" from being read as an option, and "-b" leaves the file
		# name out of the output so a name containing "ASCII text" cannot
		# cause a false match.
		open(my $file_cmd, '-|', 'file', '-b', '--', $entry) or do {
			warn "Could not run file(1) on $File::Find::name: $!\n";
			return;
		};
		my $description = do { local $/; <$file_cmd> };
		close($file_cmd);

		if (defined $description && index($description, "ASCII text") != -1) {
			print $File::Find::name . "\n";
		}
		return;
	}