# jrherr/quick random sample of a fasta file

## quick random sample of a fasta file
cat name.fasta |\ # identify file name
awk '/^>/ { if(i>0) printf("\n"); i++; printf("%s\t",$0); next;} {printf("%s",$0);} END { printf("\n");}' |\ # read data
perl -MList::Util -e 'print List::Util::shuffle <>' |\  # random sample of sequences with shuffle
head -n 50000 |\ # break fasta file into sections of 50000 sequences in length
awk '{printf("%s\n%s\n",$1,$2)}' > name_1.fasta  # write sequence output
	cat name.fasta \|\ # identify file name
	awk '/^>/ { if(i>0) printf("\n"); i++; printf("%s\t",$0); next;} {printf("%s",$0);} END { printf("\n");}' \|\ # read data
	perl -MList::Util -e 'print List::Util::shuffle <>' \|\ # random sample of sequences with shuffle
	head -n 50000 \|\ # break fasta file into sections of 50000 sequences in length
	awk '{printf("%s\n%s\n",$1,$2)}' > name_1.fasta # write sequence output