# AlaaALatif/tabulate_variants.py

## tabulate_variants.py
import bjorn_support as bs
import mutations as bm


# Script overview: align the input FASTA, load the resulting alignment, then
# identify insertions, substitutions and deletions for each sample.

# FASTA must include reference NC_045512.2 (e.g. use cat to add the reference)
fasta_filepath = '/valhalla/2021-02-08_release/msa/2021-02-08_release.fa'
# specify name for output alignment
msa_filepath = 'msa.fa'
# run alignment (uses MAFFT but can be changed from bjorn_support.py)
bs.align_fasta(fasta_filepath, msa_filepath)
# load alignment
msa_data = bs.load_fasta(msa_filepath, is_aligned=True)
# identify variants for each sample
# must identify insertions before anything else, otherwise information is lost
try:
    # Only the first element of the returned pair is kept; the second is unused here.
    insertions, _ = bm.identify_insertions_per_sample(msa_data)
except Exception:
    # Best-effort step: if insertion identification fails, continue without
    # insertions. `Exception` (rather than a bare `except`) lets
    # KeyboardInterrupt and SystemExit propagate so the run can still be aborted.
    insertions = None
substitutions, _ = bm.identify_replacements_per_sample(msa_data)
deletions, _ = bm.identify_deletions_per_sample(msa_data)