Skip to content

Instantly share code, notes, and snippets.

@adamwespiser
Created November 18, 2012 08:37
Show Gist options
  • Star 0 You must be signed in to star a gist
  • Fork 0 You must be signed in to fork a gist
  • Save adamwespiser/4104276 to your computer and use it in GitHub Desktop.
Save adamwespiser/4104276 to your computer and use it in GitHub Desktop.
Solution to rosalind's "corr" problem
Solution to rosalind's "CORR" problem.
http://rosalind.info/problems/corr/
The problem is:
Given a collection of reads (all of the same length), each read is either:
1) Correct: it is identical to another read in the collection, or to that read's reverse complement.
2) Incorrect due to a point mutation: exactly one base differs between the read and a correct read (Hamming distance = 1).
report incorrect reads and their correct counterparts.
There is a strong assumption that a read must be either correct or incorrect, and that all incorrect reads map to at least one correct read.
import string
import itertools
from optparse import OptionParser
import corrLib
def readInDnaSequence(fileName):
    """Read DNA reads from a text file, one read per line.

    Every line of the file is stripped of surrounding whitespace and
    wrapped in a ``corrLib.Dna`` built from its zero-based line number and
    the stripped text.  The input is expected to hold raw sequence only
    (no annotation, [ATCG] characters); nothing here validates that.

    fileName -- path of the file to read.

    Returns the list of ``corrLib.Dna`` objects in file order.
    """
    # The context manager closes the handle even if constructing a Dna
    # raises part-way through the file.
    with open(fileName, 'r') as handle:
        return [corrLib.Dna(index, line.strip())
                for index, line in enumerate(handle)]
def main():
    """Run the CORR solution on the file given by the '-f/--file' option.

    Steps:
      1. Read every sequence from the input file.
      2. Call ``setPairFound`` on every ordered pair of sequences, after
         which each sequence's ``pair`` attribute is used to decide whether
         it has a match.
      3. For each sequence without a match, scan the matched sequences and,
         at the first one for which ``oneErrorMatch`` is true, call
         ``reportOneErrorMatch`` and move on to the next sequence.

    Exits with a usage error if no input file is supplied.
    """
    parser = OptionParser()
    parser.add_option("-f", "--file")
    options, _ = parser.parse_args()
    if options.file is None:
        # Without this check open(None) fails with an unhelpful TypeError.
        parser.error("an input file is required (-f/--file)")

    seqs = readInDnaSequence(options.file)

    # O(n^2): let every sequence inspect every sequence so that each one
    # can record whether it has a full match.
    for s, t in itertools.product(seqs, repeat=2):
        s.setPairFound(t)

    # Split into matched / unmatched.  These must be real lists: on
    # Python 3 filter() yields a one-shot iterator, which the nested loop
    # below would exhaust after the first unmatched sequence.
    # The explicit ==True / ==False comparisons are kept from the original
    # because the type of ``pair`` is defined in corrLib, not here.
    seqsWithMatch = [x for x in seqs if x.pair == True]
    seqsNoMatch = [x for x in seqs if x.pair == False]

    # For each unmatched sequence, find the first matched sequence that
    # oneErrorMatch accepts and report it.
    for s in seqsNoMatch:
        for t in seqsWithMatch:
            if s.oneErrorMatch(t):
                s.reportOneErrorMatch()
                break
# Run the solver only when this file is executed as a script, not on import.
if __name__ == "__main__":
    main()
AAATAGCCCCCACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTG
TGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCT
TACGTTTAAGGCCCTGTGCATTAAGCCGGCCATGAGTCGTAAGCCGCATA
TATGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCAT
ATATGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCA
CAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCA
TTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCATG
CGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAG
ACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATT
CGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGG
AAGCCATATGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTA
TTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTACACGGGATAACT
GCGGCTTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTC
CGTTAGGCGGCCAACTAAATCAAGAACGTGCACGGGATAACTTCATATGG
TCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAATACGAGTAAGGC
TGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTCGTAAGCC
AAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCA
AATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGG
ATTGCAACCATTTTCATGCTGGGTGGTGGCTATATGAGATGCGTTAGGCG
AAATAGCCACCACCCAGCATTAAAATGGTTGCAATACGTGTAAGGCCCTG
ACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCAT
GGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTG
CTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATG
TGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCATAT
GCCATATGAAGTTATCCCGTGCAGGTTCTTGATTTATTTGGCCGCCTAAC
GACATATGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAAC
CACCACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTA
GTATTGCAACCATTTTCATGCTGGGTGGTGGCTATATGAGATGCGTTAGG
GGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGACATGAGTCGTAA
TCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGC
CCCGTGCAGGTTCTTGATTTAGTTGGCCGGCTAACGCATCTCAAATAGCC
TAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCATATGGCTT
TTAGGCGGCCAACTAAATCAAGAACCTGCAGGGGATAACTTCATATGGCT
ACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCAT
GCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAATGGGTGCAATA
TATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATA
GCTGGGTGGTGGCTATTTGAGATGCGTTAGGAGGCCAACTAAATCAAGAA
GCAAAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTA
TTGAGATGCGTTAGGCGGCCAACTAAATCCAGAACCTGCACGGGATAACT
GGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCT
CCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACT
TTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCCGCATGAAAA
GGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCATATGGCTTCA
CAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACC
GGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTACAC
GTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGC
CACCCAGCAGGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGC
CTATTTGAGATGCGTTAGGCGGCCAACTAAATTAAGAACCTGCACGGGAT
CGAGTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATT
ACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAAC
GGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCATATGGCTTCA
GGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTG
CGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAG
GCATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGG
TGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGC
TTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAAC
CGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCC
ATGAAAATGGTTGCAATACGTGTAAGGCCCGGTGCATTAAGCCGGCCATG
GACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTT
ACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATT
GATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCAT
ATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAG
GGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAAGTAAATCAAGAACCTG
CTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATG
ACGTATTGCATCCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTA
GATGCGTTAGGAGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCAT
ATAGCCACCACCCAGCATGACAATGGTTGCAATACGTGTAAGGCCCTGTG
ACGCATCTCAAATAGCCACCACCCAGCATGAAAATGGATGCAATACGTGT
TTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAAT
CTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGC
CACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTT
TTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAAT
TCAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTT
ACACGAATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGT
TGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCA
CAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACC
TTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAATGCATCTCAAAT
CCGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCAT
AAATAGCCACCACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTG
GCTGAGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAA
TTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGC
ATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAA
CACCACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTA
AGCCATATGAAGTTATCCCGTGCAGGTTCTTGACTTAGTTGGCCGCCTAA
GATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCAT
GCCGGCTTAATGCACAGGGCCTTTCACGTATTGCAACCATTTTCATGCTG
CACCACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTA
CGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGG
GTTATCCCGTGCAGGTCCTTGATTTAGTTGGCCGCCTAACGCATCTCAAA
ACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAAC
GTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAAACAAGAACCTGCACG
TACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTCGTAAGCCGCATA
CATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCAT
CATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCAT
TTATCCCCTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAAT
GCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTG
GGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAG
TGAAAATGGTTGCAATACGTGTAAGGACCTGTGCATTAAGCCGGCCATGA
ACGACTCATGGCCGGCTTAAGGCACAGGGCCTTACACGTATTGCAACCAT
ACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTCGTAAGCCGCATAT
GGCTTACGACTCATGGCCGGCTTAATGCACAGGGTCTTACACGTATTGCA
CGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAG
GTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCAGG
GATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAA
GGCGGCCAACTAAATCAAGAACCTGCAAGGGATAACTTCATATGGCTTCA
AGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCATATGGCTTC
CAGGGCCTTACACGTATTGCAACCATTTTCATGCGGGGTGGTGGCTATTT
AGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCC
TGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTCGTAAGCC
AGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAATGG
TGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCA
GCCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAATGTTTGCA
CACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTAT
TATTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAA
TAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCATATGGCTT
AGAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATT
GTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAA
AATAGCCACCACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGT
AGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCC
TTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGAGGCCAACTAAAT
CCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCG
CATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTA
CTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTC
TGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGA
AGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTTACGCATCTCAA
GCAACCATTTTCATGCAGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCC
GGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGG
CGCCTAACGCATCTCAAGTAGCCACCACCCAGCATGAAAATGGTTGCAAT
ATCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCC
AGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTG
GGGCCTTACACGTATTGCAACCATTTGCATGCTGGGTGGTGGCTATTTGA
CAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGC
GTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAA
CCACCACCCAGCATGAAAATGGTTGCAATACGTGTGAGGCCCTGTGCATT
GCAATACGTGTAAGGCCCTGTGTATTAAGCCGGCCATGAGTCGTAAGCCG
GATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCAT
GTTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAA
CACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGAGGCGTT
AGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCA
GAAGCCATATGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCT
CCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCC
GTTGCAATACGTGAAAGGCCCTGTGCATTAAGCCGGCCATGAGTCGTAAG
GCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGTACCTGCACGGGA
ACGTATTGCAACCATTTTCATGCTGGGTGGTGACTATTTGAGATGCGTTA
GAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTC
TTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGG
TGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGATGGTGGCT
GGTGGCTATTTGAGATGCTTTAGGCGGCCAACTAAATCAAGAACCTGCAC
GGCTTAATGCCCAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGT
GCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCAC
ATATGCGGCTTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGT
TAGCCACCACCCAGCATGAAGATGGTTGCAATACGTGTAAGGCCCTGTGC
CTTATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTC
CTCAAATAGCCACCACGCAGCATGAAAATGGTTGCAATACGTGTAAGGCC
AAATGGTAGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTC
TCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCA
GGGCCTTACACGTGTTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGA
AGGCCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTG
AAGCCATATGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTA
TATGCTGCTTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTA
TCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCA
TACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCACCCA
CTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATG
TGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGA
AATACGTCTAAGGCCCTGTGCATTAAGCCGGCCATGAGTCGTAAGCCGCA
GTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCGCCACCCAG
CGTCTTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGC
ATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCCAG
CTGGGTGGTGGCTACTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAAC
TGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACC
TGCACAGGGCCTTACACGTATTGCAACCATTTTCACGCTGGGTGGTGGCT
GGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGGCGTAA
GTTAGGCGGCCAACTAAATCAAGAACCGGCACGGGATAACTTCATATGGC
ATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTATGCG
TTAATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGT
ACACGTATTGCAACCATTTTCATGCTGGGTCGTGGCTATTTGAGATGCGT
ACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAAC
ACTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAA
GCTTAACGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTG
CCGTGCAGGTTCTTGATTTTGTTGGCCGCCTAACGCATCTCAAATAGCCA
TGAAGCCATATGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCC
AGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCATATGGCTTC
TGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCT
CCCGCGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCC
TATTGCAACCATTTTCAAGCTGGGTGGTGGCTATTTGAGATGCGTTAGGC
GCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCC
ATAGCCACCACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTG
GAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTC
TGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGA
GGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCAC
TCATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAAT
CATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTA
CTAACGCATCTCAAATAGCCACCACCCAGCATGAAAATGGTGGCAATACG
TTTGAGATGCGGTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAAC
GTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTCGTAAG
CGCATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAATACTTGTA
CACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGC
ATACGTGTAAGGCCCTGGGCATTAAGCCGGCCATGAGTCGTAAGCCGCAT
GCGGCTTACGACTCATGGCCGGCTTAACGCACAGGGCCTTACACGTATTG
ACGCATCTCAAATAGCCGCCACCCAGCATGAAAATGGTTGCAATACGTGT
AAATAGCCACCACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTG
TGCGGCTTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATT
ACCACGCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAA
AACCAGTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAA
GCTTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAA
TGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACC
AAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTC
CCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACT
GCCTTACACGTATTGCATCCATTTTCATGCTGGGTGGTGGCTATTTGAGA
CACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGC
ATTTAGTTGGCCGCCTAACGCATCTCAACTAGCCACCACCCAGCATGAAA
CACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGA
GGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGG
CACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTT
TGCACAGTGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCT
ATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTCATG
GCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCAC
CTGGGTGGTGGCGATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAAC
CTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTTGGTGG
GGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCATATGGCTTCA
TGGCAAATGCAGCCATGCCCAAATATATTTGGGCATGGCTGCATTTGCCA
CGCATCTCAAATAGTCACCACCCAGCATGAAAATGGTTGCAATACGTGTA
TGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACC
CTTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAAC
AACCATTTTCATGCTGGGTGGTAGCTATTTGAGATGCGTTAGGCGGCCAA
TGAAGCCATATGAAATTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCC
GCCTTACACGTATTGCAACCATTTGCATGCTGGGTGGTGGCTATTTGAGA
TGCGGCTTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATT
CCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAA
TAACGCATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAATACGT
GGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCGAGAACCTGCACGGG
ATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAATACGTGTAAGG
TTAATGCACAGGGCCTTACACGTCTTGCAACCATTTTCATGCTGGGTGGT
TTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACG
AGGGCCTTACACGTACTGCAACCATTTTCATGCTGGGTGGTGGCTATTTG
TTCATGCTGAGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATC
TGCGTTTGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCATAT
ACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGT
CCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCG
ATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAATACGTGTAAGG
GCAGCCATATGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCT
ACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTCGTAAGCCGCATAT
CATATGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGC
CCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGG
GGTTGCAATACGTGTAAAGCCCTGTGCATTAAGCCGGCCATGAGTCGTAA
CATGGCCGGCTTAATGCACAGGGCCTTACATGTATTGCAACCATTTTCAT
ACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTA
TATTGCAACCATTTTCATGCTGGTTGGTGGCTATTTGAGATGCGTTAGGC
CGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAG
GCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGA
AGGGCCTTACACGTATTCCAACCATTTTCATGCTGGGTGGTGGCTATTTG
ATATGAAGGTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCA
GTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGC
TTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTTTTGCAACC
TCTCAAATAGCCACCACCCAGCATGAAAATGGTTTCAATACGTGTAAGGC
CCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGG
GCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTCGTAAGCCG
CAGCATGAAAATGGTTGCAATACGTGTAATGCCCTGTGCATTAAGCCGGC
CAAGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTT
TGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGA
AGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCATATGCCTTC
TTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCGCAAAT
CCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCC
GAAAATGGTTGCACTACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAG
TTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCATATGGCT
CACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTT
TTAGTTGGCCGCCTAACGCATCTCAAATAGACACCACCCAGCATGAAAAT
TTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAAGTTCATATGGCT
GGATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCA
ATGTGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCA
ACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAAC
GCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGA
TCAAATAGCCACCACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCC
TGATAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGA
CCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGG
CCATATGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACG
GGGCCTTACACGTATTACAACCATTTTCATGCTGGGTGGTGGCTATTTGA
TTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAA
TATGCGGCTTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTA
GTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCAACCACCCAG
GCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGA
AATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGG
AGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAA
TCATGGCCGGCTTAATGCACATGGCCTTACACGTATTGCAACCATTTTCA
ATGCTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTCGT
GGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGT
ATGGCCGGCTTAATGCACAGGGCCTTACACGGATTGCAACCATTTTCATG
TGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGGCGTAAGCC
ATGCGGCTTACGACTCATGGCCGGCTAAATGCACAGGGCCTTACACGTAT
GTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCATAAAAATGGT
ATATGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACACA
TGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATACGTTAGGCGGC
TCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAATACGTGTAAGGC
CGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTGTCATGCTGGG
TCATGGCCGGCTTAATCCACAGGGCCTTACACGTATTGCAACCATTTTCA
TACACGTATTGCAACCATTTTCATGCTGGTTGGTGGCTATTTGAGATGCG
CAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCA
TCCACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCG
ATAGCCACCACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTG
CCGTGCAGGTTCTTGATTGAGTTGGCCGCCTAACGCATCTCAAATAGCCA
GCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGA
CAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTT
GCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAATA
CGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAAT
GCCGGCTTAATGCACAGGGCCTTACAGGTATTGCAACCATTTTCATGCTG
GCTTAATGCACAGGGCCTTACACGTATTGCAACCATCTTCATGCTGGGTG
GCCGCCTAACGCATCTCAAATAGCCACCTCCCAGCATGAAAATGGTTGCA
TGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAATGGTTG
CAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACC
ATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTCGTAAGCCGCAT
ATTGCAACCATTTTCATGCTGGGTGGTGGTTATTTGAGATGCGTTAGGCG
AGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCC
TTTGAGATGGGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAAC
GTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAATGGT
CATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAA
TGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTT
TGCAACCATTTTCATGCAGGGTGGTGGCTATTTGAGATGCGTTAGGCGGC
ATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGGCATGAGTCGT
GGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAG
CCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAAGAGCCA
CCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCG
CACCACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTA
GGCCGCCTAACGCATCTCAAATAGCCACCACCCAGAATGAAAATGGTTGC
CTTACACGTATTGCAACCTTTTTCATGCTGGGTGGTGGCTATTTGAGATG
AATACGTGTAAGGCCCTGTGCATTAAGCTGGCCATGAGTCGTAAGCCGCA
CATGGCCGGCTTAATGCACAGGGCCTTACACGGATTGCAACCATTTTCAT
ATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAA
ACATATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTA
ATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGC
CATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAATACGTGTAAG
GCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCC
CCACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAG
CGGCTTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGC
GGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAG
ATTTAGTTGGCCGTCTAACGCATCTCAAATAGCCACCACCCAGCATGAAA
CTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACG
CACCACCCAGCATGAAAATGGTTGCAATACCTGTAAGGCCCTGTGCATTA
ATATGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCA
AGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTG
TATCCCGTGCAGGTTATTGATTTAGTTGGCCGCCTAACGCATCTCAAATA
ACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGT
TGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGA
CACCCAGCATGAAAATGGTTGCAATACGTGTAAAGCCCTGTGCATTAAGC
TAGGCGGCGAACTAAATCAAGAACCTGCACGGGATAACTTCATATGGCTT
GCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTCGTAAGCCG
CCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAA
AGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAATGG
GGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGA
CGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCATATGG
AATGGTTGCAATACGTGTAAGGGCCTGTGCATTAAGCCGGCCATGAGTCG
ACTACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCAT
TGGCCGACTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGC
CCATTTTCATGCTGGGTGGTGGTTATTTGAGATGCGTTAGGCGGCCAACT
ATATGCGGCTTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACCCGT
CTTGATTTAGTTGGCCGCCTAACGCATCTCAAATTGCCACCACCCAGCAT
TCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAATACGTGTAAGGC
CTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGCGTGG
TGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTT
GAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTC
GCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTGGGCGGCC
CCTTACACGTATGGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGAT
TGGTTGCAATACGTGTAAGGCCCTGTACATTAAGCCGGCCATGAGTCGTA
CCATATGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACG
CATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAA
TAACGCATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAATACGT
AATACGTGTAAGGCTCTGTGCATTAAGCCGGCCATGAGTCGTAAGCCGCA
GATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCAT
ACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTAAGATGCGT
GCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCC
TATGCGGCTTACGACTCATGGCCGGCTTAATGCACAGGGCCTTAGACGTA
CTAACGCAACTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAATACG
TGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAATGGTTG
TTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAAC
AATGCACAGGGCCTTACACGTATTGCAACCATTTTCATACTGGGTGGTGG
TAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAATG
AGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCC
GCACAGGGCCTTACACGTATTGCAACCATGTTCATGCTGGGTGGTGGCTA
TACACGTATTGCAACCATTTGCATGCTGGGTGGTGGCTATTTGAGATGCG
GGGCCTTACACGTATTGTAACCATTTTCATGCTGGGTGGTGGCTATTTGA
CCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGG
CTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCC
GAAGCCATATGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCT
AATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTCG
CTTAATGCACAGGGCCTTACACGTATTGCGACCATTTTCATGCTGGGTGG
CTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAAC
TTGGCCGCCTAACGCATCTCAAAAAGCCACCACCCAGCATGAAAATGGTT
CAGGGCCTTACACGTATTGCAACCATTTTGATGCTGGGTGGTGGCTATTT
CTTAATGCACAGGGCCTTACACGTATTGCAACCATGTTCATGCTGGGTGG
AGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCA
TGGCTATTTGAGATGCGTTAGGCGGGCAACTAAATCAAGAACCTGCACGG
GTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGGACG
TGGCCGGCTTAATGCACAGGGCCGTACACGTATTGCAACCATTTTCATGC
TTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAA
TGATTTAGTTGGCCGCTTAACGCATCTCAAATAGCCACCACCCAGCATGA
GGGCAAATGCAGCCATGCCCAAATATATTTGGGCATGGCTGCATTTGCCA
GGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGT
GCGCATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAATACGTGT
ACAGGGCCTTACACGTATTGCAACCATTCTCATGCTGGGTGGTGGCTATT
CGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAG
GGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGG
ACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTCGTAAGCCGCATAT
ACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTCTT
TAGCCACCACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGC
GCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCAC
GAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTC
CGACTGATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATT
TACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCG
GCCATATGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAAC
GAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTC
GCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCAC
TATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCCAACGCATCTCAAATA
ATGAAAATGGTTGCAATACGTGTCAGGCCCTGTGCATTAAGCCGGCCATG
TGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTT
GACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTT
GCCATATGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAAC
GGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCA
CGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAAGGGTTGCAAT
CGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGG
CCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGG
CATGGCCGGCTTAATGCACAAGGCCTTACACGTATTGCAACCATTTTCAT
GTGCAGGTTCTTGATTTAGTTTGCCGCCTAACGCATCTCAAATAGCCACC
GCCACAACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCAT
ATACGGGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTCGTAAGCCGCAT
GCCACCACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCAT
CACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTAT
ATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAG
GAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTC
GCCGCCCAACGCATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCA
CCATTTTCATGCTGGGTGGTGGCTATTTCAGATGCGTTAGGCGGCCAACT
AGGCGGCCAACTAAAGCAAGAACCTGCACGGGATAACTTCATATGGCTTC
AGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAATGG
TTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAATTAAAT
TATGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCAT
AAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGT
ATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTCGTAAGCCGCAT
GGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTG
GGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCT
CTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGAT
CAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACC
GCATCTCAAATAGCCACCACCCAGCATGAAAATGATTGCAATACGTGTAA
GGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCATATGGCTTCA
ATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCATA
AACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAA
TATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAACTA
ACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGAGGTGGCTATT
CCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCA
GGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTCCACGGG
AGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCC
CAACACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTCGTAAGCCGC
TTGAGATGCGTTAGGCGGCCAACTAAATCAAGGACCTGCACGGGATAACT
CTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGAT
TGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGA
GACTCATGGCCGGCTTTATGCACAGGGCCTTACACGTATTGCAACCATTT
GCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCATATG
TATGCGGCTTACGACTCATGGCCGGCTTAATGAACAGGGCCTTACACGTA
AAATGGTTGCCATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTC
ACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAAC
TTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTCGTAAGC
GGTGGGTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCAC
CTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGACAACTAAATCAAGAAC
TTCTTGATTTAGTTGGCCGCCTAACGCATCTCAACTAGCCACCACCCAGC
GCAACCATTTTCATGCTGGGTAGTGGCTATTTGAGATGCGTTAGGCGGCC
ATGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATC
AGCGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTG
TGCGGCTTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTTTT
GGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCATATGGCTTAA
GGCCGCCTAACGCATCCCAAATAGCCACCACCCAGCATGAAAATGGTTGC
CCACCACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATT
ATGGCCGGCTTAATGCACAGGGCCTTACACGTATCGCAACCATTTTCATG
GAAAATGGTTGCAATACGTGTAAGGCCCTGTGAATTAAGCCGGCCATGAG
TACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCG
GGCCGGCTTAATGCACAGGGCCTTACACGAATTGCAACCATTTTCATGCT
AGCCATATGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGCCCGCCTAA
TGCACAGGGCCTTACACGGATTGCAACCATTTTCATGCTGGGTGGTGGCT
CACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTT
TCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCTACTAAATCA
TGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTCGTA
ACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCC
GCTTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAA
AATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGG
CGCATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAAGACGTGTA
GGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCA
ACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATT
GCCATATGAAGTTATCCCGTGCAGGTTCTTGATTTAGCTGGCCGCCTAAC
CATGCTGGTTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAA
AGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCA
TCAAATAGCCACCACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCC
ATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAA
TCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCATATG
CTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAAC
TGCTGGGTGGTGGCTATTTGAGATGTGTTAGGCGGCCAACTAAATCAAGA
ATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAG
GATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCAAGCATGAA
CCACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAG
CGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCAC
GTTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAA
CGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGG
TATGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCAT
CTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATG
TATGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCACCTAACGCAT
AGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCC
CCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTTAGCCGG
GCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCATGGGA
ACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTCGTAAGCCGCATAT
CTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGAT
ATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTCATG
CTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCC
GCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTGAATCAAGAA
GGCTTAATGCACAGGGCATTACACGTATTGCAACCATTTTCATGCTGGGT
GCTGGCTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAA
CACCACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTA
GTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTC
GGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGA
GCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCATATG
GGTGGCTATTTGAGATGCGTTAGGCGGCCCACTAAATCAAGAACCTGCAC
CACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTCGTAAGCCGCATA
TGCAATACGTGTAAGGACCTGTGCATTAAGCCGGCCATGAGTCGTAAGCC
CATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCAT
AATAGCCACCACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGT
CACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGT
ATCCCGTGCAGGATCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAG
TTAGGCGGCCAACTAGATCAAGAACCTGCACGGGATAACTTCATATGGCT
GAGATGCGTTAGGCGGCTAACTAAATCAAGAACCTGCACGGGATAACTTC
ATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAA
GGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCT
TGCACAGGGCCTTACACGTATTGCAACCATTTTCTTGCTGGGTGGTGGCT
AAGTTGTCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCA
CGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAACAGCCAC
CCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGG
TGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCGATGAGTCGTA
AGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCATATGGCTTC
TGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGC
ATAGCCACCACCCAGGATGAAAATGGTTGCAATACGTGTAAGGCCCTGTG
CCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAATAC
ATTTGAGATGCGTTACGCGGCCAACTAAATCAAGAACCTGCACGGGATAA
ATGCGGCTTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTAT
CCATATGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACG
GGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAG
GGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCATATGGCTTCA
CCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAATGGTAGCAATAC
TCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAAGACGTGTAAGGC
GCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTTAGCCGGCCA
GGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAG
CCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGG
ATGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTG
GCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTTGGTGGTGGCTA
TTTTCATGCTGGGTGGTTGCTATTTGAGATGCGTTAGGCGGCCAACTAAA
AGGCGGCCAACAAAATCAAGAACCTGCACGGGATAACTTCATATGGCTTC
CGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATT
CTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATG
ACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCC
GGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAG
ATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGCCCAACTAAATCAAG
TCATGCTCGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCA
GCATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAATACGTGTAA
ATGCTGGGAGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAG
CATATGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGC
TTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACT
TTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACC
ATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTCATG
GGCTTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGTA
GATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCAT
TTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAAT
GGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCA
TTCATGCTGGGTGGTGGCTATTTGAGATTCGTTAGGCGGCCAACTAAATC
ATACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGC
CACCACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTA
TACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCA
TGTCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGC
TGGTGGCTATTTGAGATGCGTTAGGCGGCAAACTAAATCAAGAACCTGCA
AACGCATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAATACGTG
AAGTTATCCCGTGCAGGTTCTTCATTTAGTTGGCCGCCTAACGCATCTCA
TATTTGAGATGCGTTAGGCGGCCATCTAAATCAAGAACCTGCACGGGATA
TCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCA
TGCAGGTTCTTGATTTAGTGGGCCGCCTAACGCATCTCAAATAGCCACCA
TGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAA
TCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGC
GCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCATATG
CACAGGACCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTAT
ATGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATC
CCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGG
AGCCACCACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCA
TAACGCATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAATACGT
TTAGGCGGCCAACTAAATCTAGAACCTGCACGGGATAACTTCATATGGCT
GCCTAACGCCTCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAATA
ACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTT
GAAACTGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAG
GCCATATGCAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAAC
AAGCCATATGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTA
GGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGT
GGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCT
CTTAATGCCCAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGG
GTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATAAAGAACCTGCACG
AGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTG
ATGCACAGGGCCTTAAACGTATTGCAACCATTTTCATGCTGGGTGGTGGC
CGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAG
GCACAGGGCCTTACACGTATTGCAACCATTTTCATGCAGGGTGGTGGCTA
GGTGGCTATTCGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCAC
CATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTA
TAGCCACCACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCACTGTGC
AGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAA
ATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAA
ATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGC
TGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTT
TGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGGCACCA
AGCCACTACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCA
CAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGCC
TTACGACTCATGGCCGGCTTCATGCACAGGGCCTTACACGTATTGCAACC
CTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCC
TAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAATG
ACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATT
TTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCCCCACCCAGC
GACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTT
CCGCCTAACGCATTTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAA
TGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTCGTAAGCC
AGGGCCTTACACGTATTGCAACCATTTACATGCTGGGTGGTGGCTATTTG
ATATGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCA
TTAATGCACAGGGCCTTACACGTATTGCGACCATTTTCATGCTGGGTGGT
TACGACTCATGGCCGGCTTAATGCACAGGGCCTTGCACGTATTGCAACCA
TTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAAC
GGTTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAA
ATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAATACGTGTAAGG
TATGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGGAT
TTGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGC
GATTTAGTTTGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAA
GGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATACCCACCACCCA
GTTGCAAAACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTCGTAAG
AACCATTTTCATTCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAA
TGCAGGTTCTTGATTGAGTTGGCCGCCTAACGCATCTCAAATAGCCACCA
TTTAGTTGGCCGCCTTACGCATCTCAAATAGCCACCACCCAGCATGAAAA
GGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCT
GCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAATA
GGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCT
CGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCAC
TAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCATATGGCTT
CAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCA
TCAAATAGCCACCTCCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCC
CGACTCATGGCGGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATT
CCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACT
TGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAATGGTTG
CTTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAAC
CCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGTCA
ACCACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAA
CGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCATATGG
CCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAA
GAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTC
CTTGATTTAGTTGGCCTCCTAACGCATCTCAAATAGCCACCACCCAGCAT
CTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATG
GTATTGCAACCATTTTCTTGCTGGGTGGTGGCTATTTGAGATGCGTTAGG
AAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCACGAGT
TGAAAATGGTTGCAATACGTGTAAGGCCCTGTGTATTAAGCCGGCCATGA
TCAAATAGCCACCACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCC
CCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGAT
GAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTC
CAGGTTCTTGATTTAGTTGGTCGCCTAACGCATCTCAAATAGCCACCACC
AACCATTTTCATGCTGGGTGGTGGCTACTTGAGATGCGTTAGGCGGCCAA
GCTGGGTGGTGGCTATGTGAGATGCGTTAGGCGGCCAACTAAATCAAGAA
AGCCACCACCCAGCATGAAAATAGTTGCAATACGTGTAAGGCCCTGTGCA
CCTTACACGTATTGCAGCCATTTTCATGCTGGGTGGTGGCTATTTGAGAT
GCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTA
TTACGACTGATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACC
TCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCACAAATAGC
GCCACCACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCAT
AGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCA
ACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTT
GGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGG
CATGGCCGGCTTAATGTACAGGGCCTTACACGTATTGCAACCATTTTCAT
CATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAA
GCGGCTTACGACTCATGGCCGGTTTAATGCACAGGGCCTTACACGTATTG
TCGGCTTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTG
TGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGA
CGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCATATGG
TTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGC
CATATGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGC
CACAGGGCCTTACACGTATTGCACCCATTTTCATGCTGGGTGGTGGCTAT
TTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACC
CCATATGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACG
CATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTCAT
CTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGAT
CGGCTTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGC
ACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGT
CCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAATAC
CAAATATCCACCACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCT
TGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCT
ATTTGAGATGCGTTAGGCGGCTAACTAAATCAAGAACCTGCACGGGATAA
CTTAATGCACAGGGCCTTACATGTATTGCAACCATTTTCATGCTGGGTGG
CCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCA
CATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAATACGTGTAAG
GGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCT
ACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCAATTTGAGATGCGT
GGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCT
GCCATATGAAGTTATCCCGTGCAGGTACTTGATTTAGTTGGCCGCCTAAC
CCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGAT
GTTGCAATACGTGTAAGGCCCTGTGCAGTAAGCCGGCCATGAGTCGTAAG
AATGGTTGCAATACGTGTAAGGCCCTGTGCATTGAGCCGGCCATGAGTCG
GTATTGCAACCATTTTCATGCTGGTTGGTGGCTATTTGAGATGCGTTAGG
TAATGCACATGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTG
GTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGC
GGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGT
TTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAAC
AATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATA
GTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCATG
TGCAACCATTTTCATGCTTGGTGGTGGCTATTTGAGATGCGTTAGGCGGC
GCCACTACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCAT
CTTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAAC
CCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGG
TAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAAGG
CAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCA
CTTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAAC
ATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAA
TACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCA
GATTTAGTTGGCCGCCTAACGCATCTAAAATAGCCACCACCCAGCATGAA
CCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAA
CTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCGACCATTTTC
TTGGCCGCCTAACGCATCTCAAATAGCCCCCACCCAGCATGAAAATGGTT
GCTTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAA
TAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAATG
CCACCACCTAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATT
GGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCA
CCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCGACT
ATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAG
CTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATG
GGCGGCCAACTAAATCAAGAAGCTGCACGGGATAACTTCATATGGCTTCA
TTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGTATGAAAA
ACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTT
GCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTG
ATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGGGATGCGTTAGGCG
CCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATGTGAGAT
ATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCGCCCAGCATGAAA
TCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAATACGTGTAAGGC
ATTTGAGATGCGTTAGGCGGCCAACTAAATGAAGAACCTGCACGGGATAA
CATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAA
ATTTAGTTGGCCGCCTAACGCATATCAAATAGCCACCACCCAGCATGAAA
TTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAATGGTT
TCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCA
ACGACTCATGGCCGGCTTAATGCACAGGGCCTTAAACGTATTGCAACCAT
AGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCC
GCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAA
CGGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAAC
GACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTT
TGCGGCATACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATT
CTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCAT
TACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCA
TATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATA
TGAAAATGTTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGA
GCCATATGAAGTTATCCCGTCCAGGTTCTTGATTTAGTTGGCCGCCTAAC
TCCCGTGCAGGTCCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGC
GGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGT
ATGTCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTCATG
TACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTCGTGAGCCGCATA
TGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGA
TGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCA
GGCCGGCTTAATGCACAGGGCCTTACACGGATTGCAACCATTTTCATGCT
GCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCA
TGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTCGTA
AAGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTCGTAAGCCGCATAT
AACCATTTTCATGCTGGGTGGTGGCTATGTGAGATGCGTTAGGCGGCCAA
AAATAGCCACCACCCAGCCTGAAAATGGTTGCAATACGTGTAAGGCCCTG
AAAGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGG
TAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCATATGGCTT
GGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTG
TACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTCGTAAGCCGCATA
GCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAATA
CTTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAAC
CTATATGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGAT
ACTCATGGCCAGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTT
GGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAAGCTGCAC
GCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAATAGTTGCAATA
AACGCATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAATACGTG
ATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTCGTAAGCCGCAT
CATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAA
TAATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTG
GACTCATGGTCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTT
CAATACGTGTAAGGCCCTGTGCATTAAGCCGGTCATGAGTCGTAAGCCGC
TTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTCGTAAGC
GGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGT
TTTACATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAA
TTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCATG
TTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCATG
CGACTCATGCCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATT
GAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAG
ACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTT
ACGACTCATGGCCGGCTTAATGCACAGGGCCTCACACGTATTGCAACCAT
ATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACTCATCTCAAATAG
GTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGC
GGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCAC
TGCGTTAGGCGGACAACTAAATCAAGAACCTGCACGGGATAACTTCATAT
CATATGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGC
GAAGCCATATGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCT
TACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGGTGCG
ACCACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAA
CAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCA
GCCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCA
CACCACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTA
ATATGCGGCTTACGACTCATGGCCGGCTTGATGCACAGGGCCTTACACGT
GCATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAATACGTGTAA
TGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGA
AAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTC
ATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCATA
TTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAA
ACCACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAA
GCGGCTTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTG
CGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAG
CGACTCATGGTCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATT
ATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCATA
CTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCAT
AAATAGCCACCACCCAGCATGAAAATGGTTGCCATACGTGTAAGGCCCTG
GCTTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAA
GTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAG
CAGCTTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGC
ATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATG
TATTTGACATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATA
TGGCTATTTGAGATGCGTTAAGCGGCCAACTAAATCAAGAACCTGCACGG
TTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTCGTAAGC
GCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCC
CGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGAATCTCAAATAGCCAC
TCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCA
TGAAGCTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCT
AAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGT
GCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCATATG
TGCGGCTTACGAGTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATT
GCCGGCTTAATGCACTGGGCCTTACACGTATTGCAACCATTTTCATGCTG
ATGGCCGGCTTAATGCATAGGGCCTTACACGTATTGCAACCATTTTCATG
TATCCCGTGCAGGTTCTTGATTTAGTTCGCCGCCTAACGCATCTCAAATA
ACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTT
GTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAA
CGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGG
AAGCCATATGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTA
ATGAGGCTTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTAT
CTTACGACTCATGGACGGCTTAATGCACAGGGCCTTACACGTATTGCAAC
GATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCAT
TGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAGAATGGTTG
CCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAATAC
GGTTCTTGATTTAGTTAGCCGCCTAACGCATCTCAAATAGCCACCACCCA
TCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCA
ATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAATACTTGTAAGG
CACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTAT
GGCTTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCA
TCATGCTGGGTGGTGGCTATTTGAGCTGCGTTAGGCGGCCAACTAAATCA
AAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCA
CATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTA
TTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTCGTAAGC
CACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTT
CAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCA
TTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGC
GTGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCATATG
TTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAACT
GCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCC
GCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCAC
TATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCATGGGATA
ATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATG
GTTAGGCGGCCAACTAAATCAAGAACCTGCTCGGGATAACTTCATATGGC
TGGTGGCTATTTGAGATGTGTTAGGCGGCCAACTAAATCAAGAACCTGCA
GATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAA
GGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCA
GTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAATGGT
GCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGGTG
TTAGGCGGCCAACTAAATCCAGAACCTGCACGGGATAACTTCATATGGCT
TGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATTGCCACCA
AGCATGAAAATGGTTGCAATACGTGTAATGCCCTGTGCATTAAGCCGGCC
CAGGGCCTTACACGTATTGCTACCATTTTCATGCTGGGTGGTGGCTATTT
GCTATTTGAAATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGA
ACCATTTTCATGCGGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAAC
ATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGC
AGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCA
GCCTAACGCATCTCAAATAGCCACCGCCCAGCATGAAAATGGTTGCAATA
TCATGGCCGGCTTAATGCACAGGGCCTTACACGAATTGCAACCATTTTCA
ACCACCCAGCATGAAAATGGTTGCAATTCGTGTAAGGCCCTGTGCATTAA
ATAGCCACCACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTG
CCATATGAAGTTATCCCGTGGAGGTTCTTGATTTAGTTGGCCGCCTAACG
TTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATC
GCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCA
TTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGTGTCGTAAGC
TTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTGCATATGGCT
ATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGATGGC
ACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTT
TTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAAT
TAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAATG
ATGCTGGGTAGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAG
TGCGTTAGGCGGCCAACTAAATCAAGATCCTGCACGGGATAACTTCATAT
AATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGG
TGCGGCTTACGACTCATAGCCGGCTTAATGCACAGGGCCTTACACGTATT
ATGCGGCTTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTAT
TTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGG
TAGCCACCACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGC
TGAAAAGGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGA
TACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCC
GCATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAATACGTGTAA
TACAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCA
CGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAG
TTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAA
CCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAATAC
GGGCAAATGCAGCCATGCCCAAATATATTTGGGCATGGCTGCATTTGCCA
AAGCCATATGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTA
GCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCAA
ACGTATTGCAACCATTTTCATGCTGGGTGGTTGCTATTTGAGATGCGTTA
GAAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCAC
GTATTGCAACCATTTTCATGCTGGCTGGTGGCTATTTGAGATGCGTTAGG
CAGCATGAAAATGGTTGCAATACGTATAAGGCCCTGTGCATTAAGCCGGC
CCGTGCAGGTTCTTGATCTAGTTGGCCGCCTAACGCATCTCAAATAGCCA
ATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCG
CCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAA
TGGCCGGCTTAATGCACAGGGCCTTACGCGTATTGCAACCATTTTCATGC
ACGTATTGCAACCATTTTCATGCTGGGTGGTAGCTATTTGAGATGCGTTA
AAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCA
TAACGCATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAATACGT
TGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCT
CATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAA
ATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAA
TGATTTAGTTGGTCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGA
CAGCATGAACATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGC
TTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTCGTAAGC
CTCATGGCCGGCTTAATGCACAGGGCCTTACACGTGTTGCAACCATTTTC
CCATATGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACG
TTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAAT
GCCTAACGCATCTCAAATAGCCACCACCCAGCATGGAAATGGTTGCAATA
GCATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAATACGTGTAA
GATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACACAGCATGAA
TTAATGCTCAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGT
GGTTGCAATACGTGTAAGGCCCTGTCCATTAAGCCGGCCATGAGTCGTAA
GCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGA
CCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACT
TTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGC
CGTCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAAT
TTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGG
TTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGC
CCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGAT
GGCTTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCA
TATGCGGGTTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTA
GCGGCTTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTG
GAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCAGCCATGAG
CCACCACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTACATT
CGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAAT
GCCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCA
GCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTCGTAAGCCG
CATGGCCGGCTTAATGCACAGGGCCATACACGTATTGCAACCATTTTCAT
AGCCATATGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAA
TTAATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGT
ATGCGACTTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTAT
CAATACGTGTAAGGCCCTGTGCATTAAGCCGGCTATGAGTCGTAAGCCGC
GCCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCA
CGCATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAATTCGTGTA
CACCCAGCATGAAAATGGTTGCAATACGTGTAAGGTCCTGTGCATTAAGC
ATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCATA
AATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTCG
ATGGGTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTCGT
TGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGC
TCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCA
ATATGCGGCTTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGT
TTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGC
TGAAGTTATCCCGTGCAGGTTCGTGATTTAGTTGGCCGCCTAACGCATCT
ACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCCAC
CCCAGCACGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCG
GCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTCGTAAGCCG
CTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAAC
AGCCACCACCTAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCA
GATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCAT
GGTGGCTATTTGAGATGCGTTAGGCGGCCAAGTAAATCAAGAACCTGCAC
GGCTTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCA
ATATGCGGCTTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGT
GCGGCTTACGACTCATGGCCGGCTTAATGCATAGGGCCTTACACGTATTG
TTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGC
TGCGGCTTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATT
TGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGG
CACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTT
GAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTC
AGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAA
CTTAATGCACAGGGCCTTACCCGTATTGCAACCATTTTCATGCTGGGTGG
AACCATTTTCATGCTGTGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAA
ATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCTCCCAGCATGAAA
GCAATACGCGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTCGTAAGCCG
ATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCATA
TAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAATG
#!/usr/bin/python
import itertools
def revTransDNA(seq, lowerCaseReturn=False):
    """Return the reverse complement of a DNA sequence.

    The sequence is read back to front and every base is swapped for its
    complement (A<->T, C<->G, N stays N). Input case is ignored.

    Args:
        seq: iterable of single-character bases; upper or lower case.
        lowerCaseReturn: when true the result is lower case, otherwise it
            is upper case.

    Returns:
        The reverse complement as a string.

    Raises:
        KeyError: if ``seq`` contains a character other than A, C, G, T, N
            (in either case).
    """
    bp = {'A': 'T', 'C': 'G', 'G': 'C', 'T': 'A', 'N': 'N'}
    seqTemp = "".join(bp[x.upper()] for x in reversed(seq))
    if lowerCaseReturn:
        return seqTemp.lower()
    return seqTemp
class Dna:
''' Object representing a FASTA record.
seq,name,sequence,and header are fields '''
def __init__(self, header, sequence):
self.head = header
self.seq = sequence
self.length = len(sequence)
self.revTrans = revTransDNA(sequence)
self.pair = False # set to True if there is a seq that matches
self.oneErrorSeq = ""
self.reported = False # True if printed out
self.appear = 1 #number of times (s.seq == other.seq) for s position only
self.hammOneCount = 0 # number of seqs with hamming distance == 1
def __str__(self, separator=''):
return ">{0}\n{1}".format(self.head, separator.join(self.seq))
def __len__(self):
return len(''.join(self.seq))
def completeMatch(self,other):
if (self.seq == other.seq):
return True
elif (self.seq == other.revTrans):
return True
else:
return False
def oneErrorMatch(self,other):
""" returns true if self.seq and other.(seq or revTrans) have a hamming distance of 1. Sets self.oneErrorSeq to other's matching sequence in that case as well"""
if (self.reported == True):
return False
forwardError = 0
if (self.length != other.length):
return False
for s,t in zip(self.seq,other.seq):
if (s == t):
continue
else:
forwardError += 1
if (forwardError == 1):
self.oneErrorSeq = other.seq
return True
else:
reverseError = 0
for s,t in zip(self.seq,other.revTrans):
if (s == t):
continue
else:
reverseError += 1
if (reverseError == 1):
self.oneErrorSeq = other.revTrans
return True
return False
@property
def name(self, separator=''):
return self.head
@property
def sequence(self, separator=''):
return separator.join(self.seq)
def setPairFound(self,other):
""" sets self and other pair instance variables to true if the sequences match, counts the number of sequences a given seq is the same as """
if (self.completeMatch(other) and self.name != other.name):
self.pair = True
other.pair = True
self.appear += 1
def reportOneErrorMatch(self):
""" prints the pair of seqs, old->new"""
if (self.reported == False):
self.reported = True
print("{0}->{1}".format(self.seq, self.oneErrorSeq))
def setErrorPairFound(self,other):
""" increments hammOneCount(hamming count of one counter variable) if self.seq and (other.seq or other.revTrans) have a hamming distance of 1"""
if (self.oneErrorMatch(other)):
self.hammOneCount += 1
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment