Created
November 18, 2012 08:37
-
-
Save adamwespiser/4104276 to your computer and use it in GitHub Desktop.
Solution to rosalind's "corr" problem
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
| Solution to rosalind's "CORR" problem. | |
| http://rosalind.info/problems/corr/ | |
| The problem is: | |
| Given a collection of reads (all the same length), each read is either: | |
| 1) Correct, meaning it is identical to another read or to another read's reverse complement, or | |
| 2) Incorrect due to a point mutation, meaning it differs from a correct read by exactly one base (Hamming distance = 1). | |
| report incorrect reads and their correct counterparts. | |
| There is a strong assumption that a read must be either correct or incorrect, and that all incorrect reads map to at least one correct read. |
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
| import string | |
| import itertools | |
| from optparse import OptionParser | |
| import corrLib | |
def readInDnaSequence(fileName):
    """Read DNA reads from a text file into ``corrLib.Dna`` objects.

    Problem-specific loader: the file is expected to hold one read per
    line with no annotation (only the characters A, T, C and G).

    Args:
        fileName: Path of the input file.

    Returns:
        A list with one ``corrLib.Dna(index, sequence)`` per input line,
        where ``index`` is the zero-based line number and ``sequence`` is
        the line with surrounding whitespace stripped.
    """
    # The context manager closes the handle even if constructing a Dna
    # object raises; previously the file was never closed.
    with open(fileName, 'r') as handle:
        return [corrLib.Dna(index, line.strip())
                for index, line in enumerate(handle)]
def main():
    """Report each erroneous read together with its corrected counterpart.

    Reads the input file named by the ``-f``/``--file`` option, splits the
    reads into those flagged as having a pair and those that are not, and
    for every unpaired read reports the first paired read that
    ``oneErrorMatch`` accepts.

    Exits with a usage error if no input file is given.
    """
    parser = OptionParser()
    parser.add_option("-f", "--file")
    (option, args) = parser.parse_args()
    if option.file is None:
        # Fail with a readable usage message rather than passing None to open().
        parser.error("an input file is required (use -f/--file)")

    seqs = readInDnaSequence(option.file)

    # O(n^2): compare every read against every read so that each Dna object
    # can record whether it has a full match.
    # NOTE(review): setPairFound is defined in corrLib; presumably it sets
    # the ``pair`` attribute read below -- confirm.
    for s, t in itertools.product(seqs, repeat=2):
        s.setPairFound(t)

    # Split the reads into matching and non-matching lists. These must be
    # real lists: seqsWithMatch is re-iterated once per unmatched read, and
    # a Python 3 ``filter`` iterator would be exhausted after the first pass.
    # The explicit comparisons are kept so that any non-boolean ``pair``
    # value is classified exactly as before.
    seqsWithMatch = [s for s in seqs if s.pair == True]
    seqsNoMatch = [s for s in seqs if s.pair == False]

    # For each read without a match, find the first correct read it matches
    # with one error and report the pair.
    for s in seqsNoMatch:
        for t in seqsWithMatch:
            if s.oneErrorMatch(t):
                s.reportOneErrorMatch()
                break
# Run the command-line entry point only when executed as a script,
# not when this module is imported.
if __name__ == "__main__":
    main()
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
| AAATAGCCCCCACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTG | |
| TGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCT | |
| TACGTTTAAGGCCCTGTGCATTAAGCCGGCCATGAGTCGTAAGCCGCATA | |
| TATGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCAT | |
| ATATGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCA | |
| CAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCA | |
| TTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCATG | |
| CGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAG | |
| ACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATT | |
| CGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGG | |
| AAGCCATATGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTA | |
| TTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTACACGGGATAACT | |
| GCGGCTTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTC | |
| CGTTAGGCGGCCAACTAAATCAAGAACGTGCACGGGATAACTTCATATGG | |
| TCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAATACGAGTAAGGC | |
| TGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTCGTAAGCC | |
| AAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCA | |
| AATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGG | |
| ATTGCAACCATTTTCATGCTGGGTGGTGGCTATATGAGATGCGTTAGGCG | |
| AAATAGCCACCACCCAGCATTAAAATGGTTGCAATACGTGTAAGGCCCTG | |
| ACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCAT | |
| GGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTG | |
| CTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATG | |
| TGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCATAT | |
| GCCATATGAAGTTATCCCGTGCAGGTTCTTGATTTATTTGGCCGCCTAAC | |
| GACATATGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAAC | |
| CACCACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTA | |
| GTATTGCAACCATTTTCATGCTGGGTGGTGGCTATATGAGATGCGTTAGG | |
| GGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGACATGAGTCGTAA | |
| TCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGC | |
| CCCGTGCAGGTTCTTGATTTAGTTGGCCGGCTAACGCATCTCAAATAGCC | |
| TAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCATATGGCTT | |
| TTAGGCGGCCAACTAAATCAAGAACCTGCAGGGGATAACTTCATATGGCT | |
| ACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCAT | |
| GCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAATGGGTGCAATA | |
| TATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATA | |
| GCTGGGTGGTGGCTATTTGAGATGCGTTAGGAGGCCAACTAAATCAAGAA | |
| GCAAAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTA | |
| TTGAGATGCGTTAGGCGGCCAACTAAATCCAGAACCTGCACGGGATAACT | |
| GGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCT | |
| CCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACT | |
| TTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCCGCATGAAAA | |
| GGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCATATGGCTTCA | |
| CAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACC | |
| GGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTACAC | |
| GTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGC | |
| CACCCAGCAGGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGC | |
| CTATTTGAGATGCGTTAGGCGGCCAACTAAATTAAGAACCTGCACGGGAT | |
| CGAGTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATT | |
| ACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAAC | |
| GGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCATATGGCTTCA | |
| GGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTG | |
| CGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAG | |
| GCATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGG | |
| TGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGC | |
| TTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAAC | |
| CGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCC | |
| ATGAAAATGGTTGCAATACGTGTAAGGCCCGGTGCATTAAGCCGGCCATG | |
| GACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTT | |
| ACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATT | |
| GATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCAT | |
| ATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAG | |
| GGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAAGTAAATCAAGAACCTG | |
| CTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATG | |
| ACGTATTGCATCCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTA | |
| GATGCGTTAGGAGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCAT | |
| ATAGCCACCACCCAGCATGACAATGGTTGCAATACGTGTAAGGCCCTGTG | |
| ACGCATCTCAAATAGCCACCACCCAGCATGAAAATGGATGCAATACGTGT | |
| TTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAAT | |
| CTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGC | |
| CACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTT | |
| TTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAAT | |
| TCAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTT | |
| ACACGAATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGT | |
| TGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCA | |
| CAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACC | |
| TTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAATGCATCTCAAAT | |
| CCGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCAT | |
| AAATAGCCACCACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTG | |
| GCTGAGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAA | |
| TTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGC | |
| ATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAA | |
| CACCACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTA | |
| AGCCATATGAAGTTATCCCGTGCAGGTTCTTGACTTAGTTGGCCGCCTAA | |
| GATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCAT | |
| GCCGGCTTAATGCACAGGGCCTTTCACGTATTGCAACCATTTTCATGCTG | |
| CACCACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTA | |
| CGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGG | |
| GTTATCCCGTGCAGGTCCTTGATTTAGTTGGCCGCCTAACGCATCTCAAA | |
| ACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAAC | |
| GTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAAACAAGAACCTGCACG | |
| TACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTCGTAAGCCGCATA | |
| CATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCAT | |
| CATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCAT | |
| TTATCCCCTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAAT | |
| GCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTG | |
| GGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAG | |
| TGAAAATGGTTGCAATACGTGTAAGGACCTGTGCATTAAGCCGGCCATGA | |
| ACGACTCATGGCCGGCTTAAGGCACAGGGCCTTACACGTATTGCAACCAT | |
| ACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTCGTAAGCCGCATAT | |
| GGCTTACGACTCATGGCCGGCTTAATGCACAGGGTCTTACACGTATTGCA | |
| CGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAG | |
| GTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCAGG | |
| GATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAA | |
| GGCGGCCAACTAAATCAAGAACCTGCAAGGGATAACTTCATATGGCTTCA | |
| AGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCATATGGCTTC | |
| CAGGGCCTTACACGTATTGCAACCATTTTCATGCGGGGTGGTGGCTATTT | |
| AGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCC | |
| TGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTCGTAAGCC | |
| AGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAATGG | |
| TGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCA | |
| GCCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAATGTTTGCA | |
| CACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTAT | |
| TATTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAA | |
| TAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCATATGGCTT | |
| AGAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATT | |
| GTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAA | |
| AATAGCCACCACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGT | |
| AGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCC | |
| TTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGAGGCCAACTAAAT | |
| CCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCG | |
| CATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTA | |
| CTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTC | |
| TGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGA | |
| AGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTTACGCATCTCAA | |
| GCAACCATTTTCATGCAGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCC | |
| GGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGG | |
| CGCCTAACGCATCTCAAGTAGCCACCACCCAGCATGAAAATGGTTGCAAT | |
| ATCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCC | |
| AGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTG | |
| GGGCCTTACACGTATTGCAACCATTTGCATGCTGGGTGGTGGCTATTTGA | |
| CAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGC | |
| GTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAA | |
| CCACCACCCAGCATGAAAATGGTTGCAATACGTGTGAGGCCCTGTGCATT | |
| GCAATACGTGTAAGGCCCTGTGTATTAAGCCGGCCATGAGTCGTAAGCCG | |
| GATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCAT | |
| GTTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAA | |
| CACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGAGGCGTT | |
| AGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCA | |
| GAAGCCATATGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCT | |
| CCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCC | |
| GTTGCAATACGTGAAAGGCCCTGTGCATTAAGCCGGCCATGAGTCGTAAG | |
| GCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGTACCTGCACGGGA | |
| ACGTATTGCAACCATTTTCATGCTGGGTGGTGACTATTTGAGATGCGTTA | |
| GAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTC | |
| TTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGG | |
| TGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGATGGTGGCT | |
| GGTGGCTATTTGAGATGCTTTAGGCGGCCAACTAAATCAAGAACCTGCAC | |
| GGCTTAATGCCCAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGT | |
| GCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCAC | |
| ATATGCGGCTTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGT | |
| TAGCCACCACCCAGCATGAAGATGGTTGCAATACGTGTAAGGCCCTGTGC | |
| CTTATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTC | |
| CTCAAATAGCCACCACGCAGCATGAAAATGGTTGCAATACGTGTAAGGCC | |
| AAATGGTAGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTC | |
| TCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCA | |
| GGGCCTTACACGTGTTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGA | |
| AGGCCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTG | |
| AAGCCATATGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTA | |
| TATGCTGCTTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTA | |
| TCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCA | |
| TACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCACCCA | |
| CTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATG | |
| TGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGA | |
| AATACGTCTAAGGCCCTGTGCATTAAGCCGGCCATGAGTCGTAAGCCGCA | |
| GTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCGCCACCCAG | |
| CGTCTTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGC | |
| ATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCCAG | |
| CTGGGTGGTGGCTACTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAAC | |
| TGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACC | |
| TGCACAGGGCCTTACACGTATTGCAACCATTTTCACGCTGGGTGGTGGCT | |
| GGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGGCGTAA | |
| GTTAGGCGGCCAACTAAATCAAGAACCGGCACGGGATAACTTCATATGGC | |
| ATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTATGCG | |
| TTAATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGT | |
| ACACGTATTGCAACCATTTTCATGCTGGGTCGTGGCTATTTGAGATGCGT | |
| ACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAAC | |
| ACTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAA | |
| GCTTAACGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTG | |
| CCGTGCAGGTTCTTGATTTTGTTGGCCGCCTAACGCATCTCAAATAGCCA | |
| TGAAGCCATATGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCC | |
| AGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCATATGGCTTC | |
| TGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCT | |
| CCCGCGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCC | |
| TATTGCAACCATTTTCAAGCTGGGTGGTGGCTATTTGAGATGCGTTAGGC | |
| GCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCC | |
| ATAGCCACCACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTG | |
| GAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTC | |
| TGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGA | |
| GGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCAC | |
| TCATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAAT | |
| CATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTA | |
| CTAACGCATCTCAAATAGCCACCACCCAGCATGAAAATGGTGGCAATACG | |
| TTTGAGATGCGGTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAAC | |
| GTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTCGTAAG | |
| CGCATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAATACTTGTA | |
| CACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGC | |
| ATACGTGTAAGGCCCTGGGCATTAAGCCGGCCATGAGTCGTAAGCCGCAT | |
| GCGGCTTACGACTCATGGCCGGCTTAACGCACAGGGCCTTACACGTATTG | |
| ACGCATCTCAAATAGCCGCCACCCAGCATGAAAATGGTTGCAATACGTGT | |
| AAATAGCCACCACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTG | |
| TGCGGCTTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATT | |
| ACCACGCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAA | |
| AACCAGTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAA | |
| GCTTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAA | |
| TGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACC | |
| AAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTC | |
| CCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACT | |
| GCCTTACACGTATTGCATCCATTTTCATGCTGGGTGGTGGCTATTTGAGA | |
| CACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGC | |
| ATTTAGTTGGCCGCCTAACGCATCTCAACTAGCCACCACCCAGCATGAAA | |
| CACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGA | |
| GGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGG | |
| CACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTT | |
| TGCACAGTGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCT | |
| ATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTCATG | |
| GCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCAC | |
| CTGGGTGGTGGCGATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAAC | |
| CTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTTGGTGG | |
| GGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCATATGGCTTCA | |
| TGGCAAATGCAGCCATGCCCAAATATATTTGGGCATGGCTGCATTTGCCA | |
| CGCATCTCAAATAGTCACCACCCAGCATGAAAATGGTTGCAATACGTGTA | |
| TGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACC | |
| CTTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAAC | |
| AACCATTTTCATGCTGGGTGGTAGCTATTTGAGATGCGTTAGGCGGCCAA | |
| TGAAGCCATATGAAATTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCC | |
| GCCTTACACGTATTGCAACCATTTGCATGCTGGGTGGTGGCTATTTGAGA | |
| TGCGGCTTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATT | |
| CCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAA | |
| TAACGCATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAATACGT | |
| GGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCGAGAACCTGCACGGG | |
| ATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAATACGTGTAAGG | |
| TTAATGCACAGGGCCTTACACGTCTTGCAACCATTTTCATGCTGGGTGGT | |
| TTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACG | |
| AGGGCCTTACACGTACTGCAACCATTTTCATGCTGGGTGGTGGCTATTTG | |
| TTCATGCTGAGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATC | |
| TGCGTTTGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCATAT | |
| ACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGT | |
| CCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCG | |
| ATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAATACGTGTAAGG | |
| GCAGCCATATGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCT | |
| ACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTCGTAAGCCGCATAT | |
| CATATGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGC | |
| CCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGG | |
| GGTTGCAATACGTGTAAAGCCCTGTGCATTAAGCCGGCCATGAGTCGTAA | |
| CATGGCCGGCTTAATGCACAGGGCCTTACATGTATTGCAACCATTTTCAT | |
| ACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTA | |
| TATTGCAACCATTTTCATGCTGGTTGGTGGCTATTTGAGATGCGTTAGGC | |
| CGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAG | |
| GCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGA | |
| AGGGCCTTACACGTATTCCAACCATTTTCATGCTGGGTGGTGGCTATTTG | |
| ATATGAAGGTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCA | |
| GTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGC | |
| TTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTTTTGCAACC | |
| TCTCAAATAGCCACCACCCAGCATGAAAATGGTTTCAATACGTGTAAGGC | |
| CCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGG | |
| GCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTCGTAAGCCG | |
| CAGCATGAAAATGGTTGCAATACGTGTAATGCCCTGTGCATTAAGCCGGC | |
| CAAGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTT | |
| TGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGA | |
| AGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCATATGCCTTC | |
| TTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCGCAAAT | |
| CCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCC | |
| GAAAATGGTTGCACTACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAG | |
| TTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCATATGGCT | |
| CACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTT | |
| TTAGTTGGCCGCCTAACGCATCTCAAATAGACACCACCCAGCATGAAAAT | |
| TTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAAGTTCATATGGCT | |
| GGATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCA | |
| ATGTGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCA | |
| ACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAAC | |
| GCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGA | |
| TCAAATAGCCACCACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCC | |
| TGATAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGA | |
| CCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGG | |
| CCATATGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACG | |
| GGGCCTTACACGTATTACAACCATTTTCATGCTGGGTGGTGGCTATTTGA | |
| TTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAA | |
| TATGCGGCTTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTA | |
| GTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCAACCACCCAG | |
| GCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGA | |
| AATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGG | |
| AGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAA | |
| TCATGGCCGGCTTAATGCACATGGCCTTACACGTATTGCAACCATTTTCA | |
| ATGCTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTCGT | |
| GGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGT | |
| ATGGCCGGCTTAATGCACAGGGCCTTACACGGATTGCAACCATTTTCATG | |
| TGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGGCGTAAGCC | |
| ATGCGGCTTACGACTCATGGCCGGCTAAATGCACAGGGCCTTACACGTAT | |
| GTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCATAAAAATGGT | |
| ATATGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACACA | |
| TGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATACGTTAGGCGGC | |
| TCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAATACGTGTAAGGC | |
| CGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTGTCATGCTGGG | |
| TCATGGCCGGCTTAATCCACAGGGCCTTACACGTATTGCAACCATTTTCA | |
| TACACGTATTGCAACCATTTTCATGCTGGTTGGTGGCTATTTGAGATGCG | |
| CAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCA | |
| TCCACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCG | |
| ATAGCCACCACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTG | |
| CCGTGCAGGTTCTTGATTGAGTTGGCCGCCTAACGCATCTCAAATAGCCA | |
| GCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGA | |
| CAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTT | |
| GCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAATA | |
| CGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAAT | |
| GCCGGCTTAATGCACAGGGCCTTACAGGTATTGCAACCATTTTCATGCTG | |
| GCTTAATGCACAGGGCCTTACACGTATTGCAACCATCTTCATGCTGGGTG | |
| GCCGCCTAACGCATCTCAAATAGCCACCTCCCAGCATGAAAATGGTTGCA | |
| TGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAATGGTTG | |
| CAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACC | |
| ATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTCGTAAGCCGCAT | |
| ATTGCAACCATTTTCATGCTGGGTGGTGGTTATTTGAGATGCGTTAGGCG | |
| AGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCC | |
| TTTGAGATGGGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAAC | |
| GTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAATGGT | |
| CATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAA | |
| TGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTT | |
| TGCAACCATTTTCATGCAGGGTGGTGGCTATTTGAGATGCGTTAGGCGGC | |
| ATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGGCATGAGTCGT | |
| GGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAG | |
| CCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAAGAGCCA | |
| CCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCG | |
| CACCACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTA | |
| GGCCGCCTAACGCATCTCAAATAGCCACCACCCAGAATGAAAATGGTTGC | |
| CTTACACGTATTGCAACCTTTTTCATGCTGGGTGGTGGCTATTTGAGATG | |
| AATACGTGTAAGGCCCTGTGCATTAAGCTGGCCATGAGTCGTAAGCCGCA | |
| CATGGCCGGCTTAATGCACAGGGCCTTACACGGATTGCAACCATTTTCAT | |
| ATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAA | |
| ACATATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTA | |
| ATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGC | |
| CATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAATACGTGTAAG | |
| GCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCC | |
| CCACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAG | |
| CGGCTTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGC | |
| GGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAG | |
| ATTTAGTTGGCCGTCTAACGCATCTCAAATAGCCACCACCCAGCATGAAA | |
| CTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACG | |
| CACCACCCAGCATGAAAATGGTTGCAATACCTGTAAGGCCCTGTGCATTA | |
| ATATGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCA | |
| AGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTG | |
| TATCCCGTGCAGGTTATTGATTTAGTTGGCCGCCTAACGCATCTCAAATA | |
| ACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGT | |
| TGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGA | |
| CACCCAGCATGAAAATGGTTGCAATACGTGTAAAGCCCTGTGCATTAAGC | |
| TAGGCGGCGAACTAAATCAAGAACCTGCACGGGATAACTTCATATGGCTT | |
| GCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTCGTAAGCCG | |
| CCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAA | |
| AGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAATGG | |
| GGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGA | |
| CGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCATATGG | |
| AATGGTTGCAATACGTGTAAGGGCCTGTGCATTAAGCCGGCCATGAGTCG | |
| ACTACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCAT | |
| TGGCCGACTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGC | |
| CCATTTTCATGCTGGGTGGTGGTTATTTGAGATGCGTTAGGCGGCCAACT | |
| ATATGCGGCTTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACCCGT | |
| CTTGATTTAGTTGGCCGCCTAACGCATCTCAAATTGCCACCACCCAGCAT | |
| TCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAATACGTGTAAGGC | |
| CTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGCGTGG | |
| TGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTT | |
| GAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTC | |
| GCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTGGGCGGCC | |
| CCTTACACGTATGGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGAT | |
| TGGTTGCAATACGTGTAAGGCCCTGTACATTAAGCCGGCCATGAGTCGTA | |
| CCATATGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACG | |
| CATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAA | |
| TAACGCATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAATACGT | |
| AATACGTGTAAGGCTCTGTGCATTAAGCCGGCCATGAGTCGTAAGCCGCA | |
| GATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCAT | |
| ACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTAAGATGCGT | |
| GCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCC | |
| TATGCGGCTTACGACTCATGGCCGGCTTAATGCACAGGGCCTTAGACGTA | |
| CTAACGCAACTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAATACG | |
| TGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAATGGTTG | |
| TTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAAC | |
| AATGCACAGGGCCTTACACGTATTGCAACCATTTTCATACTGGGTGGTGG | |
| TAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAATG | |
| AGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCC | |
| GCACAGGGCCTTACACGTATTGCAACCATGTTCATGCTGGGTGGTGGCTA | |
| TACACGTATTGCAACCATTTGCATGCTGGGTGGTGGCTATTTGAGATGCG | |
| GGGCCTTACACGTATTGTAACCATTTTCATGCTGGGTGGTGGCTATTTGA | |
| CCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGG | |
| CTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCC | |
| GAAGCCATATGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCT | |
| AATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTCG | |
| CTTAATGCACAGGGCCTTACACGTATTGCGACCATTTTCATGCTGGGTGG | |
| CTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAAC | |
| TTGGCCGCCTAACGCATCTCAAAAAGCCACCACCCAGCATGAAAATGGTT | |
| CAGGGCCTTACACGTATTGCAACCATTTTGATGCTGGGTGGTGGCTATTT | |
| CTTAATGCACAGGGCCTTACACGTATTGCAACCATGTTCATGCTGGGTGG | |
| AGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCA | |
| TGGCTATTTGAGATGCGTTAGGCGGGCAACTAAATCAAGAACCTGCACGG | |
| GTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGGACG | |
| TGGCCGGCTTAATGCACAGGGCCGTACACGTATTGCAACCATTTTCATGC | |
| TTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAA | |
| TGATTTAGTTGGCCGCTTAACGCATCTCAAATAGCCACCACCCAGCATGA | |
| GGGCAAATGCAGCCATGCCCAAATATATTTGGGCATGGCTGCATTTGCCA | |
| GGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGT | |
| GCGCATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAATACGTGT | |
| ACAGGGCCTTACACGTATTGCAACCATTCTCATGCTGGGTGGTGGCTATT | |
| CGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAG | |
| GGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGG | |
| ACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTCGTAAGCCGCATAT | |
| ACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTCTT | |
| TAGCCACCACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGC | |
| GCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCAC | |
| GAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTC | |
| CGACTGATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATT | |
| TACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCG | |
| GCCATATGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAAC | |
| GAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTC | |
| GCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCAC | |
| TATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCCAACGCATCTCAAATA | |
| ATGAAAATGGTTGCAATACGTGTCAGGCCCTGTGCATTAAGCCGGCCATG | |
| TGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTT | |
| GACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTT | |
| GCCATATGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAAC | |
| GGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCA | |
| CGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAAGGGTTGCAAT | |
| CGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGG | |
| CCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGG | |
| CATGGCCGGCTTAATGCACAAGGCCTTACACGTATTGCAACCATTTTCAT | |
| GTGCAGGTTCTTGATTTAGTTTGCCGCCTAACGCATCTCAAATAGCCACC | |
| GCCACAACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCAT | |
| ATACGGGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTCGTAAGCCGCAT | |
| GCCACCACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCAT | |
| CACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTAT | |
| ATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAG | |
| GAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTC | |
| GCCGCCCAACGCATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCA | |
| CCATTTTCATGCTGGGTGGTGGCTATTTCAGATGCGTTAGGCGGCCAACT | |
| AGGCGGCCAACTAAAGCAAGAACCTGCACGGGATAACTTCATATGGCTTC | |
| AGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAATGG | |
| TTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAATTAAAT | |
| TATGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCAT | |
| AAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGT | |
| ATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTCGTAAGCCGCAT | |
| GGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTG | |
| GGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCT | |
| CTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGAT | |
| CAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACC | |
| GCATCTCAAATAGCCACCACCCAGCATGAAAATGATTGCAATACGTGTAA | |
| GGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCATATGGCTTCA | |
| ATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCATA | |
| AACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAA | |
| TATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAACTA | |
| ACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGAGGTGGCTATT | |
| CCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCA | |
| GGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTCCACGGG | |
| AGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCC | |
| CAACACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTCGTAAGCCGC | |
| TTGAGATGCGTTAGGCGGCCAACTAAATCAAGGACCTGCACGGGATAACT | |
| CTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGAT | |
| TGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGA | |
| GACTCATGGCCGGCTTTATGCACAGGGCCTTACACGTATTGCAACCATTT | |
| GCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCATATG | |
| TATGCGGCTTACGACTCATGGCCGGCTTAATGAACAGGGCCTTACACGTA | |
| AAATGGTTGCCATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTC | |
| ACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAAC | |
| TTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTCGTAAGC | |
| GGTGGGTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCAC | |
| CTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGACAACTAAATCAAGAAC | |
| TTCTTGATTTAGTTGGCCGCCTAACGCATCTCAACTAGCCACCACCCAGC | |
| GCAACCATTTTCATGCTGGGTAGTGGCTATTTGAGATGCGTTAGGCGGCC | |
| ATGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATC | |
| AGCGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTG | |
| TGCGGCTTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTTTT | |
| GGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCATATGGCTTAA | |
| GGCCGCCTAACGCATCCCAAATAGCCACCACCCAGCATGAAAATGGTTGC | |
| CCACCACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATT | |
| ATGGCCGGCTTAATGCACAGGGCCTTACACGTATCGCAACCATTTTCATG | |
| GAAAATGGTTGCAATACGTGTAAGGCCCTGTGAATTAAGCCGGCCATGAG | |
| TACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCG | |
| GGCCGGCTTAATGCACAGGGCCTTACACGAATTGCAACCATTTTCATGCT | |
| AGCCATATGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGCCCGCCTAA | |
| TGCACAGGGCCTTACACGGATTGCAACCATTTTCATGCTGGGTGGTGGCT | |
| CACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTT | |
| TCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCTACTAAATCA | |
| TGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTCGTA | |
| ACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCC | |
| GCTTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAA | |
| AATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGG | |
| CGCATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAAGACGTGTA | |
| GGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCA | |
| ACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATT | |
| GCCATATGAAGTTATCCCGTGCAGGTTCTTGATTTAGCTGGCCGCCTAAC | |
| CATGCTGGTTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAA | |
| AGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCA | |
| TCAAATAGCCACCACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCC | |
| ATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAA | |
| TCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCATATG | |
| CTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAAC | |
| TGCTGGGTGGTGGCTATTTGAGATGTGTTAGGCGGCCAACTAAATCAAGA | |
| ATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAG | |
| GATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCAAGCATGAA | |
| CCACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAG | |
| CGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCAC | |
| GTTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAA | |
| CGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGG | |
| TATGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCAT | |
| CTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATG | |
| TATGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCACCTAACGCAT | |
| AGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCC | |
| CCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTTAGCCGG | |
| GCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCATGGGA | |
| ACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTCGTAAGCCGCATAT | |
| CTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGAT | |
| ATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTCATG | |
| CTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCC | |
| GCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTGAATCAAGAA | |
| GGCTTAATGCACAGGGCATTACACGTATTGCAACCATTTTCATGCTGGGT | |
| GCTGGCTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAA | |
| CACCACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTA | |
| GTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTC | |
| GGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGA | |
| GCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCATATG | |
| GGTGGCTATTTGAGATGCGTTAGGCGGCCCACTAAATCAAGAACCTGCAC | |
| CACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTCGTAAGCCGCATA | |
| TGCAATACGTGTAAGGACCTGTGCATTAAGCCGGCCATGAGTCGTAAGCC | |
| CATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCAT | |
| AATAGCCACCACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGT | |
| CACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGT | |
| ATCCCGTGCAGGATCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAG | |
| TTAGGCGGCCAACTAGATCAAGAACCTGCACGGGATAACTTCATATGGCT | |
| GAGATGCGTTAGGCGGCTAACTAAATCAAGAACCTGCACGGGATAACTTC | |
| ATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAA | |
| GGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCT | |
| TGCACAGGGCCTTACACGTATTGCAACCATTTTCTTGCTGGGTGGTGGCT | |
| AAGTTGTCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCA | |
| CGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAACAGCCAC | |
| CCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGG | |
| TGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCGATGAGTCGTA | |
| AGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCATATGGCTTC | |
| TGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGC | |
| ATAGCCACCACCCAGGATGAAAATGGTTGCAATACGTGTAAGGCCCTGTG | |
| CCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAATAC | |
| ATTTGAGATGCGTTACGCGGCCAACTAAATCAAGAACCTGCACGGGATAA | |
| ATGCGGCTTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTAT | |
| CCATATGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACG | |
| GGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAG | |
| GGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCATATGGCTTCA | |
| CCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAATGGTAGCAATAC | |
| TCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAAGACGTGTAAGGC | |
| GCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTTAGCCGGCCA | |
| GGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAG | |
| CCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGG | |
| ATGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTG | |
| GCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTTGGTGGTGGCTA | |
| TTTTCATGCTGGGTGGTTGCTATTTGAGATGCGTTAGGCGGCCAACTAAA | |
| AGGCGGCCAACAAAATCAAGAACCTGCACGGGATAACTTCATATGGCTTC | |
| CGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATT | |
| CTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATG | |
| ACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCC | |
| GGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAG | |
| ATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGCCCAACTAAATCAAG | |
| TCATGCTCGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCA | |
| GCATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAATACGTGTAA | |
| ATGCTGGGAGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAG | |
| CATATGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGC | |
| TTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACT | |
| TTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACC | |
| ATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTCATG | |
| GGCTTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGTA | |
| GATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCAT | |
| TTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAAT | |
| GGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCA | |
| TTCATGCTGGGTGGTGGCTATTTGAGATTCGTTAGGCGGCCAACTAAATC | |
| ATACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGC | |
| CACCACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTA | |
| TACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCA | |
| TGTCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGC | |
| TGGTGGCTATTTGAGATGCGTTAGGCGGCAAACTAAATCAAGAACCTGCA | |
| AACGCATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAATACGTG | |
| AAGTTATCCCGTGCAGGTTCTTCATTTAGTTGGCCGCCTAACGCATCTCA | |
| TATTTGAGATGCGTTAGGCGGCCATCTAAATCAAGAACCTGCACGGGATA | |
| TCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCA | |
| TGCAGGTTCTTGATTTAGTGGGCCGCCTAACGCATCTCAAATAGCCACCA | |
| TGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAA | |
| TCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGC | |
| GCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCATATG | |
| CACAGGACCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTAT | |
| ATGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATC | |
| CCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGG | |
| AGCCACCACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCA | |
| TAACGCATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAATACGT | |
| TTAGGCGGCCAACTAAATCTAGAACCTGCACGGGATAACTTCATATGGCT | |
| GCCTAACGCCTCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAATA | |
| ACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTT | |
| GAAACTGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAG | |
| GCCATATGCAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAAC | |
| AAGCCATATGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTA | |
| GGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGT | |
| GGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCT | |
| CTTAATGCCCAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGG | |
| GTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATAAAGAACCTGCACG | |
| AGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTG | |
| ATGCACAGGGCCTTAAACGTATTGCAACCATTTTCATGCTGGGTGGTGGC | |
| CGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAG | |
| GCACAGGGCCTTACACGTATTGCAACCATTTTCATGCAGGGTGGTGGCTA | |
| GGTGGCTATTCGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCAC | |
| CATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTA | |
| TAGCCACCACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCACTGTGC | |
| AGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAA | |
| ATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAA | |
| ATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGC | |
| TGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTT | |
| TGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGGCACCA | |
| AGCCACTACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCA | |
| CAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGCC | |
| TTACGACTCATGGCCGGCTTCATGCACAGGGCCTTACACGTATTGCAACC | |
| CTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCC | |
| TAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAATG | |
| ACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATT | |
| TTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCCCCACCCAGC | |
| GACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTT | |
| CCGCCTAACGCATTTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAA | |
| TGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTCGTAAGCC | |
| AGGGCCTTACACGTATTGCAACCATTTACATGCTGGGTGGTGGCTATTTG | |
| ATATGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCA | |
| TTAATGCACAGGGCCTTACACGTATTGCGACCATTTTCATGCTGGGTGGT | |
| TACGACTCATGGCCGGCTTAATGCACAGGGCCTTGCACGTATTGCAACCA | |
| TTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAAC | |
| GGTTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAA | |
| ATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAATACGTGTAAGG | |
| TATGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGGAT | |
| TTGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGC | |
| GATTTAGTTTGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAA | |
| GGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATACCCACCACCCA | |
| GTTGCAAAACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTCGTAAG | |
| AACCATTTTCATTCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAA | |
| TGCAGGTTCTTGATTGAGTTGGCCGCCTAACGCATCTCAAATAGCCACCA | |
| TTTAGTTGGCCGCCTTACGCATCTCAAATAGCCACCACCCAGCATGAAAA | |
| GGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCT | |
| GCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAATA | |
| GGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCT | |
| CGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCAC | |
| TAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCATATGGCTT | |
| CAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCA | |
| TCAAATAGCCACCTCCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCC | |
| CGACTCATGGCGGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATT | |
| CCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACT | |
| TGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAATGGTTG | |
| CTTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAAC | |
| CCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGTCA | |
| ACCACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAA | |
| CGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCATATGG | |
| CCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAA | |
| GAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTC | |
| CTTGATTTAGTTGGCCTCCTAACGCATCTCAAATAGCCACCACCCAGCAT | |
| CTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATG | |
| GTATTGCAACCATTTTCTTGCTGGGTGGTGGCTATTTGAGATGCGTTAGG | |
| AAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCACGAGT | |
| TGAAAATGGTTGCAATACGTGTAAGGCCCTGTGTATTAAGCCGGCCATGA | |
| TCAAATAGCCACCACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCC | |
| CCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGAT | |
| GAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTC | |
| CAGGTTCTTGATTTAGTTGGTCGCCTAACGCATCTCAAATAGCCACCACC | |
| AACCATTTTCATGCTGGGTGGTGGCTACTTGAGATGCGTTAGGCGGCCAA | |
| GCTGGGTGGTGGCTATGTGAGATGCGTTAGGCGGCCAACTAAATCAAGAA | |
| AGCCACCACCCAGCATGAAAATAGTTGCAATACGTGTAAGGCCCTGTGCA | |
| CCTTACACGTATTGCAGCCATTTTCATGCTGGGTGGTGGCTATTTGAGAT | |
| GCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTA | |
| TTACGACTGATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACC | |
| TCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCACAAATAGC | |
| GCCACCACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCAT | |
| AGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCA | |
| ACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTT | |
| GGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGG | |
| CATGGCCGGCTTAATGTACAGGGCCTTACACGTATTGCAACCATTTTCAT | |
| CATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAA | |
| GCGGCTTACGACTCATGGCCGGTTTAATGCACAGGGCCTTACACGTATTG | |
| TCGGCTTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTG | |
| TGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGA | |
| CGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCATATGG | |
| TTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGC | |
| CATATGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGC | |
| CACAGGGCCTTACACGTATTGCACCCATTTTCATGCTGGGTGGTGGCTAT | |
| TTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACC | |
| CCATATGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACG | |
| CATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTCAT | |
| CTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGAT | |
| CGGCTTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGC | |
| ACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGT | |
| CCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAATAC | |
| CAAATATCCACCACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCT | |
| TGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCT | |
| ATTTGAGATGCGTTAGGCGGCTAACTAAATCAAGAACCTGCACGGGATAA | |
| CTTAATGCACAGGGCCTTACATGTATTGCAACCATTTTCATGCTGGGTGG | |
| CCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCA | |
| CATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAATACGTGTAAG | |
| GGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCT | |
| ACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCAATTTGAGATGCGT | |
| GGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCT | |
| GCCATATGAAGTTATCCCGTGCAGGTACTTGATTTAGTTGGCCGCCTAAC | |
| CCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGAT | |
| GTTGCAATACGTGTAAGGCCCTGTGCAGTAAGCCGGCCATGAGTCGTAAG | |
| AATGGTTGCAATACGTGTAAGGCCCTGTGCATTGAGCCGGCCATGAGTCG | |
| GTATTGCAACCATTTTCATGCTGGTTGGTGGCTATTTGAGATGCGTTAGG | |
| TAATGCACATGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTG | |
| GTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGC | |
| GGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGT | |
| TTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAAC | |
| AATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATA | |
| GTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCATG | |
| TGCAACCATTTTCATGCTTGGTGGTGGCTATTTGAGATGCGTTAGGCGGC | |
| GCCACTACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCAT | |
| CTTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAAC | |
| CCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGG | |
| TAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAAGG | |
| CAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCA | |
| CTTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAAC | |
| ATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAA | |
| TACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCA | |
| GATTTAGTTGGCCGCCTAACGCATCTAAAATAGCCACCACCCAGCATGAA | |
| CCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAA | |
| CTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCGACCATTTTC | |
| TTGGCCGCCTAACGCATCTCAAATAGCCCCCACCCAGCATGAAAATGGTT | |
| GCTTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAA | |
| TAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAATG | |
| CCACCACCTAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATT | |
| GGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCA | |
| CCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCGACT | |
| ATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAG | |
| CTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATG | |
| GGCGGCCAACTAAATCAAGAAGCTGCACGGGATAACTTCATATGGCTTCA | |
| TTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGTATGAAAA | |
| ACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTT | |
| GCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTG | |
| ATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGGGATGCGTTAGGCG | |
| CCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATGTGAGAT | |
| ATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCGCCCAGCATGAAA | |
| TCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAATACGTGTAAGGC | |
| ATTTGAGATGCGTTAGGCGGCCAACTAAATGAAGAACCTGCACGGGATAA | |
| CATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAA | |
| ATTTAGTTGGCCGCCTAACGCATATCAAATAGCCACCACCCAGCATGAAA | |
| TTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAATGGTT | |
| TCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCA | |
| ACGACTCATGGCCGGCTTAATGCACAGGGCCTTAAACGTATTGCAACCAT | |
| AGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCC | |
| GCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAA | |
| CGGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAAC | |
| GACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTT | |
| TGCGGCATACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATT | |
| CTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCAT | |
| TACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCA | |
| TATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATA | |
| TGAAAATGTTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGA | |
| GCCATATGAAGTTATCCCGTCCAGGTTCTTGATTTAGTTGGCCGCCTAAC | |
| TCCCGTGCAGGTCCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGC | |
| GGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGT | |
| ATGTCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTCATG | |
| TACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTCGTGAGCCGCATA | |
| TGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGA | |
| TGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCA | |
| GGCCGGCTTAATGCACAGGGCCTTACACGGATTGCAACCATTTTCATGCT | |
| GCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCA | |
| TGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTCGTA | |
| AAGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTCGTAAGCCGCATAT | |
| AACCATTTTCATGCTGGGTGGTGGCTATGTGAGATGCGTTAGGCGGCCAA | |
| AAATAGCCACCACCCAGCCTGAAAATGGTTGCAATACGTGTAAGGCCCTG | |
| AAAGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGG | |
| TAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCATATGGCTT | |
| GGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTG | |
| TACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTCGTAAGCCGCATA | |
| GCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAATA | |
| CTTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAAC | |
| CTATATGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGAT | |
| ACTCATGGCCAGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTT | |
| GGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAAGCTGCAC | |
| GCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAATAGTTGCAATA | |
| AACGCATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAATACGTG | |
| ATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTCGTAAGCCGCAT | |
| CATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAA | |
| TAATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTG | |
| GACTCATGGTCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTT | |
| CAATACGTGTAAGGCCCTGTGCATTAAGCCGGTCATGAGTCGTAAGCCGC | |
| TTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTCGTAAGC | |
| GGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGT | |
| TTTACATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAA | |
| TTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCATG | |
| TTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCATG | |
| CGACTCATGCCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATT | |
| GAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAG | |
| ACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTT | |
| ACGACTCATGGCCGGCTTAATGCACAGGGCCTCACACGTATTGCAACCAT | |
| ATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACTCATCTCAAATAG | |
| GTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGC | |
| GGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCAC | |
| TGCGTTAGGCGGACAACTAAATCAAGAACCTGCACGGGATAACTTCATAT | |
| CATATGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGC | |
| GAAGCCATATGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCT | |
| TACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGGTGCG | |
| ACCACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAA | |
| CAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCA | |
| GCCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCA | |
| CACCACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTA | |
| ATATGCGGCTTACGACTCATGGCCGGCTTGATGCACAGGGCCTTACACGT | |
| GCATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAATACGTGTAA | |
| TGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGA | |
| AAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTC | |
| ATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCATA | |
| TTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAA | |
| ACCACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAA | |
| GCGGCTTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTG | |
| CGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAG | |
| CGACTCATGGTCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATT | |
| ATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCATA | |
| CTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCAT | |
| AAATAGCCACCACCCAGCATGAAAATGGTTGCCATACGTGTAAGGCCCTG | |
| GCTTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAA | |
| GTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAG | |
| CAGCTTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGC | |
| ATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATG | |
| TATTTGACATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATA | |
| TGGCTATTTGAGATGCGTTAAGCGGCCAACTAAATCAAGAACCTGCACGG | |
| TTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTCGTAAGC | |
| GCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCC | |
| CGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGAATCTCAAATAGCCAC | |
| TCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCA | |
| TGAAGCTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCT | |
| AAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGT | |
| GCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCATATG | |
| TGCGGCTTACGAGTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATT | |
| GCCGGCTTAATGCACTGGGCCTTACACGTATTGCAACCATTTTCATGCTG | |
| ATGGCCGGCTTAATGCATAGGGCCTTACACGTATTGCAACCATTTTCATG | |
| TATCCCGTGCAGGTTCTTGATTTAGTTCGCCGCCTAACGCATCTCAAATA | |
| ACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTT | |
| GTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAA | |
| CGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGG | |
| AAGCCATATGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTA | |
| ATGAGGCTTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTAT | |
| CTTACGACTCATGGACGGCTTAATGCACAGGGCCTTACACGTATTGCAAC | |
| GATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCAT | |
| TGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAGAATGGTTG | |
| CCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAATAC | |
| GGTTCTTGATTTAGTTAGCCGCCTAACGCATCTCAAATAGCCACCACCCA | |
| TCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCA | |
| ATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAATACTTGTAAGG | |
| CACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTAT | |
| GGCTTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCA | |
| TCATGCTGGGTGGTGGCTATTTGAGCTGCGTTAGGCGGCCAACTAAATCA | |
| AAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCA | |
| CATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTA | |
| TTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTCGTAAGC | |
| CACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTT | |
| CAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCA | |
| TTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGC | |
| GTGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCATATG | |
| TTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAACT | |
| GCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCC | |
| GCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCAC | |
| TATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCATGGGATA | |
| ATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATG | |
| GTTAGGCGGCCAACTAAATCAAGAACCTGCTCGGGATAACTTCATATGGC | |
| TGGTGGCTATTTGAGATGTGTTAGGCGGCCAACTAAATCAAGAACCTGCA | |
| GATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAA | |
| GGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCA | |
| GTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAATGGT | |
| GCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGGTG | |
| TTAGGCGGCCAACTAAATCCAGAACCTGCACGGGATAACTTCATATGGCT | |
| TGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATTGCCACCA | |
| AGCATGAAAATGGTTGCAATACGTGTAATGCCCTGTGCATTAAGCCGGCC | |
| CAGGGCCTTACACGTATTGCTACCATTTTCATGCTGGGTGGTGGCTATTT | |
| GCTATTTGAAATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGA | |
| ACCATTTTCATGCGGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAAC | |
| ATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGC | |
| AGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCA | |
| GCCTAACGCATCTCAAATAGCCACCGCCCAGCATGAAAATGGTTGCAATA | |
| TCATGGCCGGCTTAATGCACAGGGCCTTACACGAATTGCAACCATTTTCA | |
| ACCACCCAGCATGAAAATGGTTGCAATTCGTGTAAGGCCCTGTGCATTAA | |
| ATAGCCACCACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTG | |
| CCATATGAAGTTATCCCGTGGAGGTTCTTGATTTAGTTGGCCGCCTAACG | |
| TTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATC | |
| GCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCA | |
| TTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGTGTCGTAAGC | |
| TTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTGCATATGGCT | |
| ATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGATGGC | |
| ACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTT | |
| TTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAAT | |
| TAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAATG | |
| ATGCTGGGTAGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAG | |
| TGCGTTAGGCGGCCAACTAAATCAAGATCCTGCACGGGATAACTTCATAT | |
| AATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGG | |
| TGCGGCTTACGACTCATAGCCGGCTTAATGCACAGGGCCTTACACGTATT | |
| ATGCGGCTTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTAT | |
| TTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGG | |
| TAGCCACCACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGC | |
| TGAAAAGGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGA | |
| TACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCC | |
| GCATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAATACGTGTAA | |
| TACAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCA | |
| CGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAG | |
| TTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAA | |
| CCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAATAC | |
| GGGCAAATGCAGCCATGCCCAAATATATTTGGGCATGGCTGCATTTGCCA | |
| AAGCCATATGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTA | |
| GCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCAA | |
| ACGTATTGCAACCATTTTCATGCTGGGTGGTTGCTATTTGAGATGCGTTA | |
| GAAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCAC | |
| GTATTGCAACCATTTTCATGCTGGCTGGTGGCTATTTGAGATGCGTTAGG | |
| CAGCATGAAAATGGTTGCAATACGTATAAGGCCCTGTGCATTAAGCCGGC | |
| CCGTGCAGGTTCTTGATCTAGTTGGCCGCCTAACGCATCTCAAATAGCCA | |
| ATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCG | |
| CCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAA | |
| TGGCCGGCTTAATGCACAGGGCCTTACGCGTATTGCAACCATTTTCATGC | |
| ACGTATTGCAACCATTTTCATGCTGGGTGGTAGCTATTTGAGATGCGTTA | |
| AAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCA | |
| TAACGCATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAATACGT | |
| TGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCT | |
| CATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAA | |
| ATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAA | |
| TGATTTAGTTGGTCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGA | |
| CAGCATGAACATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGC | |
| TTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTCGTAAGC | |
| CTCATGGCCGGCTTAATGCACAGGGCCTTACACGTGTTGCAACCATTTTC | |
| CCATATGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACG | |
| TTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAAT | |
| GCCTAACGCATCTCAAATAGCCACCACCCAGCATGGAAATGGTTGCAATA | |
| GCATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAATACGTGTAA | |
| GATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACACAGCATGAA | |
| TTAATGCTCAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGT | |
| GGTTGCAATACGTGTAAGGCCCTGTCCATTAAGCCGGCCATGAGTCGTAA | |
| GCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGA | |
| CCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACT | |
| TTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGC | |
| CGTCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAAT | |
| TTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGG | |
| TTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGC | |
| CCTTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGAT | |
| GGCTTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCA | |
| TATGCGGGTTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTA | |
| GCGGCTTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTG | |
| GAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCAGCCATGAG | |
| CCACCACCCAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTACATT | |
| CGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAAT | |
| GCCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCA | |
| GCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTCGTAAGCCG | |
| CATGGCCGGCTTAATGCACAGGGCCATACACGTATTGCAACCATTTTCAT | |
| AGCCATATGAAGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAA | |
| TTAATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGCTGGGTGGT | |
| ATGCGACTTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTAT | |
| CAATACGTGTAAGGCCCTGTGCATTAAGCCGGCTATGAGTCGTAAGCCGC | |
| GCCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCA | |
| CGCATCTCAAATAGCCACCACCCAGCATGAAAATGGTTGCAATTCGTGTA | |
| CACCCAGCATGAAAATGGTTGCAATACGTGTAAGGTCCTGTGCATTAAGC | |
| ATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCATA | |
| AATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTCG | |
| ATGGGTGCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTCGT | |
| TGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCAACCATTTTCATGC | |
| TCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCA | |
| ATATGCGGCTTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGT | |
| TTACACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGC | |
| TGAAGTTATCCCGTGCAGGTTCGTGATTTAGTTGGCCGCCTAACGCATCT | |
| ACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCCAC | |
| CCCAGCACGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCATTAAGCCG | |
| GCAATACGTGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTCGTAAGCCG | |
| CTGGGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAAC | |
| AGCCACCACCTAGCATGAAAATGGTTGCAATACGTGTAAGGCCCTGTGCA | |
| GATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCAT | |
| GGTGGCTATTTGAGATGCGTTAGGCGGCCAAGTAAATCAAGAACCTGCAC | |
| GGCTTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATTGCA | |
| ATATGCGGCTTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGT | |
| GCGGCTTACGACTCATGGCCGGCTTAATGCATAGGGCCTTACACGTATTG | |
| TTCTTGATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGC | |
| TGCGGCTTACGACTCATGGCCGGCTTAATGCACAGGGCCTTACACGTATT | |
| TGGCTATTTGAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGG | |
| CACGTATTGCAACCATTTTCATGCTGGGTGGTGGCTATTTGAGATGCGTT | |
| GAGATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTC | |
| AGTTATCCCGTGCAGGTTCTTGATTTAGTTGGCCGCCTAACGCATCTCAA | |
| CTTAATGCACAGGGCCTTACCCGTATTGCAACCATTTTCATGCTGGGTGG | |
| AACCATTTTCATGCTGTGTGGTGGCTATTTGAGATGCGTTAGGCGGCCAA | |
| ATTTAGTTGGCCGCCTAACGCATCTCAAATAGCCACCTCCCAGCATGAAA | |
| GCAATACGCGTAAGGCCCTGTGCATTAAGCCGGCCATGAGTCGTAAGCCG | |
| ATGCGTTAGGCGGCCAACTAAATCAAGAACCTGCACGGGATAACTTCATA | |
| TAGTTGGCCGCCTAACGCATCTCAAATAGCCACCACCCAGCATGAAAATG |
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
| #!/usr/bin/python | |
| import itertools | |
# Watson-Crick complement of each supported base; 'N' (unknown base) maps to itself.
_DNA_COMPLEMENT = {'A': 'T', 'C': 'G', 'G': 'C', 'T': 'A', 'N': 'N'}


def revTransDNA(seq, lowerCaseReturn=False):
    """Return the reverse complement of a DNA sequence.

    The input is read back to front and every base is replaced by its
    complement (A<->T, C<->G, N->N). Input case is ignored: each base is
    upper-cased before the lookup.

    Args:
        seq: any reversible sequence of single-character bases (normally a
            str made of A, C, G, T or N, in either case).
        lowerCaseReturn: when truthy the result is returned in lower case,
            otherwise in upper case. Any falsy value (False, None, 0, "")
            selects upper case.

    Returns:
        The reverse complement as a str.

    Raises:
        KeyError: if ``seq`` contains a character other than A, C, G, T, N.
    """
    complement = "".join(_DNA_COMPLEMENT[base.upper()] for base in reversed(seq))
    # Plain truthiness instead of `== False`, so None/"" do not silently
    # select the lower-case branch.
    return complement.lower() if lowerCaseReturn else complement
class Dna:
    """A single DNA read plus the bookkeeping used to correct read errors.

    Each instance stores the read, its reverse complement, and a few flags
    and counters that are updated while reads are compared with each other
    (exact matches and matches at Hamming distance 1).
    """

    def __init__(self, header, sequence):
        """Create a read.

        Args:
            header: identifier of the read; exposed as ``head`` / ``name``
                and used to tell two reads apart in ``setPairFound``.
            sequence: the bases of the read.
        """
        self.head = header
        self.seq = sequence
        self.length = len(sequence)
        self.revTrans = revTransDNA(sequence)  # reverse complement of seq
        self.pair = False       # True once another read matches exactly
        self.oneErrorSeq = ""   # sequence found at Hamming distance 1
        self.reported = False   # True once the correction was printed
        self.appear = 1         # 1 + exact matches counted by setPairFound
        self.hammOneCount = 0   # reads found at Hamming distance 1

    def __str__(self, separator=''):
        """Return the read as a two-line ``>header`` / sequence record."""
        return ">{0}\n{1}".format(self.head, separator.join(self.seq))

    def __len__(self):
        """Return the number of characters in the joined sequence."""
        return len(''.join(self.seq))

    @staticmethod
    def _isHammingOne(first, second):
        """Return True if exactly one aligned position of the two differs.

        Stops at the second mismatch, so clearly different reads are
        rejected without scanning their full length.
        """
        mismatches = 0
        for s, t in zip(first, second):
            if s != t:
                mismatches += 1
                if mismatches > 1:
                    return False
        return mismatches == 1

    def completeMatch(self, other):
        """Return True if this read equals ``other`` or its reverse complement."""
        return self.seq in (other.seq, other.revTrans)

    def oneErrorMatch(self, other):
        """Return True if this read is one substitution away from ``other``.

        ``other.seq`` is tried first, then ``other.revTrans``. On success
        ``self.oneErrorSeq`` is set to whichever of the two matched.
        Returns False without comparing when this read has already been
        reported or when the stored lengths differ.
        """
        if self.reported or self.length != other.length:
            return False
        # The forward strand takes precedence over the reverse complement.
        for candidate in (other.seq, other.revTrans):
            if self._isHammingOne(self.seq, candidate):
                self.oneErrorSeq = candidate
                return True
        return False

    @property
    def name(self, separator=''):
        """The read's header.

        ``separator`` is unused; it is kept only so the getter signature
        stays as it was (a property getter cannot receive it via attribute
        access).
        """
        return self.head

    @property
    def sequence(self, separator=''):
        """The read's sequence joined into one string.

        ``separator`` always has its default value when accessed as an
        attribute.
        """
        return separator.join(self.seq)

    def setPairFound(self, other):
        """Record an exact match between this read and a different read.

        If ``other`` has a different name and matches this read (directly
        or as reverse complement), both reads get ``pair = True`` and this
        read's ``appear`` counter is incremented. ``other.appear`` is left
        untouched.
        """
        if self.completeMatch(other) and self.name != other.name:
            self.pair = True
            other.pair = True
            self.appear += 1

    def reportOneErrorMatch(self):
        """Print ``read->correction`` once, then mark the read as reported."""
        if not self.reported:
            self.reported = True
            print("{0}->{1}".format(self.seq, self.oneErrorSeq))

    def setErrorPairFound(self, other):
        """Increment ``hammOneCount`` if ``other`` is at Hamming distance 1.

        The comparison is delegated to ``oneErrorMatch``, so it also updates
        ``oneErrorSeq`` and considers ``other``'s reverse complement.
        """
        if self.oneErrorMatch(other):
            self.hammOneCount += 1
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment