diff --git a/src/cline_tools/gene.fasta b/src/cline_tools/gene.fasta new file mode 100644 index 0000000..99b3fd2 --- /dev/null +++ b/src/cline_tools/gene.fasta @@ -0,0 +1,238 @@ +>NC_001643.1 Pan troglodytes mitochondrion, complete genome +GTTTATGTAGCTTACCCCCTCAAAGCAATACACTGAAAATGTTTCGACGGGTTTACATCACCCCATAAAC +AAACAGGTTTGGTCCTAGCCTTTCTATTAGCTCTTAGTAAGATTACACATGCAAGCATCCCCGCCCCGTG +AGTCACCCTCTAAATCGCCATGATCAAAAGGAACAAGTATCAAGCACGCAGCAATGCAGCTCAAAACGCT +TAGCCTAGCCACACCCCCACGGGAGACAGCAGTGATAAACCTTTAGCAATAAACGAAAGTTTAACTAAGC +CATACTAACCTCAGGGTTGGTCAATTTCGTGCTAGCCACCGCGGTCATACGATTAACCCAAGTCAATAGA +AACCGGCGTAAAGAGTGTTTTAGATCACCCCCCCATAAAGCTAAAATTCACCTGAGTTGTAAAAAACTCC +AGCTGATACAAAATAAACTACGAAAGTGGCTTTAACACATCTGAATACACAATAGCTAAGACCCAAACTG +GGATTAGATACCCCACTATGCTTAGCCCTAAACTTCAACAGTTAAATTAACAAAACTGCTCGCCAGAACA +CTACGAGCCACAGCTTAAAACTCAAAGGACCTGGCGGTGCTTCATATCCCTCTAGAGGAGCCTGTTCTGT +AATCGATAAACCCCGATCAACCTCACCGCCTCTTGCTCAGCCTATATACCGCCATCTTCAGCAAACCCTG +ATGAAGGTTACAAAGTAAGCACAAGTACCCACGTAAAGACGTTAGGTCAAGGTGTAGCCTATGAGGTGGC +AAGAAATGGGCTACATTTTCTACCCCAGAAAATTACGATAACCCTTATGAAACCTAAGGGTCAAAGGTGG +ATTTAGCAGTAAACTAAGAGTAGAGTGCTTAGTTGAACAGGGCCCTGAAGCGCGTACACACCGCCCGTCA +CCCTCCTCAAGTATACTTCAAAGGATACTTAACTTAAACCCCCTACGTATTTATATAGAGGAGATAAGTC +GTAACATGGTAAGTGTACTGGAAAGTGCACTTGGACGAACCAGAGTGTAGCTTAACATAAAGCACCCAAC +TTACACTTAGGAGATTTCAACTCAACTTGACCACTCTGAGCCAAACCTAGCCCCAAACCCCCTCCACCCT +ACTACCAAACAACCTTAACCAAACCATTTACCCAAATAAAGTATAGGCGATAGAAATTGTAAACCGGCGC +AATAGACATAGTACCGCAAGGGAAAGATGAAAAATTATACCCAAGCATAATACAGCAAGGACTAACCCCT +GTACCTTTTGCATAATGAATTAACTAGAAATAACTTTGCAAAGAGAACCAAAGCTAAGACCCCCGAAACC +AGACGAGCTACCTAAGAACAGCTAAAAGAGCACACCCGTCTATGTAGCAAAATAGTGGGAAGATTTATAG +GTAGAGGCGACAAACCTACCGAGCCTGGTGATAGCTGGTTGTCCAAGATAGAATCTTAGTTCAACTTTAA +ATTTACCTACAGAACCCTCTAAATCCCCTTGTAAACTTAACTGTTAGTCCAAAGAGGAACAGCTCTTTAG +ACACTAGGAAAAAACCTTGTAAAGAGAGTAAAAAATTTAACACCCATAGTAGGCCTAAAAGCAGCCACCA +ATTAAGAAAGCGTTCAAGCTCAACACCCACAACCTTAAAGATCCCAAACATACAACCGAACTCCTTACAC 
+CCAATTGGACCAATCTATTACCCCATAGAAGAACTAATGTTAGTATAAGTAACATGAAAACATTCTCCTC +CGCATAAGCCTACATCAGACCAAAATATTAAACTGACAATTAACAGCCTAATATCTACAATCAACCAACA +AGCCATTATTACCCCCGCTGTTAACCCAACACAGGCATGCCCACAAGGAAAGGTTAAAAAAAGTAAAAGG +AACTCGGCAAATCTTACCCCGCCTGTTTACCAAAAACATCACCTCTAGCATTACCAGTATTAGAGGCACC +GCCTGCCCGGTGACATATGTTTAACGGCCGCGGTACCCTAACCGTGCAAAGGTAGCATAATCACTTGTTC +CTTAAATAGGGACTTGTATGAATGGCTCCACGAGGGTTTAGCTGTCTCTTACTTTCAACCAGTGAAATTG +ACCTACCCGTGAAGAGGCGGGCATAACATAACAAGACGAGAAGACCCTATGGAGCTTTAATTCATTAATG +CAAACAATACTTAACAAACCTACAGGTCCTAAACTATTAAACCTGCATTAAAAATTTCGGTTGGGGCGAC +CTCGGAGCACAACCCAACCTCCGAGCAATACATGCTAAGACCTCACCAGTCAAAGCGAATTACTACATCC +AATTGATCCAATGACTTGACCAACGGAACAAGTTACCCTAGGGATAACAGCGCAATCCTATTCCAGAGTC +CATATCAACAATAGGGTTTACGACCTCGATGTTGGATCAGGACATCCCGATGGTGCAGCCGCTATTAAAG +GTTCGTTTGTTCAACGATTAAAGTCCTACGTGATCTGAGTTCAGACCGGAGTAATCCAGGTCGGTTTCTA +TCTGTTCTAAATTTCTCCCTGTACGAAAGGACAAGAGAAATGAGGCCTACTTCACAAAGCGCCTTCCCCA +ATAAATGATATTATCTCAATTTAGCGCCATGCCAACACCCACTCAAGAACAGAGTTTGTTAAGATGGCAG +AGCCCGGTAATTGCATAAAACTTAAAACTTTACAATCAGAGGTTCAATTCCTCTTCTTGACAACACACCC +ATGACCAACCTCCTACTCCTCATTGTACCCATCCTAATCGCAATAGCATTCCTAATGCTAACCGAACGAA +AAATTCTAGGCTACATACAACTACGCAAAGGTCCCAACATTGTAGGTCCTTACGGGCTATTACAGCCCTT +CGCTGACGCCATAAAACTCTTCACTAAAGAACCCTTAAAACCCTCCACTTCAACCATTACCCTCTACATC +ACCGCCCCAACCCTAGCCCTCACCATTGCCCTCTTACTATGAACCCCCCTCCCCATACCCAACCCCCTAG +TCAATCTTAACTTAGGCCTCCTATTTATTCTAGCCACCTCCAGCCTAGCCGTTTACTCAATCCTCTGATC +AGGGTGAGCATCAAACTCGAACTACGCCTTAATCGGTGCACTACGAGCAGTAGCCCAAACAATCTCATAC +GAAGTCACTCTAGCCATTATCCTACTGTCAACGCTACTAATAAGTGGCTCCTTCAATCTCTCTACCCTTG +TCACAACACAAGAGCACCTCTGACTAATCCTGCCAACATGACCCCTGGCCATAATATGATTTATCTCTAC +ACTAGCAGAGACCAACCGAACTCCCTTCGACCTTACTGAAGGAGAATCTGAACTAGTCTCAGGCTTTAAT +ATCGAGTATGCCGCAGGCCCCTTTGCCCTATTTTTCATAGCCGAATACATAAACATTATTATAATAAACA +CCCTCACTGCTACAATCTTCCTAGGAGCAACATACAATACTCACTCCCCTGAACTCTACACGACATATTT +TGTCACCAAAGCTCTACTTCTAACCTCCCTGTTCCTATGAATTCGAACAGCATATCCCCGATTTCGCTAC 
+GACCAGCTCATACACCTCCTATGAAAAAACTTCCTACCACTCACCCTAGCATCACTCATGTGATATATCT +CCATACCCACTACAATCTCCAGCATCCCCCCTCAAACCTAAGAAATATGTCTGATAAAAGAATTACTTTG +ATAGAGTAAATAATAGGAGTTCAAATCCCCTTATTTCTAGGACTATAAGAATCGAACTCATCCCTGAGAA +TCCAAAATTCTCCGTGCCACCTATCACACCCCATCCTAAAGTAAGGTCAGCTAAATAAGCTATCGGGCCC +ATACCCCGAAAATGTTGGTTACACCCTTCCCGTACTAATTAATCCCCTAGCCCAACCCATCATCTACTCT +ACCATCCTTACAGGCACGCTCATTACAGCGCTAAGCTCACACTGATTTTTCACCTGAGTAGGCCTAGAAA +TAAATATACTAGCTTTTATCCCAATCCTAACCAAAAAAATAAGCCCCCGCTCCACAGAAGCCGCCATCAA +ATACTTTCTCACACAAGCAACTGCGTCCATAATTCTCCTGATAGCTATCCTCTCCAACAGCATACTCTCC +GGACAATGAACCATAACCAATACTACCAATCAATACTCATCATTAATAATTATAATAGCAATGGCAATAA +AACTAGGAATAGCCCCCTTTCACTTTTGAGTTCCAGAAGTTACCCAAGGCACCCCCCTAATATCCGGCCT +ACTCCTCCTCACATGACAAAAATTAGCCCCTATTTCAATTATATACCAAATCTCCTCATCACTGAACGTA +AACCTTCTCCTCACCCTTTCAATCTTGTCCATTATAGCAGGCAGCTGAGGCGGACTAAACCAAACCCAAC +TACGCAAAATCCTAGCATACTCCTCAATCACCCACATAGGCTGAATAATAGCAGTCCTACCATATAACCC +TAACATAACCATTCTTAATTTAACCATTTACATCATCCTAACTACTACCGCATTTCTGCTACTCAACTTA +AACTCCAGCACCACAACCCTACTACTATCTCGCACCTGAAACAAGCTAACATGATTAACTCCCCTAATTC +CATCCACCCTCCTCTCCCTAGGAGGCCTACCCCCACTAACTGGCTTCTTACCCAAATGAGTTATCATCGA +AGAATTCACAAAAAATAATAGCCTCATCATCCCCACCATCATAGCCATCATCACTCTCCTTAACCTCTAT +TTCTACCTACGCCTAATCTACTCCACCTCAATTACACTACTTCCCATATCTAATAACGTAAAAATAAAAT +GACAATTCGAACATACAAAACCCACCCCCTTCCTCCCTACACTCATCACCCTTACCACACTGCTTCTACC +CATCTCCCCCTTCATACTAATAATCTTATAGAAATTTAGGTTAAGCACAGACCAAGAGCCTTCAAAGCCC +TCAGCAAGTTACAATACTTAATTTCTGCAACAACTAAGGACTGCAAAACCCCACTCTGCATCAACTGAAC +GCAAATCAGCCACTTTAATTAAGCTAAGCCCTTACTAGATTAATGGGACTTAAACCCACAAACATTTAGT +TAACAGCTAAACACCCTAATCAACTGGCTTCAATCTACTTCTCCCGCCGCAAGAAAAAAAGGCGGGAGAA +GCCCCGGCAGGTTTGAAGCTGCTTCTTCGAATTTGCAATTCAATATGAAAATCACCTCAGAGCTGGTAAA +AAGAGGCTTAACCCCTGTCTTTAGATTTACAGTCCAATGCTTCACTCAGCCATTTTACCCCACCCTACTG +ATGTTCACCGACCGCTGACTATTCTCTACAAACCACAAAGATATTGGAACACTATACCTACTATTCGGTG +CATGAGCTGGAGTCCTGGGCACAGCCCTAAGTCTCCTTATTCGGGCTGAACTAGGCCAACCAGGCAACCT 
+CCTAGGTAATGACCACATCTACAATGTCATCGTCACAGCCCATGCATTCGTAATAATCTTCTTCATAGTA +ATGCCTATTATAATCGGAGGCTTTGGCAACTGGCTAGTTCCCTTGATAATTGGTGCCCCCGACATGGCAT +TCCCCCGCATAAACAACATAAGCTTCTGGCTCCTGCCCCCTTCTCTCCTACTTCTACTTGCATCTGCCAT +AGTAGAAGCCGGCGCGGGAACAGGTTGAACAGTCTACCCTCCCTTAGCGGGAAACTACTCGCATCCTGGA +GCCTCCGTAGACCTAACCATCTTCTCCTTACATCTGGCAGGCATCTCCTCTATCCTAGGAGCCATTAACT +TCATCACAACAATTATTAATATAAAACCTCCTGCCATGACCCAATACCAAACACCCCTCTTCGTCTGATC +CGTCCTAATCACAGCAGTCTTACTTCTCCTATCCCTCCCAGTCCTAGCTGCTGGCATCACCATACTATTG +ACAGATCGTAACCTCAACACTACCTTCTTCGACCCAGCCGGGGGAGGAGACCCTATTCTATATCAACACT +TATTCTGATTTTTTGGCCACCCCGAAGTTTATATTCTTATCCTACCAGGCTTCGGAATAATTTCCCACAT +TGTAACTTATTACTCCGGAAAAAAAGAACCATTTGGATATATAGGCATGGTTTGAGCTATAATATCAATT +GGCTTCCTAGGGTTTATCGTGTGAGCACACCATATATTTACAGTAGGGATAGACGTAGACACCCGAGCCT +ATTTCACCTCCGCTACCATAATCATTGCTATTCCTACCGGCGTCAAAGTATTCAGCTGACTCGCTACACT +TCACGGAAGCAATATGAAATGATCTGCCGCAGTACTCTGAGCCCTAGGGTTTATCTTTCTCTTCACCGTA +GGTGGCCTAACCGGCATTGTACTAGCAAACTCATCATTAGACATCGTGCTACACGACACATACTACGTCG +TAGCCCACTTCCACTACGTTCTATCAATAGGAGCTGTATTCGCCATCATAGGAGGCTTCATTCACTGATT +CCCCCTATTCTCAGGCTATACCCTAGACCAAACCTATGCCAAAATCCAATTTGCCATCATGTTCATTGGC +GTAAACCTAACCTTCTTCCCACAGCACTTCCTTGGCCTATCTGGGATGCCCCGACGTTACTCGGACTACC +CCGATGCATACACCACATGAAATGTCCTATCATCCGTAGGCTCATTTATCTCCCTGACAGCAGTAATATT +AATAATTTTCATGATTTGAGAAGCCTTTGCTTCAAAACGAAAAGTCCTAATAGTAGAAGAGCCCTCCGCA +AACCTGGAATGACTATATGGATGCCCCCCACCCTACCACACATTCGAAGAACCCGTATACATAAAATCTA +GACAAAAAAGGAAGGAATCGAACCCCCTAAAGCTGGTTTCAAGCCAACCCCATGACCTCCATGACTTTTT +CAAAAAGATATTAGAAAAACTATTTCATAACTTTGTCAAAGTTAAATTACAGGTTAACCCCCGTATATCT +TAATGGCACATGCAGCGCAAGTAGGTCTACAAGATGCTACTTCCCCTATCATAGAAGAACTTATTATCTT +TCACGACCATGCCCTCATAATTATCTTTCTCATCTGCTTTCTAGTCCTATACGCCCTTTTCCTAACACTC +ACAACAAAACTAACTAATACTAGTATTTCAGACGCCCAGGAAATAGAAACCGTCTGAACTATCCTGCCCG +CCATCATCCTAGTCCTTATTGCCCTACCATCCCTGCGTATCCTTTACATAACAGACGAGGTCAACGACCC +CTCCTTTACTATTAAATCAATCGGCCATCAATGATATTGAACCTACGAATACACCGACTACGGCGGGCTA 
+ATCTTCAACTCCTACATACTCCCCCCATTATTTCTAGAACCAGGTGATCTACGACTCCTTGACGTTGATA +ACCGAGTGGTCCTCCCAGTTGAAGCCCCCGTTCGTATAATAATTACATCACAAGATGTTCTACACTCATG +AGCTGTTCCCACATTAGGCCTAAAAACAGACGCAATTCCCGGACGCCTAAACCAAACCACTTTCACCGCC +ACACGACCAGGAGTATACTACGGCCAATGCTCAGAAATCTGTGGAGCAAACCACAGTTTTATACCCATCG +TCCTAGAATTAATCCCTCTAAAAATCTTTGAAATAGGACCCGTATTCACTCTATAGCACCTTCTCTACCC +CTCTCCAGAGCTCACTGTAAAGCTAACCTAGCATTAACCTTTTAAGTTAAAGATTAAGAGGACCGACACC +TCTTTACAGTGAAATGCCCCAACTAAATACCGCCGTATGACCCACCATAATTACCCCCATACTCCTGACA +CTATTTCTCGTCACCCAACTAAAAATATTAAATTCAAATTACCATCTACCCCCCTCACCAAAACCCATAA +AAATAAAAAACTACAATAAACCCTGAGAACCAAAATGAACGAAAATCTATTCGCTTCATTCGCTGCCCCC +ACAATCCTAGGCTTACCCGCCGCAGTACTAATCATTCTATTCCCCCCTCTACTGGTCCCCACTTCTAAAC +ATCTCATCAACAACCGACTAATTACCACCCAACAATGACTAATTCAACTGACCTCAAAACAAATAATAAC +TATACACAGCACTAAAGGACGAACCTGATCTCTCATACTAGTATCCTTAATCATTTTTATTACCACAACC +AATCTTCTTGGGCTTCTACCCCACTCATTCACACCAACCACCCAACTATCTATAAACCTAGCCATGGCTA +TCCCCCTATGAGCAGGCGCAGTAGTCATAGGCTTTCGCTTTAAGACTAAAAATGCCCTAGCCCACTTCTT +ACCGCAAGGCACACCTACACCCCTTATCCCCATACTAGTTATCATCGAAACTATTAGCCTACTCATTCAA +CCAATAGCCTTAGCCGTACGTCTAACCGCTAACATTACTGCAGGCCACCTACTCATGCACCTAATTGGAA +GCGCCACACTAGCATTATCAACTATCAATCTACCCTATGCACTCATTATCTTCACAATTCTAATCCTACT +GACTATTCTAGAGATCGCCGTCGCCTTAATCCAAGCCTACGTTTTTACACTTCTAGTGAGCCTCTACCTG +CACGACAACACATAATGACCCACCAATCACATGCCTACCACATAGTAAAACCCAGCCCATGACCCCTAAC +AGGGGCCCTCTCGGCCCTCCTAATAACCTCCGGCCTGGCCATATGATTCCACTTCTACTCCACAACACTA +CTCACACTAGGCTTACTAACTAACACATTGACCATATATCAATGATGACGCGATGTTATACGAGAAGGCA +CATACCAAGGCCACCACACACCACCCGTCCAAAAAGGTCTCCGATATGGGATAATTCTTTTTATTACCTC +AGAAGTTTTTTTCTTTGCAGGATTTTTTTGAGCTTTCTACCACTCCAGCCTAGCCCCTACCCCCCAGCTA +GGAGGACACTGGCCCCCAACAGGTATTACCCCACTAAATCCCCTAGAAGTCCCACTCCTAAACACATCTG +TATTACTCGCATCAGGAGTATCAATTACTTGAGCCCATCACAGCTTAATAGAAAATAACCGAAACCAAAT +AATTCAAGCACTGCTTATTACGATTCTACTAGGTCTTTATTTTACCCTCCTACAAGCCTCAGAATATTTC +GAATCCCCTTTTACCATTTCCGATGGCATCTACGGCTCAACATTCTTTGTAGCCACAGGCTTCCACGGAC 
+TCCACGTCATTATTGGATCAACTTTCCTCACTATCTGCCTCATCCGCCAACTAATATTTCACTTCACATC +CAAACATCACTTCGGCTTTCAAGCCGCCGCCTGATACTGACACTTCGTAGATGTAGTCTGACTATTTCTA +TATGTCTCTATTTACTGATGAGGATCTTACTCTTTTAGTATAAGTAGTACCGTTAACTTCCAATTAACTA +GTTTTGACAACATTCAAAAAAGAGTAATAAACTTCGTCCTAATTTTAATAACCAATACCCTTCTAGCCCT +ACTACTGATAATTATCACATTCTGACTACCACAACTCAACAGCTACATAGAAAAATCTACCCCTTACGAA +TGTGGCTTCGACCCTATATCCCCCGCCCGCGTCCCCTTCTCCATAAAATTTTTCCTAGTAGCCATCACCT +TCCTATTATTTGACCTAGAAATTGCCCTCCTATTGCCCTTACCTTGAGCCCTACAAACGGCCAACCTACC +ACTAATAGTCACATCATCCCTCTTATTAATTACTATCCTAGCCCTAAGCCTCGCCTACGAATGATTACAA +AAAGGGTTAGACTGAACCGAATTGGTATATAGTTTAAATAAAACGAATGATTTCGACTCATTAAATTATG +ATAATCATATTTACCAAATGCCCCTTATTTATATAAATATTATACTAGCATTTACCATCTCACTTCTAGG +AATACTAGTATATCGCTCACACCTAATATCTTCCCTACTATGCCTAGAAGGAATAATACTATCACTGTTC +ATCATAGCCACCCTCATAACCCTCAATACTCACTCCCTCTTAGCCAATATTGTACCCATCACCATACTAG +TCTTTGCTGCCTGCGAAGCAGCAGTAGGTCTAGCACTACTAGTTTCAATCTCTAACACATATGGCTTAGA +CTACGTACATAACCTAAACCTACTCCAATGCTAAAACTAATCATCCCGACAATTATATTACTACCACTAA +CATGATTCTCTAAAAAACGTATAATTTGAATCAACACAACCACTCACAGCCTAATTATCAGCACCATTCC +CTTACTATTTTTTAACCAAATTAACAACAACCTATTCAGCTGTTCCCTGCCCTTCTCCTCCGACCCCTTA +ACAACTCCCCTCCTAATATTAACTGCTTGACTTCTACCCCTCACAATCATAGCAAGCCAGCGCCACCTAT +CCAACGAACCACTATCACGAAAAAAACTCTACCTCTCCATGCTAATTTCCCTCCAAATCTCCTTAATTAT +AACATTCTCGGCCACAGAGCTAATTATATTTTATATCTTCTTCGAAACCACACTTATCCCCACCCTGGCT +ATCATCACCCGATGGGGTAACCAACCAGAACGCCTGAACGCAGGTACATACTTCCTATTCTATACCCTAG +TAGGCTCCCTCCCCCTACTCATCGCACTAATCTATACCCACAACACCCTAGGCTCACTAAATATCCTATT +ACTCACTCTTACAACCCAAGAACTATCAAACACCTGAGCCAACAACTTAATATGACTAGCGTACACGATG +GCTTTCATGGTAAAAATACCCCTTTACGGACTCCACCTATGACTCCCTAAAGCCCATGTCGAAGCCCCTA +TTGCCGGGTCAATGGTACTTGCTGCAGTACTCTTAAAATTAGGTGGCTATGGCATAATACGCCTCACACT +CATCCTCAACCCCCTAACAAAACATATAGCCTATCCCTTCCTCATGTTGTCCTTATGAGGTATAATCATA +ACAAGCTCCATCTGCCTGCGACAAACAGACCTAAAATCGCTCATTGCATACCCTTCAGTCAGCCACATAG +CCCTCGTAGTAACAGCCATTCTCATCCAAACCCCCTGAAGCTTCACCGGCGCAATTATCCTCATAATCGC 
+CCACGGACTTACATCCTCATTATTATCCTGCCTAGCAAACTCAAATTATGAACGCACCCACAGTCGCATC +ATAATTCTCTCCCAAGGACTTCAAACTCTACTCCCACTAATAGCCTTTTGATGACTCCTGGCAAGCCTCG +CTAACCTCGCCCTACCCCCTACCATTAATCTCCTAGGGGAACTCTCCGTGCTAGTAACCTCATTCTCCTG +ATCAAATACCACTCTCCTACTCACAGGATTCAACATACTAATCACAGCCCTGTACTCCCTCTACATGTTT +ACCACAACACAATGAGGCTCACTCACCCACCACATTAATAGCATAAAGCCCTCATTCACACGAGAAAACA +CTCTCATATTTTTACACCTATCCCCCATCCTCCTTCTATCCCTCAATCCTGATATCATCACTGGATTCAC +CTCCTGTAAATATAGTTTAACCAAAACATCAGATTGTGAATCTGACAACAGAGGCTCACGACCCCTTATT +TACCGAGAAAGCTTATAAGAACTGCTAACTCGTATTCCCATGCCTAACAACATGGCTTTCTCAACTTTTA +AAGGATAACAGTTATCCATTGGTCTTAGGCCCCAAAAATTTTGGTGCAACTCCAAATAAAAGTAATAACC +ATGTATGCTACCATAACCACCTTAGCCCTAACTTCCTTAATTCCCCCCATCCTCGGCGCCCTCATTAACC +CTAACAAAAAAAACTCATACCCCCATTACGTGAAATCCATTATCGCATCCACCTTTATCATTAGCCTTTT +CCCCACAACAATATTCATATGCCTAGACCAAGAAACTATTATCTCGAACTGACACTGAGCAACAACCCAA +ACAACCCAACTCTCCCTGAGCTTTAAACTAGACTATTTCTCCATAACATTTATCCCCGTAGCACTGTTCG +TTACATGATCCATCATAGAATTCTCACTATGATATATAGACTCAGACCCCAACATCAACCAATTCTTCAA +ATACTTACTTATCTTCCTAATTACTATACTAATCCTAGTCACCGCTAACAACCTATTCCAACTCTTCATC +GGCTGAGAAGGCGTAGGAATTATATCCTTTCTACTCATTAGCTGATGGTACGCCCGAACAGATGCCAACA +CAGCAGCCATCCAAGCAATCCTATATAACCGTATCGGTGATATTGGTTTTGTCCTAGCCCTAGCATGATT +TCTCCTACACTCCAACTCATGAGATCCACAACAAATAATCCTCCTAAGTACTAATACAGACCTTACTCCA +CTACTAGGCTTCCTCCTAGCAGCAGCAGGCAAATCAGCTCAACTAGGCCTTCACCCCTGACTCCCCTCAG +CCATAGAAGGCCCTACCCCTGTTTCAGCCCTACTCCACTCAAGCACCATAGTCGTAGCAGGAATCTTCCT +ACTCATCCGCTTCTACCCCCTAGCAGAGAATAACCCACTAATCCAAACTCTCACGCTATGCCTAGGCGCT +ATCACCACCCTATTCGCAGCAGTCTGCGCCCTCACACAAAATGACATCAAAAAAATCGTGGCCTTCTCCA +CTTCAAGCCAACTAGGACTCATAATAGTTACAATCGGTATCAACCAACCACACCTAGCATTCCTTCACAT +CTGCACCCACGCTTTCTTCAAAGCCATACTATTCATATGCTCCGGATCCATTATTCACAACCTCAATAAT +GAGCAAGACATTCGAAAAATAGGAGGATTACTCAAAACCATACCCCTCACTTCAACCTCCCTCACCATTG +GGAGCCTAGCATTAGCAGGAATACCCTTCCTCACAGGTTTCTACTCCAAAGACCTCATCATCGAAACCGC +TAACATATCATACACAAACGCCTGAGCCCTATCTATTACTCTCATCGCCACCTCTCTGACAAGCGCCTAC 
+AGCACCCGAATAATCCTCCTCACCCTAACAGGTCAACCTCGCTTCCCAACCCTCACCAACATTAACGAAA +ACAACCCCACTCTGTTAAATCCCATTAAACGCCTAACCATTGGAAGCTTATTTGCAGGATTTCTCATTAC +CAACAACATTCTCCCCATATCTACTCCCCAAGTGACAATTCCCCTTTACTTAAAACTTACAGCCCTAGGC +GTTACTTCCCTAGGACTTCTAACAGCCCTAGACCTCAATTACCTAACCAGCAAGCTCAAAATAAAATCCC +CACTATATACATTTCACTTCTCTAATATACTCGGATTCTACCCTAACATTATACACCGCTCGATCCCCTA +TCTAGGCCTTCTTACAAGCCAAAACCTACCCCTACTTCTTCTAGACCTGACCTGACTAGAGAAACTATTA +CCTAAAACAATTTCACAGTACCAAATCTCCGCTTCCATTACCACCTCAACCCAAAAAGGCATGATCAAAC +TTTATTTCCTCTCTTTTTTCTTCCCTCTCATCTTAACCTTACTCCTAATCACATAACCTATTCCCCCGAG +CAATCTCAATCACAATGTATACACCAACAAACAATGTCCAACCAGTAACTACTACTAACCAACGCCCATA +ATCATATAAGGCCCCCGCACCAATAGGATCCTCCCGAATCAGCCCTGGCCCCTCCCCTTCATAAATTATT +CAACTTCCCACGCTATTAAAATTTACCACAACCACCATCCCATCATACCCTTTTACCCATAACACTAATC +CTACCTCCATCGCCAGTCCTACTAAAACACTAACCAAAACCTCAACCCCTGACCCCCATGCCTCAGGATA +CTCCTCAATAGCCATAGCCGTAGTATACCCAAAAACAACCATTATTCCCCCCAAATAAATTAAAAAAACC +ATTAAACCTATATAACCTCCCCCATAATTCAAAATGATGGCACACCCAACTACACCACTAACAATCAATA +CTAAACCCCCATAAATGGGAGAAGGCTTAGAAGAAAACCCCACAAACCCTATCACTAAACTCACACTCAA +TAAAAATAAAGCATATGTCATTATTCTCGCACGGACTACAACCACGACCAATGATATGAAAAACCATCGT +TGTATTTCAACTACAAGAACACCAATGACCCCGACACGCAAAATTAACCCACTAATAAAATTAATTAATC +ACTCATTTATCGACCTCCCCACCCCATCCAACATTTCCGCATGATGGAACTTCGGCTCACTTCTCGGCGC +CTGCCTAATCCTTCAAATTACCACAGGATTATTCCTAGCTATACACTACTCACCAGACGCCTCAACCGCC +TTCTCGTCGATCGCCCACATCACCCGAGACGTAAACTATGGTTGGATCATCCGCTACCTCCACGCTAACG +GCGCCTCAATATTTTTTATCTGCCTCTTCCTACACATCGGCCGAGGTCTATATTACGGCTCATTTCTCTA +CCTAGAAACCTGAAACATTGGCATTATCCTCTTGCTCACAACCATAGCAACAGCCTTTATGGGCTATGTC +CTCCCATGAGGCCAAATATCCTTCTGAGGAGCCACAGTAATTACAAACCTACTGTCCGCTATCCCATACA +TCGGAACAGACCTGGTCCAGTGAGTCTGAGGAGGCTACTCAGTAGACAGCCCTACCCTTACACGATTCTT +CACCTTCCACTTTATCTTACCCTTCATCATCACAGCCCTAACAACACTTCATCTCCTATTCTTACACGAA +ACAGGATCAAATAACCCCCTAGGAATCACCTCCCACTCCGACAAAATTACCTTCCACCCCTACTACACAA +TCAAAGATATCCTTGGCTTATTCCTTTTCCTCCTTATCCTAATGACATTAACACTATTCTCACCAGGCCT 
+CCTAGGCGATCCAGACAACTATACCCTAGCTAACCCCCTAAACACCCCACCCCACATTAAACCCGAGTGA +TACTTTCTATTTGCCTACACAATCCTCCGATCCATCCCCAACAAACTAGGAGGCGTCCTCGCCCTACTAC +TATCTATCCTAATCCTAACAGCAATCCCTGTCCTCCACACATCCAAACAACAAAGCATAATATTTCGCCC +ACTAAGCCAACTGCTTTACTGACTCCTAGCCACAGACCTCCTCATCCTAACCTGAATCGGAGGACAACCA +GTAAGCTACCCCTTCATCACCATCGGACAAATAGCATCCGTATTATACTTCACAACAATCCTAATCCTAA +TACCAATCGCCTCTCTAATCGAAAACAAAATACTTGAATGAACCTGCCCTTGTAGTATAAACTAATACAC +CGGTCTTGTAAACCGGAAACGAAAACTTTCTTCCAAGGACAAATCAGAGAAAAAGTAATTAACTTCACCA +TCAGCACCCAAAGCTAAGATTCTAATTTAAACTATTCTCTGTTCTTTCATGGGGAAGCAAATTTAGGTAC +CACCTAAGTACTGGCTCATTCATTACAACCGCTATGTATTTCGTACATTACTGCCAGCCACCATGAATAT +CGTACAGTACCATATCACCCAACTACCTATAGTACATAAAATCCACTCCCACATCAAAACCTTCACTCCA +TGCTTACAAGCACGCACAACAATCAACTCCCAACTGTCGAACATAAAACACAATTCCAACGACACCCCTC +CCCCACCCCGATACCAACAGACCTATCTCCCCTTGACAGAACATAGTACATACAACCATACACCGTACAT +AGCACATTACAGTCAAACCCCTCCTCGCCCCCACGGATGCTCCCCCTCAGATAGGAATCCCTTGGTCACC +ATCCTCCGTGAAATCAATATCCCGCACAAGAGTGACTCTCCTCGCTCCGGGCCCATAACATCTGGGGGTA +GCTAAAGTGAACTGTATCCGACATCTGGTTCCTACCTCAGGGCCATGAAGTTCAAAAGACTCCCACACGT +TCCCCTTAAATAAGACATCACGATGGATCACAGGTCTATCACCCTATTAACCAGTCACGGGAGCCTTCCA +TGCATTTGGTATTTTCGTCTGGGGGGTGTGCACGCGATAGCATTGCGAAACGCTGGCCCCGGAGCACCCT +ATGTCGCAGTATCTGTCTTTGATTCCTGCCCCATTGTATTATTTATCGCACCTACGTTCAATATTACGAC +CTAGCATACCTACTAAAGTGTGTTGATTAATTAATGCTTGCAGGACATAACAACAGCAGCAAAATGCTCA +CATAACTGCTTTCCACACCAACATCATAACAAAAAATTCCCACAAACCCCCCCTTCCCCCCGGCCACAGC +ACTCAAACAAATCTCTGCCAAACCCCAAAAACAAAGAACCCAGACGCCAGCCTAGCCAGACTTCAAATTT +CATCTTTAGGCGGTATGCACTTTTAACAGTCACCCCTCAATTAACATGCCCTCCCCCCTCAACTCCCATT +CTACTAGCCCCAGCAACGTAACCCCCTACTCACCCTACTCAACACATATACCGCTGCTAACCCCATACCC +TGAACCAACCAAACCCCAAAGACACCCCTACACA diff --git a/src/cline_tools/help_pages/orffinder-to-gtf.txt b/src/cline_tools/help_pages/orffinder-to-gtf.txt new file mode 100644 index 0000000..597303b --- /dev/null +++ b/src/cline_tools/help_pages/orffinder-to-gtf.txt @@ -0,0 +1,35 @@ +USAGE + orffinder-to-gtf [-in input] [-infmt format] [-out output] 
[-outfmt format] [-orf_size int] + [-remove_nested boolean] [-trim_trailing boolean] [-max_orfs_per_sequence int] + [-attr_name string] + +DESCRIPTION + ORFFinder Python v1.5 + +PARAMETERS +[-h] +Shows this interface. + +[-in (string)]: +Input nucleotide sequence to extract ORFs from. + +[-infmt (string)]: +Can be "fasta", "genbank", or any other Biopython supported format. Default: "fasta" + +[-out (string)] +Optional output file. If not specified, will output to stdout. + +[-orf_size (integer)] +Minimum size (in nucleotides) of ORF. Default: 75 + +[-remove_nested (boolean)] +Remove ORFs that are completely nested in another ORF. Default: False + +[-trim_trailing (boolean)] +Remove ORFs that have a start codon but no stop codon at the edges of the sequence. Default: False + +[-max_orfs_per_sequence (integer)] +Maximum number of ORFs to return per sequence, sorted by length. Default: -1 (no limit) + +[-attr_name (string)] +Attribute ID name in GTF file. Suffixed by ORF index number. Default: "ORF_" diff --git a/src/cline_tools/help_pages/orffinder-to-sequence.txt b/src/cline_tools/help_pages/orffinder-to-sequence.txt new file mode 100644 index 0000000..310af0f --- /dev/null +++ b/src/cline_tools/help_pages/orffinder-to-sequence.txt @@ -0,0 +1,41 @@ +USAGE + orffinder-to-sequence [-in input] [-infmt format] [-out output] [-outfmt format] [-orf_size int] + [-remove_nested boolean] [-trim_trailing boolean] [-max_orfs_per_sequence int] + [-attr_name string] [-outtype protein/nucleotide] + +DESCRIPTION + ORFFinder Python v1.5 + +PARAMETERS +[-h] +Shows this interface. + +[-in (string)]: +Input nucleotide sequence to extract ORFs from. + +[-infmt (string)]: +Can be "fasta", "genbank", or any other Biopython supported format. Default: "fasta" + +[-out (string)] +Optional output file. If not specified, will output to stdout. + +[-outfmt (string)]: +Can be "fasta" or "fasta-2line". Default: "fasta" + +[-orf_size (integer)] +Minimum size (in nucleotides) of ORF. 
Default: 75
+
+[-remove_nested (boolean)]
+Remove ORFs that are completely nested in another ORF. Default: False
+
+[-trim_trailing (boolean)]
+Remove ORFs that have a start codon but no stop codon at the edges of the sequence. Default: False
+
+[-max_orfs_per_sequence (integer)]
+Maximum number of ORFs to return per sequence, sorted by length. Default: -1 (no limit)
+
+[-attr_name (string)]
+Prefix of the record ID in the output sequence file. Suffixed by ORF index number. Default: "ORF_"
+
+[-outtype (string)]
+Can be "protein" or "nucleotide". Default: "nucleotide"
diff --git a/src/cline_tools/orffinder-to-gtf.py b/src/cline_tools/orffinder-to-gtf.py
index bb8cd80..3d723f1 100644
--- a/src/cline_tools/orffinder-to-gtf.py
+++ b/src/cline_tools/orffinder-to-gtf.py
@@ -1,8 +1,9 @@
 import sys
+import os
 from Bio import SeqIO
 from orffinder import orffinder
 
-arguments = sys.argv
+arguments = sys.argv + [""]
 classed_arguments = {"orf_size": "75", "max_orfs_per_sequence": "-1", "remove_nested": "False", "trim_trailing": "False", "infmt": "fasta", "attr_name": "ORF_"}
 
 try:
@@ -14,6 +15,11 @@
 
             classed_arguments[argument[1:]] = arguments[i + 1]
 
+    if "h" in classed_arguments.keys():
+        help_output = open("help_pages/orffinder-to-gtf.txt", "r").read()
+        print(help_output)
+        os._exit(1)
+
     sequences = SeqIO.parse(classed_arguments["in"], classed_arguments["infmt"])
 
     orf_size = int(classed_arguments["orf_size"])
diff --git a/src/cline_tools/orffinder-to-sequence.py b/src/cline_tools/orffinder-to-sequence.py
new file mode 100644
index 0000000..aa74a45
--- /dev/null
+++ b/src/cline_tools/orffinder-to-sequence.py
@@ -0,0 +1,82 @@
+import sys
+import os
+from Bio import SeqIO
+from Bio.SeqRecord import SeqRecord
+from orffinder import orffinder
+
+# Help pages are shipped next to this script. Resolve the path from the script
+# location so "-h" works regardless of the current working directory.
+HELP_PAGE = os.path.join(os.path.dirname(os.path.abspath(__file__)), "help_pages", "orffinder-to-sequence.txt")
+
+# Short usage summary shown whenever the run fails.
+USAGE = "USAGE\n orffinder-to-sequence [-in input] [-infmt format] [-out output] [-outfmt format] [-orf_size int]\n [-remove_nested boolean] [-trim_trailing boolean] [-max_orfs_per_sequence int]\n [-attr_name string] [-outtype protein/nucleotide]\n\nDESCRIPTION\n ORFFinder Python v1.5\n\nUse '-help' to print detailed descriptions of command line arguments\n========================================================================"
+
+# The trailing "" gives a flag in last position (e.g. "-h") a value to read,
+# so arguments[i + 1] below never raises IndexError.
+arguments = sys.argv + [""]
+classed_arguments = {"orf_size": "75", "outtype": "nucleotide", "max_orfs_per_sequence": "-1", "remove_nested": "False", "trim_trailing": "False", "infmt": "fasta", "attr_name": "ORF_", "outfmt": "fasta"}
+
+try:
+
+    # Every token starting with "-" is a flag name; the token after it is its value.
+    for i in range(len(arguments)):
+
+        argument = arguments[i]
+
+        if argument.startswith("-"):
+
+            classed_arguments[argument[1:]] = arguments[i + 1]
+
+    # "-h" is what the help page documents, "-help" is what the usage summary
+    # advertises; accept both.
+    if "h" in classed_arguments or "help" in classed_arguments:
+        with open(HELP_PAGE, "r") as help_file:
+            print(help_file.read())
+        # sys.exit flushes stdout (os._exit would not) and is not caught by
+        # the "except Exception" handler below.
+        sys.exit(0)
+
+    if "in" not in classed_arguments:
+        raise ValueError("no input file given (use -in)")
+
+    sequences = SeqIO.parse(classed_arguments["in"], classed_arguments["infmt"])
+
+    orf_size = int(classed_arguments["orf_size"])
+    remove_nested = classed_arguments["remove_nested"] == "True"
+    trim_trailing = classed_arguments["trim_trailing"] == "True"
+    attr_name = classed_arguments["attr_name"]
+    max_orfs_per_sequence = int(classed_arguments["max_orfs_per_sequence"])
+
+    output = list()
+
+    for sequence in sequences:
+
+        if classed_arguments["outtype"] == "nucleotide":
+            output_seqs = orffinder.getORFNucleotides(sequence, minimum_length=orf_size, trim_trailing=trim_trailing, remove_nested=remove_nested)
+
+        else:
+            output_seqs = orffinder.getORFProteins(sequence, minimum_length=orf_size, trim_trailing=trim_trailing, remove_nested=remove_nested)
+
+        # Apply -max_orfs_per_sequence: keep only the longest ORFs of this
+        # sequence. A negative value (default -1) means no limit.
+        if max_orfs_per_sequence >= 0:
+            output_seqs = sorted(output_seqs, key=len, reverse=True)[:max_orfs_per_sequence]
+
+        output += output_seqs
+
+    # Wrap each ORF in a record whose ID is attr_name followed by its 1-based index.
+    for i in range(len(output)):
+        output[i] = SeqRecord(seq=output[i], id=attr_name + str(i + 1), description="")
+
+    if "out" not in classed_arguments:
+        SeqIO.write(output, sys.stdout, classed_arguments["outfmt"])
+
+    else:
+        SeqIO.write(output, classed_arguments["out"], classed_arguments["outfmt"])
+
+except Exception as error:
+    # Say what went wrong before showing the usage summary, and exit non-zero
+    # so that calling scripts can detect the failure.
+    print("ERROR: " + str(error), file=sys.stderr)
+    print(USAGE)
+    sys.exit(1)
diff --git 
a/src/cline_tools/test.fasta b/src/cline_tools/test.fasta new file mode 100644 index 0000000..d9925bf --- /dev/null +++ b/src/cline_tools/test.fasta @@ -0,0 +1,426 @@ +>ORF_1 +ATGATCTGCCGCAGTACTCTGAGCCCTAGGGTTTATCTTTCTCTTCACCGTAGGTGGCCT +AACCGGCATTGTACTAGCAAACTCATCATTAGACATCGTGCTACACGACACATACTACGT +CGTAGCCCACTTCCACTACGTTCTATCAATAGGAGCTGTATTCGCCATCATAGGAGGCTT +CATTCACTGATTCCCCCTATTCTCAGGCTATACCCTAGACCAAACCTATGCCAAAATCCA +ATTTGCCATCATGTTCATTGGCGTAAACCTAACCTTCTTCCCACAGCACTTCCTTGGCCT +ATCTGGGATGCCCCGACGTTACTCGGACTACCCCGATGCATACACCACATGAAATGTCCT +ATCATCCGTAGGCTCATTTATCTCCCTGACAGCAGTAATATTAATAATTTTCATGATTTG +AGAAGCCTTTGCTTCAAAACGAAAAGTCCTAATAGTAGAAGAGCCCTCCGCAAACCTGGA +ATGACTATATGGATGCCCCCCACCCTACCACACATTCGAAGAACCCGTATACATAAAATC +TAG +>ORF_2 +ATGACATATGCTTTATTTTTATTGAGTGTGAGTTTAGTGATAGGGTTTGTGGGGTTTTCT +TCTAAGCCTTCTCCCATTTATGGGGGTTTAGTATTGATTGTTAGTGGTGTAGTTGGGTGT +GCCATCATTTTGAATTATGGGGGAGGTTATATAGGTTTAATGGTTTTTTTAATTTATTTG +GGGGGAATAATGGTTGTTTTTGGGTATACTACGGCTATGGCTATTGAGGAGTATCCTGAG +GCATGGGGGTCAGGGGTTGAGGTTTTGGTTAGTGTTTTAGTAGGACTGGCGATGGAGGTA +GGATTAGTGTTATGGGTAAAAGGGTATGATGGGATGGTGGTTGTGGTAAATTTTAATAGC +GTGGGAAGTTGA +>ORF_3 +ATGAATATCGTACAGTACCATATCACCCAACTACCTATAGTACATAAAATCCACTCCCAC +ATCAAAACCTTCACTCCATGCTTACAAGCACGCACAACAATCAACTCCCAACTGTCGAAC +ATAAAACACAATTCCAACGACACCCCTCCCCCACCCCGATACCAACAGACCTATCTCCCC +TTGACAGAACATAGTACATACAACCATACACCGTACATAGCACATTACAGTCAAACCCCT +CCTCGCCCCCACGGATGCTCCCCCTCAGATAGGAATCCCTTGGTCACCATCCTCCGTGAA +ATCAATATCCCGCACAAGAGTGACTCTCCTCGCTCCGGGCCCATAACATCTGGGGGTAGC +TAA +>ORF_4 +ATGAACCATAACCAATACTACCAATCAATACTCATCATTAATAATTATAATAGCAATGGC +AATAAAACTAGGAATAGCCCCCTTTCACTTTTGAGTTCCAGAAGTTACCCAAGGCACCCC +CCTAATATCCGGCCTACTCCTCCTCACATGACAAAAATTAGCCCCTATTTCAATTATATA +CCAAATCTCCTCATCACTGAACGTAAACCTTCTCCTCACCCTTTCAATCTTGTCCATTAT +AGCAGGCAGCTGAGGCGGACTAAACCAAACCCAACTACGCAAAATCCTAGCATACTCCTC +AATCACCCACATAGGCTGAATAATAGCAGTCCTACCATATAA +>ORF_5 +ATGTTTATGTATTCGGCTATGAAAAATAGGGCAAAGGGGCCTGCGGCATACTCGATATTA 
+AAGCCTGAGACTAGTTCAGATTCTCCTTCAGTAAGGTCGAAGGGAGTTCGGTTGGTCTCT +GCTAGTGTAGAGATAAATCATATTATGGCCAGGGGTCATGTTGGCAGGATTAGTCAGAGG +TGCTCTTGTGTTGTGACAAGGGTAGAGAGATTGAAGGAGCCACTTATTAGTAGCGTTGAC +AGTAGGATAATGGCTAGAGTGACTTCGTATGAGATTGTTTGGGCTACTGCTCGTAGTGCA +CCGATTAAGGCGTAG +>ORF_6 +ATGAGTAGGCTAATAGTTTCGATGATAACTAGTATGGGGATAAGGGGTGTAGGTGTGCCT +TGCGGTAAGAAGTGGGCTAGGGCATTTTTAGTCTTAAAGCGAAAGCCTATGACTACTGCG +CCTGCTCATAGGGGGATAGCCATGGCTAGGTTTATAGATAGTTGGGTGGTTGGTGTGAAT +GAGTGGGGTAGAAGCCCAAGAAGATTGGTTGTGGTAATAAAAATGATTAAGGATACTAGT +ATGAGAGATCAGGTTCGTCCTTTAGTGCTGTGTATAGTTATTATTTGTTTTGAGGTCAGT +TGA +>ORF_7 +ATGATGACGCGATGTTATACGAGAAGGCACATACCAAGGCCACCACACACCACCCGTCCA +AAAAGGTCTCCGATATGGGATAATTCTTTTTATTACCTCAGAAGTTTTTTTCTTTGCAGG +ATTTTTTTGAGCTTTCTACCACTCCAGCCTAGCCCCTACCCCCCAGCTAGGAGGACACTG +GCCCCCAACAGGTATTACCCCACTAAATCCCCTAGAAGTCCCACTCCTAAACACATCTGT +ATTACTCGCATCAGGAGTATCAATTACTTGAGCCCATCACAGCTTAATAGAAAATAA +>ORF_8 +ATGCCCCTTATTTATATAAATATTATACTAGCATTTACCATCTCACTTCTAGGAATACTA +GTATATCGCTCACACCTAATATCTTCCCTACTATGCCTAGAAGGAATAATACTATCACTG +TTCATCATAGCCACCCTCATAACCCTCAATACTCACTCCCTCTTAGCCAATATTGTACCC +ATCACCATACTAGTCTTTGCTGCCTGCGAAGCAGCAGTAGGTCTAGCACTACTAGTTTCA +ATCTCTAACACATATGGCTTAGACTACGTACATAACCTAAACCTACTCCAATGCTAA +>ORF_9 +ATGGTTAAATTAAGAATGGTTATGTTAGGGTTATATGGTAGGACTGCTATTATTCAGCCT +ATGTGGGTGATTGAGGAGTATGCTAGGATTTTGCGTAGTTGGGTTTGGTTTAGTCCGCCT +CAGCTGCCTGCTATAATGGACAAGATTGAAAGGGTGAGGAGAAGGTTTACGTTCAGTGAT +GAGGAGATTTGGTATATAATTGAAATAGGGGCTAATTTTTGTCATGTGAGGAGGAGTAGG +CCGGATATTAGGGGGGTGCCTTGGGTAACTTCTGGAACTCAAAAGTGA +>ORF_10 +ATGCTAATTTCCCTCCAAATCTCCTTAATTATAACATTCTCGGCCACAGAGCTAATTATA +TTTTATATCTTCTTCGAAACCACACTTATCCCCACCCTGGCTATCATCACCCGATGGGGT +AACCAACCAGAACGCCTGAACGCAGGTACATACTTCCTATTCTATACCCTAGTAGGCTCC +CTCCCCCTACTCATCGCACTAATCTATACCCACAACACCCTAGGCTCACTAAATATCCTA +TTACTCACTCTTACAACCCAAGAACTATCAAACACCTGA +>ORF_11 +ATGGCTGCTGTGTTGGCATCTGTTCGGGCGTACCATCAGCTAATGAGTAGAAAGGATATA +ATTCCTACGCCTTCTCAGCCGATGAAGAGTTGGAATAGGTTGTTAGCGGTGACTAGGATT 
+AGTATAGTAATTAGGAAGATAAGTAAGTATTTGAAGAATTGGTTGATGTTGGGGTCTGAG +TCTATATATCATAGTGAGAATTCTATGATGGATCATGTAACGAACAGTGCTACGGGGATA +AATGTTATGGAGAAATAG +>ORF_12 +ATGACCAACCTCCTACTCCTCATTGTACCCATCCTAATCGCAATAGCATTCCTAATGCTA +ACCGAACGAAAAATTCTAGGCTACATACAACTACGCAAAGGTCCCAACATTGTAGGTCCT +TACGGGCTATTACAGCCCTTCGCTGACGCCATAAAACTCTTCACTAAAGAACCCTTAAAA +CCCTCCACTTCAACCATTACCCTCTACATCACCGCCCCAACCCTAGCCCTCACCATTGCC +CTCTTACTATGA +>ORF_13 +ATGGGAGAAGGCTTAGAAGAAAACCCCACAAACCCTATCACTAAACTCACACTCAATAAA +AATAAAGCATATGTCATTATTCTCGCACGGACTACAACCACGACCAATGATATGAAAAAC +CATCGTTGTATTTCAACTACAAGAACACCAATGACCCCGACACGCAAAATTAACCCACTA +ATAAAATTAATTAATCACTCATTTATCGACCTCCCCACCCCATCCAACATTTCCGCATGA +>ORF_14 +ATGATGGCTATGATGGTGGGGATGATGAGGCTATTATTTTTTGTGAATTCTTCGATGATA +ACTCATTTGGGTAAGAAGCCAGTTAGTGGGGGTAGGCCTCCTAGGGAGAGGAGGGTGGAT +GGAATTAGGGGAGTTAATCATGTTAGCTTGTTTCAGGTGCGAGATAGTAGTAGGGTTGTG +GTGCTGGAGTTTAAGTTGAGTAGCAGAAATGCGGTAGTAGTTAGGATGATGTAA +>ORF_15 +ATGGTTCATTGTCCGGAGAGTATGCTGTTGGAGAGGATAGCTATCAGGAGAATTATGGAC +GCAGTTGCTTGTGTGAGAAAGTATTTGATGGCGGCTTCTGTGGAGCGGGGGCTTATTTTT +TTGGTTAGGATTGGGATAAAAGCTAGTATATTTATTTCTAGGCCTACTCAGGTGAAAAAT +CAGTGTGAGCTTAGCGCTGTAATGAGCGTGCCTGTAAGGATGGTAGAGTAG +>ORF_16 +ATGGTGATGCCAGCAGCTAGGACTGGGAGGGATAGGAGAAGTAAGACTGCTGTGATTAGG +ACGGATCAGACGAAGAGGGGTGTTTGGTATTGGGTCATGGCAGGAGGTTTTATATTAATA +ATTGTTGTGATGAAGTTAATGGCTCCTAGGATAGAGGAGATGCCTGCCAGATGTAAGGAG +AAGATGGTTAGGTCTACGGAGGCTCCAGGATGCGAGTAG +>ORF_17 +ATGAGGCCAAATATCCTTCTGAGGAGCCACAGTAATTACAAACCTACTGTCCGCTATCCC +ATACATCGGAACAGACCTGGTCCAGTGAGTCTGAGGAGGCTACTCAGTAGACAGCCCTAC +CCTTACACGATTCTTCACCTTCCACTTTATCTTACCCTTCATCATCACAGCCCTAACAAC +ACTTCATCTCCTATTCTTACACGAAACAGGATCAAATAA +>ORF_18 +ATGAGATGTTTAGAAGTGGGGACCAGTAGAGGGGGGAATAGAATGATTAGTACTGCGGCG +GGTAAGCCTAGGATTGTGGGGGCAGCGAATGAAGCGAATAGATTTTCGTTCATTTTGGTT +CTCAGGGTTTATTGTAGTTTTTTATTTTTATGGGTTTTGGTGAGGGGGGTAGATGGTAAT +TTGAATTTAATATTTTTAGTTGGGTGA +>ORF_19 +ATGAGGTATAATCATAACAAGCTCCATCTGCCTGCGACAAACAGACCTAAAATCGCTCAT +TGCATACCCTTCAGTCAGCCACATAGCCCTCGTAGTAACAGCCATTCTCATCCAAACCCC 
+CTGAAGCTTCACCGGCGCAATTATCCTCATAATCGCCCACGGACTTACATCCTCATTATT +ATCCTGCCTAGCAAACTCAAATTATGA +>ORF_20 +ATGGCACATGCAGCGCAAGTAGGTCTACAAGATGCTACTTCCCCTATCATAGAAGAACTT +ATTATCTTTCACGACCATGCCCTCATAATTATCTTTCTCATCTGCTTTCTAGTCCTATAC +GCCCTTTTCCTAACACTCACAACAAAACTAACTAATACTAGTATTTCAGACGCCCAGGAA +ATAGAAACCGTCTGA +>ORF_21 +ATGGCAGATGCAAGTAGAAGTAGGAGAGAAGGGGGCAGGAGCCAGAAGCTTATGTTGTTT +ATGCGGGGGAATGCCATGTCGGGGGCACCAATTATCAAGGGAACTAGCCAGTTGCCAAAG +CCTCCGATTATAATAGGCATTACTATGAAGAAGATTATTACGAATGCATGGGCTGTGACG +ATGACATTGTAG +>ORF_22 +ATGTATGCTACCATAACCACCTTAGCCCTAACTTCCTTAATTCCCCCCATCCTCGGCGCC +CTCATTAACCCTAACAAAAAAAACTCATACCCCCATTACGTGAAATCCATTATCGCATCC +ACCTTTATCATTAGCCTTTTCCCCACAACAATATTCATATGCCTAGACCAAGAAACTATT +ATCTCGAACTGA +>ORF_23 +ATGGATCACAGGTCTATCACCCTATTAACCAGTCACGGGAGCCTTCCATGCATTTGGTAT +TTTCGTCTGGGGGGTGTGCACGCGATAGCATTGCGAAACGCTGGCCCCGGAGCACCCTAT +GTCGCAGTATCTGTCTTTGATTCCTGCCCCATTGTATTATTTATCGCACCTACGTTCAAT +ATTACGACCTAG +>ORF_24 +ATGTTTGGGATCTTTAAGGTTGTGGGTGTTGAGCTTGAACGCTTTCTTAATTGGTGGCTG +CTTTTAGGCCTACTATGGGTGTTAAATTTTTTACTCTCTTTACAAGGTTTTTTCCTAGTG +TCTAAAGAGCTGTTCCTCTTTGGACTAACAGTTAAGTTTACAAGGGGATTTAGAGGGTTC +TGTAGGTAA +>ORF_25 +ATGAATTCGAACAGCATATCCCCGATTTCGCTACGACCAGCTCATACACCTCCTATGAAA +AAACTTCCTACCACTCACCCTAGCATCACTCATGTGATATATCTCCATACCCACTACAAT +CTCCAGCATCCCCCCTCAAACCTAAGAAATATGTCTGATAAAAGAATTACTTTGATAGAG +TAA +>ORF_26 +ATGAGGATAATTGCGCCGGTGAAGCTTCAGGGGGTTTGGATGAGAATGGCTGTTACTACG +AGGGCTATGTGGCTGACTGAAGGGTATGCAATGAGCGATTTTAGGTCTGTTTGTCGCAGG +CAGATGGAGCTTGTTATGATTATACCTCATAAGGACAACATGAGGAAGGGATAG +>ORF_27 +ATGAGCTGTTCCCACATTAGGCCTAAAAACAGACGCAATTCCCGGACGCCTAAACCAAAC +CACTTTCACCGCCACACGACCAGGAGTATACTACGGCCAATGCTCAGAAATCTGTGGAGC +AAACCACAGTTTTATACCCATCGTCCTAGAATTAATCCCTCTAAAAATCTTTGA +>ORF_28 +ATGTGGTCATTACCTAGGAGGTTGCCTGGTTGGCCTAGTTCAGCCCGAATAAGGAGACTT +AGGGCTGTGCCCAGGACTCCAGCTCATGCACCGAATAGTAGGTATAGTGTTCCAATATCT +TTGTGGTTTGTAGAGAATAGTCAGCGGTCGGTGAACATCAGTAGGGTGGGGTAA +>ORF_29 +ATGCACCTAATTGGAAGCGCCACACTAGCATTATCAACTATCAATCTACCCTATGCACTC 
+ATTATCTTCACAATTCTAATCCTACTGACTATTCTAGAGATCGCCGTCGCCTTAATCCAA +GCCTACGTTTTTACACTTCTAGTGAGCCTCTACCTGCACGACAACACATAA +>ORF_30 +ATGCCTATTATAATCGGAGGCTTTGGCAACTGGCTAGTTCCCTTGATAATTGGTGCCCCC +GACATGGCATTCCCCCGCATAAACAACATAAGCTTCTGGCTCCTGCCCCCTTCTCTCCTA +CTTCTACTTGCATCTGCCATAGTAGAAGCCGGCGCGGGAACAGGTTGA +>ORF_31 +ATGATGGAACTTCGGCTCACTTCTCGGCGCCTGCCTAATCCTTCAAATTACCACAGGATT +ATTCCTAGCTATACACTACTCACCAGACGCCTCAACCGCCTTCTCGTCGATCGCCCACAT +CACCCGAGACGTAAACTATGGTTGGATCATCCGCTACCTCCACGCTAA +>ORF_32 +ATGGTGAAGTTAATTACTTTTTCTCTGATTTGTCCTTGGAAGAAAGTTTTCGTTTCCGGT +TTACAAGACCGGTGTATTAGTTTATACTACAAGGGCAGGTTCATTCAAGTATTTTGTTTT +CGATTAGAGAGGCGATTGGTATTAGGATTAGGATTGTTGTGA +>ORF_33 +ATGTTGAATCCTGTGAGTAGGAGAGTGGTATTTGATCAGGAGAATGAGGTTACTAGCACG +GAGAGTTCCCCTAGGAGATTAATGGTAGGGGGTAGGGCGAGGTTAGCGAGGCTTGCCAGG +AGTCATCAAAAGGCTATTAGTGGGAGTAGAGTTTGA +>ORF_34 +ATGCCTAGAAGGAATAATACTATCACTGTTCATCATAGCCACCCTCATAACCCTCAATAC +TCACTCCCTCTTAGCCAATATTGTACCCATCACCATACTAGTCTTTGCTGCCTGCGAAGC +AGCAGTAGGTCTAGCACTACTAGTTTCAATCTCTAA +>ORF_35 +ATGTTCGACAGTTGGGAGTTGATTGTTGTGCGTGCTTGTAAGCATGGAGTGAAGGTTTTG +ATGTGGGAGTGGATTTTATGTACTATAGGTAGTTGGGTGATATGGTACTGTACGATATTC +ATGGTGGCTGGCAGTAATGTACGAAATACATAG +>ORF_36 +ATGCTTCACTCAGCCATTTTACCCCACCCTACTGATGTTCACCGACCGCTGACTATTCTC +TACAAACCACAAAGATATTGGAACACTATACCTACTATTCGGTGCATGAGCTGGAGTCCT +GGGCACAGCCCTAAGTCTCCTTATTCGGGCTGA +>ORF_37 +ATGAGTCCTAGTTGGCTTGAAGTGGAGAAGGCCACGATTTTTTTGATGTCATTTTGTGTG +AGGGCGCAGACTGCTGCGAATAGGGTGGTGATAGCGCCTAGGCATAGCGTGAGAGTTTGG +ATTAGTGGGTTATTCTCTGCTAGGGGGTAG +>ORF_38 +ATGGGCCCGATAGCTTATTTAGCTGACCTTACTTTAGGATGGGGTGTGATAGGTGGCACG +GAGAATTTTGGATTCTCAGGGATGAGTTCGATTCTTATAGTCCTAGAAATAAGGGGATTT +GAACTCCTATTATTTACTCTATCAAAGTAA +>ORF_39 +ATGATTGTGAGGGGTAGAAGTCAAGCAGTTAATATTAGGAGGGGAGTTGTTAAGGGGTCG +GAGGAGAAGGGCAGGGAACAGCTGAATAGGTTGTTGTTAATTTGGTTAAAAAATAGTAAG +GGAATGGTGCTGATAATTAGGCTGTGA +>ORF_40 +ATGATGGCGGGCAGGATAGTTCAGACGGTTTCTATTTCCTGGGCGTCTGAAATACTAGTA +TTAGTTAGTTTTGTTGTGAGTGTTAGGAAAAGGGCGTATAGGACTAGAAAGCAGATGAGA +AAGATAATTATGAGGGCATGGTCGTGA +>ORF_41 
+ATGTGCTATGTACGGTGTATGGTTGTATGTACTATGTTCTGTCAAGGGGAGATAGGTCTG +TTGGTATCGGGGTGGGGGAGGGGTGTCGTTGGAATTGTGTTTTATGTTCGACAGTTGGGA +GTTGATTGTTGTGCGTGCTTGTAA +>ORF_42 +ATGAACGAAAATCTATTCGCTTCATTCGCTGCCCCCACAATCCTAGGCTTACCCGCCGCA +GTACTAATCATTCTATTCCCCCCTCTACTGGTCCCCACTTCTAAACATCTCATCAACAAC +CGACTAATTACCACCCAACAATGA +>ORF_43 +ATGCTAGAGGTGATGTTTTTGGTAAACAGGCGGGGTAAGATTTGCCGAGTTCCTTTTACT +TTTTTTAACCTTTCCTTGTGGGCATGCCTGTGTTGGGTTAACAGCGGGGGTAATAATGGC +TTGTTGGTTGATTGTAGATATTAG +>ORF_44 +ATGTTACTTATACTAACATTAGTTCTTCTATGGGGTAATAGATTGGTCCAATTGGGTGTA +AGGAGTTCGGTTGTATGTTTGGGATCTTTAAGGTTGTGGGTGTTGAGCTTGAACGCTTTC +TTAATTGGTGGCTGCTTTTAG +>ORF_45 +ATGATATCAGGATTGAGGGATAGAAGGAGGATGGGGGATAGGTGTAAAAATATGAGAGTG +TTTTCTCGTGTGAATGAGGGCTTTATGCTATTAATGTGGTGGGTGAGTGAGCCTCATTGT +GTTGTGGTAAACATGTAG +>ORF_46 +ATGAAGGGGGAGATGGGTAGAAGCAGTGTGGTAAGGGTGATGAGTGTAGGGAGGAAGGGG +GTGGGTTTTGTATGTTCGAATTGTCATTTTATTTTTACGTTATTAGATATGGGAAGTAGT +GTAATTGAGGTGGAGTAG +>ORF_47 +ATGCCTTTTTGGGTTGAGGTGGTAATGGAAGCGGAGATTTGGTACTGTGAAATTGTTTTA +GGTAATAGTTTCTCTAGTCAGGTCAGGTCTAGAAGAAGTAGGGGTAGGTTTTGGCTTGTA +AGAAGGCCTAGATAG +>ORF_48 +ATGAGGGTGGCTATGATGAACAGTGATAGTATTATTCCTTCTAGGCATAGTAGGGAAGAT +ATTAGGTGTGAGCGATATACTAGTATTCCTAGAAGTGAGATGGTAAATGCTAGTATAATA +TTTATATAA +>ORF_49 +ATGGCTTGTTGGTTGATTGTAGATATTAGGCTGTTAATTGTCAGTTTAATATTTTGGTCT +GATGTAGGCTTATGCGGAGGAGAATGTTTTCATGTTACTTATACTAACATTAGTTCTTCT +ATGGGGTAA +>ORF_50 +ATGCCCTCCCCCCTCAACTCCCATTCTACTAGCCCCAGCAACGTAACCCCCTACTCACCC +TACTCAACACATATACCGCTGCTAACCCCATACCCTGAACCAACCAAACCCCAAAGACAC +CCCTACAC +>ORF_51 +ATGGGGAGAATGTTGTTGGTAATGAGAAATCCTGCAAATAAGCTTCCAATGGTTAGGCGT +TTAATGGGATTTAACAGAGTGGGGTTGTTTTCGTTAATGTTGGTGAGGGTTGGGAAGCGA +GGTTGA +>ORF_52 +ATGCAAGTAGAAGTAGGAGAGAAGGGGGCAGGAGCCAGAAGCTTATGTTGTTTATGCGGG +GGAATGCCATGTCGGGGGCACCAATTATCAAGGGAACTAGCCAGTTGCCAAAGCCTCCGA +TTATAA +>ORF_53 +ATGCAAAAGGTACAGGGGTTAGTCCTTGCTGTATTATGCTTGGGTATAATTTTTCATCTT +TCCCTTGCGGTACTATGTCTATTGCGCCGGTTTACAATTTCTATCGCCTATACTTTATTT +GGGTAA +>ORF_54 
+ATGAGTTGGAGTGTAGGAGAAATCATGCTAGGGCTAGGACAAAACCAATATCACCGATAC +GGTTATATAGGATTGCTTGGATGGCTGCTGTGTTGGCATCTGTTCGGGCGTACCATCAGC +TAA +>ORF_55 +ATGACCCACCATAATTACCCCCATACTCCTGACACTATTTCTCGTCACCCAACTAAAAAT +ATTAAATTCAAATTACCATCTACCCCCCTCACCAAAACCCATAAAAATAAAAAACTACAA +TAA +>ORF_56 +ATGAGCCTACGGATGATAGGACATTTCATGTGGTGTATGCATCGGGGTAGTCCGAGTAAC +GTCGGGGCATCCCAGATAGGCCAAGGAAGTGCTGTGGGAAGAAGGTTAGGTTTACGCCAA +TGA +>ORF_57 +ATGAAATTTGAAGTCTGGCTAGGCTGGCGTCTGGGTTCTTTGTTTTTGGGGTTTGGCAGA +GATTTGTTTGAGTGCTGTGGCCGGGGGGAAGGGGGGGTTTGTGGGAATTTTTTGTTATGA +>ORF_58 +ATGAAAGCCATCGTGTACGCTAGTCATATTAAGTTGTTGGCTCAGGTGTTTGATAGTTCT +TGGGTTGTAAGAGTGAGTAATAGGATATTTAGTGAGCCTAGGGTGTTGTGGGTATAG +>ORF_59 +ATGGTACTTGCTGCAGTACTCTTAAAATTAGGTGGCTATGGCATAATACGCCTCACACTC +ATCCTCAACCCCCTAACAAAACATATAGCCTATCCCTTCCTCATGTTGTCCTTATGA +>ORF_60 +ATGCTTGGGTATAATTTTTCATCTTTCCCTTGCGGTACTATGTCTATTGCGCCGGTTTAC +AATTTCTATCGCCTATACTTTATTTGGGTAAATGGTTTGGTTAAGGTTGTTTGGTAG +>ORF_61 +ATGCTTACAAGCACGCACAACAATCAACTCCCAACTGTCGAACATAAAACACAATTCCAA +CGACACCCCTCCCCCACCCCGATACCAACAGACCTATCTCCCCTTGACAGAACATAG +>ORF_62 +ATGCTTGCATGTGTAATCTTACTAAGAGCTAATAGAAAGGCTAGGACCAAACCTGTTTGT +TTATGGGGTGATGTAAACCCGTCGAAACATTTTCAGTGTATTGCTTTGAGGGGGTAA +>ORF_63 +ATGGGCCCGGAGCGAGGAGAGTCACTCTTGTGCGGGATATTGATTTCACGGAGGATGGTG +ACCAAGGGATTCCTATCTGAGGGGGAGCATCCGTGGGGGCGAGGAGGGGTTTGA +>ORF_64 +ATGCTTTGTTGTTTGGATGTGTGGAGGACAGGGATTGCTGTTAGGATTAGGATAGATAGT +AGTAGGGCGAGGACGCCTCCTAGTTTGTTGGGGATGGATCGGAGGATTGTGTAG +>ORF_65 +ATGAAAATCACCTCAGAGCTGGTAAAAAGAGGCTTAACCCCTGTCTTTAGATTTACAGTC +CAATGCTTCACTCAGCCATTTTACCCCACCCTACTGATGTTCACCGACCGCTGA +>ORF_66 +ATGTCTAATGATGAGTTTGCTAGTACAATGCCGGTTAGGCCACCTACGGTGAAGAGAAAG +ATAAACCCTAGGGCTCAGAGTACTGCGGCAGATCATTTCATATTGCTTCCGTGA +>ORF_67 +ATGATCCATCATAGAATTCTCACTATGATATATAGACTCAGACCCCAACATCAACCAATT +CTTCAAATACTTACTTATCTTCCTAATTACTATACTAATCCTAGTCACCGCTAA +>ORF_68 +ATGAGATTGTTTGGGCTACTGCTCGTAGTGCACCGATTAAGGCGTAGTTCGAGTTTGATG +CTCACCCTGATCAGAGGATTGAGTAAACGGCTAGGCTGGAGGTGGCTAGAATAA +>ORF_69 
+ATGGTTTTTCATATCATTGGTCGTGGTTGTAGTCCGTGCGAGAATAATGACATATGCTTT +ATTTTTATTGAGTGTGAGTTTAGTGATAGGGTTTGTGGGGTTTTCTTCTAA +>ORF_70 +ATGAGGGCGCCGAGGATGGGGGGAATTAAGGAAGTTAGGGCTAAGGTGGTTATGGTAGCA +TACATGGTTATTACTTTTATTTGGAGTTGCACCAAAATTTTTGGGGCCTAA +>ORF_71 +ATGACAATTCGAACATACAAAACCCACCCCCTTCCTCCCTACACTCATCACCCTTACCAC +ACTGCTTCTACCCATCTCCCCCTTCATACTAATAATCTTATAGAAATTTAG +>ORF_72 +ATGATTAACTCCCCTAATTCCATCCACCCTCCTCTCCCTAGGAGGCCTACCCCCACTAAC +TGGCTTCTTACCCAAATGAGTTATCATCGAAGAATTCACAAAAAATAA +>ORF_73 +ATGGTTGGATCATCCGCTACCTCCACGCTAACGGCGCCTCAATATTTTTTATCTGCCTCT +TCCTACACATCGGCCGAGGTCTATATTACGGCTCATTTCTCTACCTAG +>ORF_74 +ATGACCCCTAACAGGGGCCCTCTCGGCCCTCCTAATAACCTCCGGCCTGGCCATATGATT +CCACTTCTACTCCACAACACTACTCACACTAGGCTTACTAACTAA +>ORF_75 +ATGTGTGGTAGGGTGGGGGGCATCCATATAGTCATTCCAGGTTTGCGGAGGGCTCTTCTA +CTATTAGGACTTTTCGTTTTGAAGCAAAGGCTTCTCAAATCATGA +>ORF_76 +ATGTTCATTGGCGTAAACCTAACCTTCTTCCCACAGCACTTCCTTGGCCTATCTGGGATG +CCCCGACGTTACTCGGACTACCCCGATGCATACACCACATGA +>ORF_77 +ATGTACTATGTTCTGTCAAGGGGAGATAGGTCTGTTGGTATCGGGGTGGGGGAGGGGTGT +CGTTGGAATTGTGTTTTATGTTCGACAGTTGGGAGTTGA +>ORF_78 +ATGAGTCGAAATCATTCGTTTTATTTAAACTATATACCAATTCGGTTCAGTCTAACCCTT +TTTGTAATCATTCGTAGGCGAGGCTTAGGGCTAGGATAG +>ORF_79 +ATGCTGGAGATTGTAGTGGGTATGGAGATATATCACATGAGTGATGCTAGGGTGAGTGGT +AGGAAGTTTTTTCATAGGAGGTGTATGAGCTGGTCGTAG +>ORF_80 +ATGACATTAACACTATTCTCACCAGGCCTCCTAGGCGATCCAGACAACTATACCCTAGCT +AACCCCCTAAACACCCCACCCCACATTAAACCCGAGTGA +>ORF_81 +ATGAGTAGGAAGATTCCTGCTACGACTATGGTGCTTGAGTGGAGTAGGGCTGAAACAGGG +GTAGGGCCTTCTATGGCTGAGGGGAGTCAGGGGTGA +>ORF_82 +ATGCAGAGTGGGGTTTTGCAGTCCTTAGTTGTTGCAGAAATTAAGTATTGTAACTTGCTG +AGGGCTTTGAAGGCTCTTGGTCTGTGCTTAACCTAA +>ORF_83 +ATGTCGCAGTATCTGTCTTTGATTCCTGCCCCATTGTATTATTTATCGCACCTACGTTCA +ATATTACGACCTAGCATACCTACTAAAGTGTGTTGA +>ORF_84 +ATGCATTTGGTATTTTCGTCTGGGGGGTGTGCACGCGATAGCATTGCGAAACGCTGGCCC +CGGAGCACCCTATGTCGCAGTATCTGTCTTTGA +>ORF_85 +ATGGATAACTGTTATCCTTTAAAAGTTGAGAAAGCCATGTTGTTAGGCATGGGAATACGA +GTTAGCAGTTCTTATAAGCTTTCTCGGTAA +>ORF_86 
+ATGATATTGAACCTACGAATACACCGACTACGGCGGGCTAATCTTCAACTCCTACATACT +CCCCCCATTATTTCTAGAACCAGGTGA +>ORF_87 +ATGAAAATTATTAATATTACTGCTGTCAGGGAGATAAATGAGCCTACGGATGATAGGACA +TTTCATGTGGTGTATGCATCGGGGTAG +>ORF_88 +ATGATATTATCTCAATTTAGCGCCATGCCAACACCCACTCAAGAACAGAGTTTGTTAAGA +TGGCAGAGCCCGGTAATTGCATAA +>ORF_89 +ATGGTGAGGGAGGTTGAAGTGAGGGGTATGGTTTTGAGTAATCCTCCTATTTTTCGAATG +TCTTGCTCATTATTGAGGTTGTGA +>ORF_90 +ATGAGGCAGATAGTGAGGAAAGTTGATCCAATAATGACGTGGAGTCCGTGGAAGCCTGTG +GCTACAAAGAATGTTGAGCCGTAG +>ORF_91 +ATGTGGCTTCGACCCTATATCCCCCGCCCGCGTCCCCTTCTCCATAAAATTTTTCCTAGT +AGCCATCACCTTCCTATTATTTGA +>ORF_92 +ATGGGGTGTGATAGGTGGCACGGAGAATTTTGGATTCTCAGGGATGAGTTCGATTCTTAT +AGTCCTAGAAATAAGGGGATTTGA +>ORF_93 +ATGTCGGATACAGTTCACTTTAGCTACCCCCAGATGTTATGGGCCCGGAGCGAGGAGAGT +CACTCTTGTGCGGGATATTGA +>ORF_94 +ATGGCAGAGCCCGGTAATTGCATAAAACTTAAAACTTTACAATCAGAGGTTCAATTCCTC +TTCTTGACAACACACCCATGA +>ORF_95 +ATGGAATTAGGGGAGTTAATCATGTTAGCTTGTTTCAGGTGCGAGATAGTAGTAGGGTTG +TGGTGCTGGAGTTTAAGTTGA +>ORF_96 +ATGGGTACAATGAGGAGTAGGAGGTTGGTCATGGGTGTGTTGTCAAGAAGAGGAATTGAA +CCTCTGATTGTAAAGTTTTAA +>ORF_97 +ATGTATGGGATAGCGGACAGTAGGTTTGTAATTACTGTGGCTCCTCAGAAGGATATTTGG +CCTCATGGGAGGACATAG +>ORF_98 +ATGGCCAGGCCGGAGGTTATTAGGAGGGCCGAGAGGGCCCCTGTTAGGGGTCATGGGCTG +GGTTTTACTATGTGGTAG +>ORF_99 +ATGGGCTGGGTTTTACTATGTGGTAGGCATGTGATTGGTGGGTCATTATGTGTTGTCGTG +CAGGTAGAGGCTCACTAG +>ORF_100 +ATGCCTAGACCAAGAAACTATTATCTCGAACTGACACTGAGCAACAACCCAAACAACCCA +ACTCTCCCTGAGCTTTAA +>ORF_101 +ATGGTTGAAGTGGAGGGTTTTAAGGGTTCTTTAGTGAAGAGTTTTATGGCGTCAGCGAAG +GGCTGTAATAGCCCGTAA +>ORF_102 +ATGTTAAGCTACACTCTGGTTCGTCCAAGTGCACTTTCCAGTACACTTACCATGTTACGA +CTTATCTCCTCTATATAA +>ORF_103 +ATGCTATCGCGTGCACACCCCCCAGACGAAAATACCAAATGCATGGAAGGCTCCCGTGAC +TGGTTAATAGGGTGA +>ORF_104 +ATGGCTCCACGAGGGTTTAGCTGTCTCTTACTTTCAACCAGTGAAATTGACCTACCCGTG +AAGAGGCGGGCATAA +>ORF_105 +ATGAGAGTAATAGATAGGGCTCAGGCGTTTGTGTATGATATGTTAGCGGTTTCGATGATG +AGGTCTTTGGAGTAG +>ORF_106 +ATGAAGCGAATAGATTTTCGTTCATTTTGGTTCTCAGGGTTTATTGTAGTTTTTTATTTT +TATGGGTTTTGGTGA +>ORF_107 
+ATGTATTGCTCGGAGGTTGGGTTGTGCTCCGAGGTCGCCCCAACCGAAATTTTTAATGCA +GGTTTAATAGTTTAG