In [3]:
# Location of the alignment text file to display (the captured output shows
# FASTA-style records: a ">" header line followed by sequence rows).
consensus_file = r"D:\josiah\Documents\Research\Colleagues\Will Plumb\consensus align.txt"

# Read the entire file in one go, then echo it row by row; splitlines() drops
# the line terminators so print() does not emit doubled blank lines.
with open(consensus_file, 'r') as infile:
    alignment_text = infile.read()
    alignment_rows = alignment_text.splitlines()
    for line in alignment_rows:
        print(line)


>CON
ATGGAAGACMAAAWWGCWAATTTGWTWGCVTTTTYCRTWGTWAYTSTACT
CATARTTGYCATTATCATTGCTCGTNTWTYTCTGAAACTYTCCARGACDT
TTTTTCTKATATKTGGAGCTGATATTGCAGCAATTCTAGCAGTTTTTGCA
KTWRTRGCKATCCGGVYTCGTTTYRCYGCTCGRMGAAAACAACTYGAACD
RCRGTWYGATTCAGAWGGCCGWGAGCTTMGAATMGAGTACAGTTTTCTGA
GGAAAGTTGCYGGMGTTCCSAYAAARTTCMGGTATMGGGAYYTRGAWRTA
GCCACRGATGGCTTTSGATCWATGGTRGGACGTGGGKCSTCRGCTKYART
CTTTAAAGGGATMCTCARYGAYGGGACRGCWGTKGCAGTAAAAMGGATYG
AAGGGGRTGATCRAGGASRGAAGGAATTCAAATCAGAAGTYGCAGCTATT
GCTAGCGTGCAACACGTMAACCTYGTHCGYCTTCTYGGGTWYTGTKTCBM
GTCSACTGGTCCTCGWYTCMTYGTTTACGABTTCATTCAYAAYGGCTCGT
TGGATAATTGGATTTTCCCCARGVGSGWAMKDBKTGRYCRAYKYAVTGGT
TGTTTGACATGGGATTYGAGATGTRSAGTTGCTCTYGAYGTAGCKARAGC
RCTWTCTTACTTGCAYCRYGATTGTCGRTCTTGYATACTGCATCTAGATG
TKAAGCCRGAAAATATACTTMTMGACCAWGATTATCGYGCRCTYGTGTCR
GAYTTYGGGCTCTCRAAAMTDAAAGGAAKAGASGAGAGTCGAGTTGTGAC
AACDATYCGDGGGACTAGAGGTTAYTTGGCTCCTGAATGGMTCCTGGAGA
AYGGAGTWTCHGAGAAATGTGAYGTGTACAGTTATGGAATGGTGCTBTTA
GAGATTATYGGTGGACRAARAARYGTCNGTGTTCTYGAMAAWGGYAWHSG
YGARTCGAAAARAAAGTTTCARTWCTTCCCRAAGATYGTGAGYGASAAAT
WKAAAGMTGGGAAACTTAYGGAAATTGTTGATCCAAGGYTRGTTGAAGAT
KKWGGGRTTAAYGAGAGRCARTTAAARAGACTGGTTTGTGCAGCTTTATG
GTGCATACAAGAGAMGRCCAAGCKTAGGCCAASCATGGCTAYGGTYGTTG
AAATGCTYGAGGGGCGTGTACYDGTYSAAGACCCKCCCRACACRCAAATG
CTTRTWRTTGATWTVTTAWCAMTTGRYRARGAKSMRGCTRTYRTRCTCCC
ARGCSTAGATWTGGTRTAGTGRGAWRRWTACSAAATGAATAGTGACATTC
CTTCMWCRTCRAGTTACTCGGTTACAATGTCRRYASTSTCRGGYCGGTAG
>FRAX21_FRAEX38873_V2_000292250.1_R0
ATGGAAGACAAAAAAGCAAATTTGATTGCATTTTCCATAGTAACTCTACT
CATAATTGCCATTATCATTGCTCGTTTATCTCTGAAACTTTCCAAGACAT
TTTTTCTGATATGTGGAGCTGATATTGCAGCAATTCTAGCAGTTTTTGCA
GTAATAGCTATCCGGGCTCGTTTTACCGCTCGACGAAAACAACTCGAACG
GCAGTATGATTCAGAAGGCCGAGAGCTTCGAATCGAGTACAGTTTTCTGA
GGAAAGTTGCCGGAGTTCCCATAAAGTTCCGGTATCGGGACTTGGAAATA
GCCACGGATGGCTTTCGATCTATGGTGGGACGTGGGGCGTCAGCTTCAAT
CTTTAAAGGGATACTCAATGATGGGACGGCAGTGGCAGTAAAACGGATCG
AAGGGGATGATCGAGGACAGAAGGAATTCAAATCAGAAGTTGCAGCTATT
GCTAGCGTGCAACACGTAAACCTCGTCCGTCTTCTCGGGTATTGTGTCCC
GTCGACTGGTCCTCGTTTCCTTGTTTACGATTTCATTCATAACGGCTCGT
TGGATAATTGGATTTTCCCCAAGGGCGAAAGTCGTGGTCGATGTAGTGGT
TGTTTGACATGGGATTTGAGATGTGGAGTTGCTCTCGATGTAGCTAGAGC
GCTTTCTTACTTGCACCACGATTGTCGGTCTTGTATACTGCATCTAGATG
TGAAGCCGGAAAATATACTTCTCGACCATGATTATCGCGCACTTGTGTCA
GATTTTGGGCTCTCAAAACTAAAAGGAAGAGACGAGAGTCGAGTTGTGAC
AACAATTCGGGGGACTAGAGGTTACTTGGCTCCTGAATGGCTCCTGGAGA
ATGGAGTTTCTGAGAAATGTGATGTGTACAGTTATGGAATGGTGCTGTTA
GAGATTATTGGTGGACGAAAAAACGTCCGTGTTCTCGAAAATGGTAACGG
TGAATCGAAAAAAAAGTTTCAATTCTTCCCAAAGATTGTGAGTGACAAAT
TTAAAGATGGGAAACTTATGGAAATTGTTGATCCAAGGCTGGTTGAAGAT
GGAGGGGTTAACGAGAGGCAATTAAAGAGACTGGTTTGTGCAGCTTTATG
GTGCATACAAGAGAAGGCCAAGCTTAGGCCAAGCATGGCTATGGTCGTTG
AAATGCTCGAGGGGCGTGTACCGGTTGAAGACCCGCCCAACACACAAATG
CTTGTAGTTGATTTGTTATCAATTGATGAAGAGCAAGCTGTTATGCTCCC
AGGCCTAGATTTGGTATAGT-GGAAGAATACCAAATGAATAGTGACATTC
CTTCCACGTCGAGTTACTCGGTTACAATGTCGATACTCTCAGGCCGGTAG
>FRAX19_FRAEX38873_V2_000292250.1_R0
ATGGAAGACAAAAAAGCAAATTTGATTGCATTTTCCATAGTAATTGTACT
CATAATTGTCATTATCATTGCTCGTTTATTTCTGAAACTTTCCAAGACAT
TTTTTCTGATATGTGGAGCTGATATTGCAGCAATTCTAGCAGTTTTTGCA
GTTATAGCGATCCGGCTTCGTTTTACCGCTCGACGAAAACAACTCGAACG
ACAGTTCGATTCAGAAGGCCGAGAGCTTCGAATCGAGTACAGTTTTCTGA
GGAAAGTTGCCGGAGTTCCCATAAAGTTCCGGTATCGGGATTTAGAAGTA
GCCACGGATGGCTTTCGATCAATGGTAGGACGTGGGGCGTCGGCTTCAGT
CTTTAAAGGGATACTCAATGATGGGACGGCAGTGGCAGTAAAAAGGATCG
AAGGGGATGATCAAGGAGAGAAGGAATTCAAATCAGAAGTCGCAGCTATT
GCTAGCGTGCAACACGTAAACCTCGTACGCCTTCTCGGGTATTGTGTCCC
GTCGACTGGTCCTCGTTTCCTTGTTTACGAGTTCATTCATAACGGCTCGT
TGGATAATTGGATTTTCCCCAAGGGGGAAATTTGTGGTCGACGTAGTGGT
TGTTTGACATGGGATTCGAGATGTAGAGTTGCTCTTGATGTAGCGAGAGC
GCTTTCTTACTTGCACCACGATTGTCGATCTTGTATACTGCATCTAGATG
TGAAGCCGGAAAATATACTTCTAGACCATGATTATCGCGCACTCGTGTCA
GATTTCGGGCTCTCGAAACTAAAAGGAAGAGAGGAGAGTCGAGTTGTGAC
AACGATCCGGGGGACTAGAGGTTACTTGGCTCCTGAATGGCTCCTGGAGA
ACGGAGTATCAGAGAAATGTGATGTGTACAGTTATGGAATGGTGCTGTTA
GAGATTATTGGTGGACAAAGAAACGTCCGTGTTCTCGAAAATGGCATCGG
TGAGTCGAAAAAAAAGTTTCAGTACTTCCCAAAGATTGTGAGTGACAAAT
TGAAAGATGGGAAACTTATGGAAATTGTTGATCCAAGGTTGGTTGAAGAT
TGTGGGGTTAATGAGAGGCAATTAAAGAGACTGGTTTGTGCAGCTTTATG
GTGCATACAAGAGAAGGCCAAGCGTAGGCCAAGCATGGCTATGGTCGTTG
AAATGCTCGAGGGGCGTGTACCTGTCGAAGACCCGCCCAACACACAAATG
CTTATTGTTGATTTATTATCAATTGATGAAGAGGAAGCTGTTGTACTCCC
AGGCCTAGATTTGGTATAGT-GGATAATTACCAAATGAATAGTGACATTC
CTTCCTCGTCGAGTTACTCGGTTACAATGTCAGTACTCTCAGGCCGGTAG
>FRAX20_FRAEX38873_V2_000292250.1_R0
ATGGAAGACAAAAAAGCAAATTTGTTAGCATTTTCCATAGTAATTGTACT
CATAATTGTCATTATCATTGCTCGTTTATTTCTGAAACTTTCCAGGACAT
TTTTTCTGATATGTGGAGCTGATATTGCAGCAATTCTAGCAGTTTTTGCA
GTTATAGCGATCCGGGTTCGTTTTACCGCTCGACGAAAACAACTCGAACG
ACAGTTCGATTCAGAAGGCCGTGAGCTTCGAATCGAGTACAGTTTTCTGA
GGAAAGTTGCCGGAGTTCCGATAAAGTTCCGGTATCGGGATCTGGAAGTA
GCCACGGATGGCTTTCGATCAATGGTAGGACGTGGGGCGTCGGCTTCAGT
CTTTAAAGGGATACTCAATGATGGGACGGCAGTGGCAGTAAAAAGGATCG
AAGGGGATGATCAAGGAGAGAAGGAATTCAAATCAGAAGTTGCAGCTATT
GCTAGCGTGCAACACGTAAACCTCGTTCGCCTTCTCGGGTATTGTGTCCA
GTCGACTGGTCCTCGACTCCTTGTTTACGAGTTCATTCATAACGGCTCGT
TGGATAATTGGATTTTCCCCAGGCGGGAACGTTGTGGTCGACTTAGTGGT
TGTTTGACATGGGATTCGAGATGTAGAGTTGCTCTTGATGTAGCGAGAGC
GCTATCTTACTTGCACCACGATTGTCGATCTTGCATACTGCATCTAGATG
TGAAGCCGGAAAATATACTTCTCGACCATGATTATCGCGCACTCGTGTCG
GATTTCGGGCTCTCGAAACTAAAAGGAATAGACGAGAGTCGAGTTGTGAC
AACGATCCGAGGGACTAGAGGTTACTTGGCTCCTGAATGGCTCCTGGAGA
ACGGAGTATCAGAGAAATGTGATGTGTACAGTTATGGAATGGTGCTGTTA
GAGATTATTGGTGGACAAAGAAACGTCCGTGTTCTCGAAAATGGCATCCG
TGAGTCGAAAAAAAAGTTTCAATACTTCCCAAAGATTGTGAGTGACAAAT
TGAAAGATGGGAAACTTATGGAAATTGTTGATCCAAGGTTGGTTGAAGAT
GGAGGGGTTAATGAGAGGCAATTAAAGAGACTGGTTTGTGCAGCTTTATG
GTGCATACAAGAGAAGGCCAAGCGTAGGCCAAGCATGGCTATGGTCGTTG
AAATGCTCGAGGGGCGTGTACCTGTCGAAGACCCGCCCAACACGCAAATG
CTTATTGTTGATTTATTATCAATTGATGAAGAGGAAGCTGTTGTACTCCC
AGGCGTAGATTTGGTATAGT-GGATAATTACCAAATGAATAGTGACATTC
CTTCCTCGTCGAGTTACTCGGTTACAATGTCAGTACTCTCAGGCCGGTAG
>FRAX31_FRAEX38873_V2_000292250.1_R0
ATGGAAGACAAAAATGCAAATTTGATTGCGTTTTCCATAGTAATTGTACT
CATAATTGTCATTATCATTGCTCGTTTATCTCTGAAACTTTCCAAGACAT
TTTTTCTGATATTTGGAGCTGATATTGCAGCAATTCTAGCAGTTTTTGCA
TTTATAGCGATCCGGGTTCGTTTTGCCGCTCGGAGAAAACAACTCGAACG
ACAGTTCGATTCAGAAGGCCGAGAGCTTCGAATCGAGTACAGTTTTCTGA
GGAAAGTTGCCGGAGTTCCGATAAAGTTCCGGTATCGGGACTTGGAAGTA
GCCACGGATGGCTTTCGATCTATGGTAGGACGTGGGGCGTCGGCTTTAGT
CTTTAAAGGGATACTCAATGATGGGACGGCAGTTGCAGTAAAAAGGATCG
AAGGGGATGATCGAGGAGAGAAGGAATTCAAATCAGAAGTTGCAGCTATT
GCTAGCGTGCAACACGTCAACCTCGTACGCCTTCTCGGGTATTGTGTCCC
GTCGACTGGTCCTCGTCTCCTTGTTTACGACTTCATTCATAATGGCTCGT
TGGATAATTGGATTTTCCCCAAGGGGGAAAGTCGTGGTCGACGTACTGGT
TGTTTGACATGGGATTCGAGATGTAGAGTTGCTCTTGATGTAGCGAAAGC
GCTTTCTTACTTGCACCACGATTGTCGATCTTGTATACTGCATCTAGATG
TGAAGCCGGAAAATATACTTCTCGACCATGATTATCGCGCACTCGTGTCA
GATTTCGGGCTCTCGAAACTGAAAGGAAGAGACGAGAGTCGAGTTGTGAC
AACTATCCGTGGGACTAGAGGTTACTTGGCTCCTGAATGGCTCCTGGAGA
ATGGAGTTTCTGAGAAATGTGATGTGTACAGTTATGGAATGGTGCTGTTA
GAGATTATTGGTGGACGAAGAAACGTCCGTGTTCTCGAAAAAGGCAAAGG
TGAGTCGAAAAAAAAGTTTCAATACTTCCCAAAGATTGTGAGCGACAAAT
TTAAAGATGGGAAACTTATGGAAATTGTTGATCCAAGGTTGGTTGAAGAT
GGAGGGGTTAATGAGAGACAATTAAAGAGACTGGTTTGTGCAGCTTTATG
GTGCATACAAGAGAAGGCCAAGCTTAGGCCAAGCATGGCTATGGTCGTTG
AAATGCTCGAGGGGCGTGTACCGGTCGAAGACCCGCCCAACACACAAATG
CTTATTGTTGATTTGTTATCAATTGATGAAGAGGCAGCTGTCGTACTCCC
AGGCCTAGATTTGGTATAGT-GGAAAGTTACCAAATGAATAGTGACATTC
CTTCCACGTCGAGTTACTCGGTTACAATGTCGATACTCTCAGGCCGGTAG
>FRAX25_FRAEX38873_V2_000292250.1_R0
ATGGAAGACAAAAAAGCAAATTTGATTGCATTTTTCATAGTAATTGTACT
CATAATTGTCATTATCATTGCTCGTTTATCTCTGAAACTTTCCAAGACTT
TTTTTCTTATATGTGGAGCTGATATTGCAGCAATTCTAGCAGTTTTTGCA
GTTATAGCGATCCGGGTTCGTTTTACCGCTCGACGAAAACAACTCGAACG
ACAGTTTGATTCAGAAGGCCGAGAGCTTCGAATAGAGTACAGTTTTCTGA
GGAAAGTTGCCGGAGTTCCGATAAAGTTCCGGTATCGGGACTTGGAAGTA
GCCACAGATGGCTTTCGATCTATGGTAGGACGTGGGGCGTCGGCTTCAGT
CTTTAAAGGGATACTCAATGATGGGACGGCAGTGGCAGTAAAAAGGATCG
AAGGGGATGATCGAGGAGAGAAGGAATTCAAATCAGAAGTTGCAGCTATT
GCTAGCGTGCAACACGTAAACCTCGTACGCCTTCTCGGGTATTGTTTCCC
GTCCACTGGTCCTCGTTTCCTTGTTTACGAGTTCATTCATAACGGCTCGT
TGGATAATTGGATTTTCCCCAAGAGGGAAAGTTGTGGTCGACGTAGTGGT
TGTTTGACATGGGATTCGAGATGTAGAGTTGCTCTTGATGTAGCGAGAGC
GCTTTCTTACTTGCACCACGATTGTCGATCTTGTATACTGCATCTAGATG
TGAAGCCGGAAAATATACTTCTCGACCATGATTATCGCGCGCTCGTGTCA
GATTTCGGGCTCTCAAAACTAAAAGGAAGAGACGAGAGTCGAGTTGTGAC
AACGATCCGGGGGACTAGAGGTTATTTGGCTCCTGAATGGCTCCTGGAGA
ATGGAGTTTCTGAGAAATGTGATGTGTACAGTTATGGAATGGTGCTTTTA
GAGATTATTGGTGGACGAAGAAGCGTCCGTGTTCTCGAAAATGGCAACGG
TGAATCGAAAAGAAAGTTTCAATTCTTCCCAAAGATTGTGAGTGACAAAT
TTAAAGATGGGAAACTTATGGAAATTGTTGATCCAAGGTTAGTTGAAGAT
GGAGGGGTTAATGAGAGGCAATTAAAAAGACTGGTTTGTGCAGCTTTATG
GTGCATACAAGAGAAGGCCAAGCTTAGGCCAAGCATGGCTACGGTCGTTG
AAATGCTCGAGGGGCGTGTACCGGTTGAAGACCCGCCCGACACACAAATG
CTTATAGTTGATATGTTATCAATTGATGAAGAGGCAGCTGTTGTACTCCC
AGGCCTAGATTTGGTATAGT-AGAAAATTACCAAATGAATAGTGACATTC
CTTCCACATCGAGTTACTCGGTTACAATGTCGATACTCTCAGGCCGGTAG
>FRAX07_FRAEX38873_V2_000292250.1_R0
ATGGAAGACAAAAAAGCAAATTTGATTGCATTTTCCGTAGTAATTGTACT
CATAATTGTCATTATCATTGCTCGTTTATCTCTGAAACTTTCCAAGACAT
TTTTTCTGATATGTGGAGCTGATATTGCAGCAATTCTAGCAGTTTTTGCA
GTTATAGCGATCCGGGTTCGTTTCACCGCTCGACGAAAACAACTCGAACG
ACAGTTTGATTCAGATGGCCGAGAGCTTAGAATCGAGTACAGTTTTCTGA
GGAAAGTTGCCGGAGTTCCGATAAAGTTCCGGTATCGGGACTTGGAAGTA
GCCACGGATGGCTTTCGATCTATGGTAGGACGTGGGGCGTCGGCTTCAGT
CTTTAAAGGGATACTCAATGATGGGACGGCAGTGGCAGTAAAAAGGATCG
AAGGGGATGATCAAGGAGGGAAGGAATTCAAATCAGAAGTTGCAGCTATT
GCTAGCGTGCAACACGTAAACCTCGTACGCCTTCTCGGGTATTGTGTCTC
GTCCACTGGTCCTCGTTTCCTCGTTTACGAGTTCATTCACAACGGCTCGT
TGGATAATTGGATTTTCCCCAAGGGGGTAAGTTGTGGCCGACGTAATGGT
TGTTTGACATGGGATTCGAGATGTAGAGTTGCTCTTGATGTAGCGAGAGC
GCTTTCTTACTTGCACCGTGATTGTCGATCTTGTATACTGCATCTAGATG
TGAAGCCGGAAAATATACTTCTCGACCATGATTATCGCGCACTCGTGTCA
GATTTCGGGCTCTCGAAACTAAAAGGAAGAGACGAGAGTCGAGTTGTGAC
AACGATCCGGGGGACTAGAGGTTACTTGGCTCCTGAATGGCTCCTGGAGA
ATGGAGTTTCTGAGAAATGTGACGTGTACAGTTATGGAATGGTGCTCTTA
GAGATTATTGGTGGACAAAGAAACGTCCGTGTTCTCGACAATGGCAACGG
TGAATCGAAAAAAAAGTTTCAATTCTTCCCAAAGATTGTGAGTGACAAAT
TTAAAGATGGGAAACTTATGGAAATTGTTGATCCAAGGTTAGTTGAAGAT
GGAGGGGTTAATGAGAGGCAATTAAAGAGACTGGTTTGTGCAGCTTTATG
GTGCATACAAGAGAAGACCAAGCTTAGGCCAACCATGGCTACGGTCGTTG
AAATGCTCGAGGGGCGTGTACTGGTTGAAGACCCGCCCAACACACAAATG
CTTATAGTTGATTTGTTATCAATTGATGAAGAGGCGGCTGTTGTACTCCC
AGGCCTAGATTTGGTATAGT-AGAAAATTACCAAATGAATAGTGACATTC
CTTCCACGTCGAGTTACTCGGTTACAATGTCGGTACTCTCAGGCCGGTAG
>FRAX08_FRAEX38873_V2_000292250.1_R0
ATGGAAGACAAAATAGCAAATTTGATTGCATTTTCCGTAGTAATTGTACT
CATAATTGTCATTATCATTGCTCGTTTATCTCTGAAACTTTCCAAGACAT
TTTTTCTGATATGTGGAGCTGATATTGCAGCAATTCTAGCAGTTTTTGCA
GTTATAGCGATCCGGGTTCGTTTCACCGCTCGACGAAAACAACTTGAACG
ACAGTTTGATTCAGAAGGCCGAGAGCTTCGAATCGAGTACAGTTTTCTGA
GGAAAGTTGCCGGAGTTCCGATAAAGTTCCGGTATCGGGACTTGGAAGTA
GCCACGGATGGCTTTCGATCTATGGTAGGACGTGGGGCGTCGGCTTCAGT
CTTTAAAGGGATACTCAATGATGGGACGGCAGTGGCAGTAAAAAGGATCG
AAGGGGATGATCAAGGAGAGAAGGAATTCAAATCAGAAGTTGCAGCTATT
GCTAGCGTGCAACACGTAAACCTCGTACGCCTTCTCGGGTATTGTGTCTC
GTCCACTGGTCCTCGTTTCCTCGTTTACGAGTTCATTCACAACGGCTCGT
TGGATAATTGGATTTTCCCCAAGAGGGAAAGTTGTGGCCGACGTAATGGT
TGTTTGACATGGGATTCGAGATGTAGAGTTGCTCTTGATGTAGCGAGAGC
GCTTTCTTACTTGCACCGTGATTGTCGATCTTGTATACTGCATCTAGATG
TGAAGCCGGAAAATATACTTCTCGACCATGATTATCGCGCACTCGTGTCA
GATTTCGGGCTCTCGAAACTAAAAGGAAGAGACGAGAGTCGAGTTGTGAC
AACGATCCGGGGGACTAGAGGTTACTTGGCTCCTGAATGGCTCCTGGAGA
ATGGAGTTTCTGAGAAATGTGATGTGTACAGTTATGGAATGGTGCTTTTA
GAGATTATTGGTGGACAAAGAAACGTCCGTGTTCTCGAAAATGGCAACGG
TGAATCGAAAAAAAAGTTTCAATTCTTCCCAAAGATTGTGAGTGACAAAT
TTAAAGATGGGAAACTTATGGAAATTGTTGATCCAAGGTTAGTTGAAGAT
GGAGGGGTTAATGAGAGGCAATTAAAGAGACTGGTTTGTGCAGCTTTATG
GTGCATACAAGAGAAGGCCAAGCTTAGGCCAACCATGGCTACGGTCGTTG
AAATGCTCGAGGGGCGTGTACTGGTTGAAGACCCGCCCAACACACAAATG
CTTATAGTTGATTTGTTATCAATTGATGAAGAGGCGGCTGTTGTACTCCC
AGGCCTAGATTTGGTATAGT-AGAAAATTACCAAATGAATAGTGACATTC
CTTCCACGTCGAGTTACTCGGTTACAATGTCGGTACTCTCAGGCCGGTAG
>FRAX12_FRAEX38873_V2_000292250.1_R0
ATGGAAGACAAAAAAGCAAATTTGATTGCATTTTCCGTAGTAATTGTACT
CATAATTGTCATTATCATTGCTCGTTTATCTCTGAAACTTTCCAAGACAT
TTTTTCTGATATGTGGAGCTGATATTGCAGCAATTCTAGCAGTTTTTGCA
GTTATAGCGATCCGGGTTCGTTTCACCGCTCGACGAAAACAACTCGAACG
ACAGTTTGATTCAGATGGCCGAGAGCTTAGAATCGAGTACAGTTTTCTGA
GGAAAGTTGCCGGAGTTCCGATAAAGTTCCGGTATAGGGACTTGGAAGTA
GCCACGGATGGCTTTCGATCTATGGTAGGACGTGGGGCGTCGGCTTCAGT
CTTTAAAGGGATACTCAATGATGGGACGGCAGTGGCAGTAAAAAGGATCG
AAGGGGGTGATCAAGGAGAGAAGGAATTCAAATCAGAAGTTGCAGCTATT
GCTAGCGTGCAACACGTAAACCTCGTACGCCTTCTCGGGTATTGTGTCTC
GTCCACTGGTCCTCGTTTCCTCGTTTACGAGTTCATTCACAACGGCTCGT
TGGATAATTGGATTTTCCCCAAGGGGGAAAGTTGTGGCCGACGTAATGGT
TGTTTGACATGGGATTCGAGATGTAGAGTTGCTCTTGATGTAGCGAGAGC
GCTTTCTTACTTGCACCATGATTGTCGATCTTGTATACTGCATCTAGATG
TGAAGCCGGAAAATATACTTCTCGACCATGATTATCGCGCACTCGTGTCA
GATTTCGGGCTCTCGAAACTAAAAGGAAGAGACGAGAGTCGAGTTGTGAC
AACGATCCGGGGGACTAGAGGTTACTTGGCTCCTGAATGGCTCCTGGAGA
ATGGAGTTTCTGAGAAATGTGATGTGTACAGTTATGGAATGGTGCTGTTA
GAGATTATTGGTGGACGAAGAAACGTCCGTGTTCTCGAAAATGGCAACGG
TGAATCGAAAAAAAAGTTTCAATTCTTCCCAAAGATTGTGAGTGACAAAT
TTAAAGATGGGAAACTTATGGAAATTGTTGATCCAAGGTTAGTTGAAGAT
GGAGGGGTTAATGAGAGGCAATTAAAGAGACTGGTTTGTGCAGCTTTATG
GTGCATACAAGAGAAGGCCAAGCTTAGGCCAACCATGGCTACGGTCGTTG
AAATGCTCGAGGGGCGTGTACTGGTTGAAGACCCGCCCAACACACAAATG
CTTATAGTTGATTTGTTATCAATTGATGAAGAGGCGGCTGTTGTACTCCC
AGGCCTAGATTTGGTATAGT-AGAAAATTACCAAATGAATAGTGACATTC
CTTCAACGTCGAGTTACTCGGTTACAATGTCGGTACTCTCAGGCCGGTAG
>FRAX29_FRAEX38873_V2_000292250.1_R0
ATGGAAGACAAAAAAGCAAATTTGATTGCATTTTCCGTAGTAATTGTACT
CATAATTGTCATTATCATTGCTCGTTTATCTCTGAAACTTTCCAAGACAT
TTTTTCTGATATGTGGAGCTGATATTGCAGCAATTCTAGCAGTTTTTGCA
GTTATAGCGATCCGGGTTCGTTTCACCGCTCGACGAAAACAACTCGAACG
ACAGTTTGATTCAGATGGCCGAGAGCTTAGAATCGAGTACAGTTTTCTGA
GGAAAGTTGCCGGAGTTCCGATAAAGTTCCGGTATCGGGACTTGGAAGTA
GCCACGGATGGCTTTCGATCTATGGTAGGACGTGGGGCGTCGGCTTCAGT
CTTTAAAGGGATACTCAATGATGGGACGGCAGTGGCAGTAAAAAGGATCG
AAGGGGATGATCAAGGAGAGAAGGAATTCAAATCAGAAGTTGCAGCTATT
GCTAGCGTGCAACACGTAAACCTCGTACGCCTTCTCGGGTATTGTGTCTC
GTCCACTGGTCCTCGTTTCCTCGTTTACGAGTTCATTCACAACGGCTCGT
TGGATAATTGGATTTTCCCCAAGAGGGAAATTTGTGGCCGACGTAATGGT
TGTTTGACATGGGATTCGAGATGTAGAGTTGCTCTTGATGTAGCGAGAGC
GCTTTCTTACTTGCACCGTGATTGTCGATCTTGTATACTGCATCTAGATG
TGAAGCCGGAAAATATACTTCTCGACCATGATTATCGCGCACTCGTGTCA
GATTTCGGGCTCTCGAAACTAAAAGGAAGAGACGAGAGTCGAGTTGTGAC
AACGATCCGGGGGACTAGAGGTTACTTGGCTCCTGAATGGCTCCTGGAGA
ATGGAGTTTCTGAGAAATGTGATGTGTACAGTTATGGAATGGTGCTGTTA
GAGATTATTGGTGGACGAAGAAACGTCCGTGTTCTCGAAAATGGCAACGG
TGAATCGAAAAAAAAGTTTCAATTCTTCCCAAAGATTGTGAGTGACAAAT
TTAAAGATGGGAAACTTATGGAAATTGTTGATCCAAGGTTAGTTGAAGAT
GGAGGGGTTAATGAGAGGCAATTAAAGAGACTGGTTTGTGCAGCTTTATG
GTGCATACAAGAGAAGGCCAAGCTTAGGCCAACCATGGCTACGGTCGTTG
AAATGCTCGAGGGGCGTGTACTGGTTGAAGACCCGCCCAACACACAAATG
CTTATAGTTGATTTGTTATCAATTGATGAAGAGGCGGCTGTTGTACTCCC
AGGCCTAGATTTGGTATAGT-AGAAAATTACCAAATGAATAGTGACATTC
CTTCCACGTCGAGTTACTCGGTTACAATGTCGGTACTCTCAGGCCGGTAG
>FRAX28_FRAEX38873_V2_000292250.1_R0
ATGGAAGACAAAAAAGCAAATTTGATTGCATTTTCCGTAGTAATTGTACT
CATAATTGTCATTATCATTGCTCGTTTATCTCTGAAACTTTCCAAGACAT
TTTTTCTGATATGTGGAGCTGATATTGCAGCAATTCTAGCAGTTTTTGCA
GTTATAGCGATCCGGGTTCGTTTCACCGCTCGACGAAAACAACTCGAACG
ACAGTTTGATTCAGATGGCCGAGAGCTTAGAATCGAGTACAGTTTTCTGA
GGAAAGTTGCCGGAGTTCCGATAAAGTTCCGGTATCGGGACTTGGAAGTA
GCCACGGATGGCTTTCGATCTATGGTAGGACGTGGGGCGTCGGCTTCAGT
CTTTAAAGGGATACTCAATGATGGGACGGCAGTGGCAGTAAAAAGGATCG
AAGGGGATGATCAAGGAGAGAAGGAATTCAAATCAGAAGTTGCAGCTATT
GCTAGCGTGCAACACGTAAACCTCGTACGCCTTCTCGGGTATTGTGTCTC
GTCCACTGGTCCTCGTTTCCTTGTTTACGAGTTCATTCACAACGGCTCGT
TGGATAATTGGATTTTCCCCAAGGGGGAAAGTTGTGGCCGACGTAATGGT
TGTTTGACATGGGATTCGAGATGTAGAGTTGCTCTTGATGTAGCGAGAGC
GCTTTCTTACTTGCATCGTGATTGTCGATCTTGTATACTGCATCTAGATG
TTAAGCCGGAAAATATACTTCTCGACCATGATTATCGCGCACTCGTGTCA
GATTTCGGGCTCTCGAAACTAAAAGGAAGAGACGAGAGTCGAGTTGTGAC
AACGATCCGGGGGACTAGAGGTTACTTGGCTCCTGAATGGATCCTGGAGA
ATGGAGTTTCTGAGAAATGTGATGTGTACAGTTATGGAATGGTGCTGTTA
GAGATTATTGGTGGACGAAGAAACGTCCGTGTTCTCGAAAATGGCAACGG
TGAATCGAAAAAAAAGTTTCAGTTCTTCCCAAAGATTGTGAGTGACAAAT
TTAAAGATGGGAAACTTATGGAAATTGTTGATCCAAGGTTAGTTGAAGAT
GGAGGGGTTAATGAGAGGCAATTAAAGAGACTGGTTTGTGCAGCTTTATG
GTGCATACAAGAGAAGGCCAAGCTTAGGCCAACCATGGCTACGGTCGTTG
AAATGCTCGAGGGGCGTGTACTGGTTGAAGACCCGCCCAACACACAAATG
CTTATAGTTGATTTGTTATCAATTGACGAAGAGGCGGCTGTTGTACTCCC
AGGCCTAGATTTGGTATAGT-AGAAAATTACCAAATGAATAGTGACATTC
CTTCCACGTCGAGTTACTCGGTTACAATGTCGGTACTCTCAGGCCGGTAG
>FRAX30_FRAEX38873_V2_000292250.1_R0
ATGGAAGACCAAAAAGCAAATTTGATTGCATTTTCCGTAGTAATTGTACT
CATAATTGTCATTATCATTGCTCGTTTATCTCTGAAACTTTCCAAGACAT
TTTTTCTGATATGTGGAGCTGATATTGCAGCAATTCTAGCAGTTTTTGCA
GTTATAGCGATCCGGATTCGTTTCACCGCTCGACGAAAACAACTCGAACG
ACAGTTTGATTCAGATGGCCGAGAGCTTAGAATCGAGTACAGTTTTCTGA
GGAAAGTTGCCGGAGTTCCGATAAAGTTCCGGTATCGGGACTTGGATGTA
GCCACGGATGGCTTTCGATCTATGGTAGGACGTGGGGCGTCGGCTTCAGT
CTTTAAAGGGATACTCAATGATGGGACGGCAGTGGCAGTAAAAAGGATCG
AAGGGGGTGATCAAGGAGAGAAGGAATTCAAATCAGAAGTTGCAGCTATT
GCTAGCGTGCAACACGTAAACCTCGTACGCCTTCTCGGGTATTGTGTCTC
GTCCACTGGTCCTCGTTTCCTTGTTTACGAGTTCATTCACAACGGCTCGT
TGGATAATTGGATTTTCCCCAAGGGGGAAAGTTGTGGCCGACGTAATGGT
TGTTTGACATGGGATTCGAGATGTAGAGTTGCTCTTGATGTAGCGAGAGC
GCTTTCTTACTTGCACCGTGATTGTCGATCTTGTATACTGCATCTAGATG
TGAAGCCGGAAAATATACTTCTCGACCATGATTATCGCGCACTCGTGTCA
GATTTCGGGCTCTCAAAACTAAAAGGAAGAGACGAGAGTCGAGTTGTGAC
AACGATCCGGGGGACTAGAGGTTACTTGGCTCCTGAATGGATCCTGGAGA
ATGGAGTTTCTGAGAAATGTGATGTGTACAGTTATGGAATGGTGCTGTTA
GAGATTATTGGTGGACGAAGAAACGTCCGTGTTCTCGAAAATGGCAACGG
TGAATCGAAAAAAAAGTTTCAATTCTTCCCAAAGATTGTGAGTGACAAAT
TTAAAGATGGGAAACTTATGGAAATTGTTGATCCAAGGTTAGTTGAAGAT
GGAGGGGTTAATGAGAGGCAATTAAAGAGACTGGTTTGTGCAGCTTTATG
GTGCATACAAGAGAAGGCCAAGCTTAGGCCAACCATGGCTACGGTCGTTG
AAATGCTCGAGGGGCGTGTACTGGTTGAAGACCCGCCCAACACACAAATG
CTTATAGTTGATTTGTTATCAATTGATGAAGAGGCGGCTGTTGTACTCCC
AGGCCTAGATTTGGTATAGT-AGAAAATTACGAAATGAATAGTGACATTC
CTTCCACGTCGAGTTACTCGGTTACAATGTCGGTACTCTCAGGCCGGTAG
>FRAX32_FRAEX38873_V2_000292250.1_R0
ATGGAAGACAAAAAAGCAAATTTGATTGCATTTTCCGTAGTAATTGTACT
CATAGTTGTCATTATCATTGCTCGTTTATCTCTGAAACTTTCCAAGACAT
TTTTTCTGATATGTGGAGCTGATATTGCAGCAATTCTAGCAGTTTTTGCA
GTTATAGCGATCCGGGTTCGTTTCACCGCTCGACGAAAACAACTCGAACG
ACAGTTTGATTCAGATGGCCGAGAGCTTAGAATCGAGTACAGTTTTCTGA
GGAAAGTTGCCGGAGTTCCGATAAAGTTCCGGTATCGGGACTTGGAAGTA
GCCACGGATGGCTTTCGATCTATGGTAGGACGTGGGGCGTCGGCTTCAGT
CTTTAAAGGGATACTCAATGACGGGACGGCAGTGGCAGTAAAAAGGATCG
AAGGGGGTGATCAAGGAGAGAAGGAATTCAAATCAGAAGTTGCAGCTATT
GCTAGCGTGCAACACGTAAACCTCGTACGCCTTCTCGGGTATTGTGTCTC
GTCCACTGGTCCTCGTTTCCTTGTTTACGAGTTCATTCACAACGGCTCGT
TGGATAATTGGATTTTCCCCAAGGGGGAAAGTTGTGGCCGACGTAATGGT
TGTTTGACATGGGATTCGAGATGTAGAGTTGCTCTTGATGTAGCGAGAGC
GCTTTCTTACTTGCACCGTGATTGTCGATCTTGTATACTGCATCTAGATG
TGAAGCCGGAAAATATACTTCTCGACCATGATTATCGCGCACTCGTGTCA
GATTTCGGGCTCTCAAAACTAAAAGGAAGAGACGAGAGTCGAGTTGTGAC
AACGATCCGGGGGACTAGAGGTTACTTGGCTCCTGAATGGATCCTGGAGA
ATGGAGTTTCTGAGAAATGTGATGTGTACAGTTATGGAATGGTGCTGTTA
GAGATTATTGGTGGACGAAGAAACGTCCGTGTTCTCGAAAATGGCAACGG
TGAATCGAAAAAAAAGTTTCAATTCTTCCCAAAGATTGTGAGTGACAAAT
TTAAAGATGGGAAACTTATGGAAATTGTTGATCCAAGGTTAGTTGAAGAT
GGAGGGGTTAATGAGAGGCAATTAAAGAGACTGGTTTGTGCAGCTTTATG
GTGCATACAAGAGAAGGCCAAGCTTAGGCCAACCATGGCTACGGTCGTTG
AAATGCTCGAGGGGCGTGTACTGGTTGAAGACCCGCCCAACACACAAATG
CTTATAGTTGATTTGTTATCAATTGATGAAGAGGCGGCTGTTGTACTCCC
AGGCCTAGATTTGGTATAGT-AGAAAATTACCAAATGAATAGTGACATTC
CTTCCACGTCGAGTTACTCGGTTACAATGTCGGTACTCTCAGGCCGGTAG
>FRAX16_FRAEX38873_V2_000292250.1_R0
ATGGAAGACAAAAAAGCAAATTTGATTGCCTTTTCCATAGTAATTGTACT
CATAATTGTCATTATCATTGCTCGTCTATCTCTGAAACTTTCCAAGACAT
TTTTTCTGATATGTGGAGCTGATATTGCAGCAATTCTAGCAGTTTTTGCA
GTTATAGCGATCCGGGTTCGTTTTACTGCTCGACGAAAACAACTCGAACG
ACAGTTTGATTCAGAAGGCCGAGAGCTTCGAATCGAGTACAGTTTTCTGA
GGAAAGTTGCCGGAGTTCCGATAAAGTTCCGGTATCGGGACTTGGAAGTA
GCCACGGATGGCTTTCGATCTATGGTAGGACGTGGGGCGTCAGCTGCAGT
CTTTAAAGGGATACTCAATGATGGGACGGCAGTGGCAGTAAAAAGGATCG
AAGGGGATGATCAAGGAGAGAAGGAATTCAAATCAGAAGTTGCAGCTATT
GCTAGCGTGCAACACGTAAACCTCGTACGCCTTCTCGGGTATTGTGTCCA
GTCCACTGGTCCTCGTTTCCTTGTTTACGAGTTCATTCATAACGGCTCGT
TGGATAATTGGATTTTCCCCAAGGGGGAAAGATTTGGTCGACGTAGTGGT
TGTTTGACATGGGATTCGAGATGTAGAGTTGCTCTTGATGTAGCGAGAGC
GCTTTCTTACTTGCACCACGATTGTCGATCTTGTATACTGCATCTAGATG
TGAAGCCGGAAAATATACTTCTCGACCATGATTATCGCGCACTTGTGTCA
GATTTCGGGCTCTCGAAACTAAAAGGAAGAGACGAGAGTCGAGTTGTGAC
AACGATCCGGGGGACTAGAGGTTACTTGGCTCCTGAATGGCTCCTGGAGA
ATGGAGTTTCTGAGAAATGTGATGTGTACAGTTATGGAATGGTGCTGTTA
GAGATTATTGGTGGACGAAGAAACGTCGGTGTTCTTGAAAATGGCAACGG
TGAATCGAAAAAAAAGTTTCAATTCTTCCCGAAGATTGTGAGTGACAAAT
TTAAAGATGGGAAACTTATGGAAATTGTTGATCCAAGGTTGGTTGAAGAT
GGAGGGGTTAATGAGAGGCAATTAAAGAGACTGGTTTGTGCAGCTTTATG
GTGCATACAAGAGAAGGCCAAGCTTAGGCCAAGCATGGCTACGGTCGTTG
AAATGCTTGAGGGGCGTGTACCGGTTGAAGACCCGCCCAACACACAAATG
CTTATAGTTGATTTGTTATCAATTGATGAAGAGGCAGCTGTTGTACTCCC
AGGCCTAGATTTGGTGTAGT-AGAAAATTACCAAATGAATAGTGACATTC
CTTCCACGTCGAGTTACTCGGTTACAATGTCGATACTCTCAGGCCGGTAG
>FRAX23_FRAEX38873_V2_000292250.1_R0
ATGGAAGACAAAAAAGCAAATTTGATTGCCTTTTCCATTGTAATTGTACT
CATAATTGTCATTATCATTGCTCGTCTATCTCTGAAACTTTCCAAGACAT
TTTTTCTGATATGTGGAGCTGATATTGCAGCAATTCTAGCAGTTTTTGCA
GTTATAGCGATCCGGGTTCGTTTTACCGCTCGACGAAAACAACTCGAACG
ACAGTTTGATTCAGAAGGCCGAGAGCTTCGAATCGAGTACAGTTTTCTGA
GGAAAGTTGCCGGAGTTCCGATAAAGTTCCGGTATCGGGACTTGGAAGTA
GCCACGGATGGCTTTCGATCTATGGTAGGACGTGGGGCGTCAGCTTCAGT
CTTTAAAGGGATACTCAATGATGGGACGGCAGTGGCAGTAAAAAGGATCG
AAGGGGATGATCAAGGAGAGAAGGAATTCAAATCAGAAGTCGCAGCTATT
GCTAGCGTGCAACACGTAAACCTCGTACGCCTTCTCGGGTATTGTGTCCA
GTCCACTGGTCCTCGTTTCCTTGTTTACGAGTTCATTCATAACGGCTCGT
TGGATAATTGGATTTTCCCCAAGGGGGAAAGATTTGGTCGACGTAGTGGT
TGTTTGACATGGGATTCGAGATGTAGAGTTGCTCTTGATGTAGCGAGAGC
GCTTTCTTACTTGCACCACGATTGTCGATCTTGTATACTGCATCTAGATG
TGAAGCCGGAAAATATACTTCTCGACCATGATTATCGCGCACTCGTGTCA
GATTTCGGGCTCTCGAAACTAAAAGGAAGAGACGAGAGTCGAGTTGTGAC
AACGATCCGGGGGACTAGAGGTTACTTGGCTCCTGAATGGCTCCTGGAGA
ATGGAGTTTCCGAGAAATGTGATGTGTACAGTTATGGAATGGTGCTGTTA
GAGATTATTGGTGGACGAAGAAATGTCCGTGTTCTTGAAAATGGCAACGG
TGAATCGAAAAAAAAGTTTCAATACTTCCCAAAGATTGTGAGTGACAAAT
ATAAAGATGGGAAACTTACGGAAATTGTTGATCCAAGGTTGGTTGAAGAT
GGAGGGGTTAATGAGAGGCAATTAAAGAGACTGGTTTGTGCAGCTTTATG
GTGCATACAAGAGAAGGCCAAGCTTAGGCCAAGCATGGCTACGGTCGTTG
AAATGCTTGAGGGGCGTGTACCGGTTGAAGACCCGCCCAACACACAAATG
CTTATAGTTGATTTGTTATCAATTGATGAAGATGCAGCTGTCGTACTCCC
AGGCCTAGATTTGGTATAGT-GGAAAATTACCAAATGAATAGTGACATTC
CTTCCACGTCGAGTTACTCGGTTACAATGTCGATACTCTCAGGTCGGTAG
>FRAX06_FRAEX38873_V2_000292250.1_R0
ATGGAAGACAAAAAAGCAAATTTGATTGCCTTTTCCATTGTAATTGTACT
CATAATTGTCATTATCATTGCTCGTCTTTCTCTGAAACTTTCCAAGACAT
TTTTTCTGATATGTGGAGCTGATATTGCAGCAATTCTAGCAGTTTTTGCA
GTTATAGCGATCCGGGTTCGTTTTACCGCTCGACGAAAACAACTCGAACG
ACAGTTCGATTCAGAAGGCCGAGAGCTTCGAATCGAGTACAGTTTTCTGA
GGAAAGTTGCCGGAGTTCCGATAAAGTTCAGGTATCGGGACTTGGAAGTA
GCCACGGATGGCTTTCGATCTATGGTAGGACGTGGGGCGTCAGCTGCAGT
CTTTAAAGGGATCCTCAATGATGGGACGGCAGTGGCAGTAAAAAGGATCG
AAGGGGATGATCAAGGAGAGAAGGAATTCAAATCAGAAGTCGCAGCTATT
GCTAGCGTGCAACACGTAAACCTCGTACGCCTTCTCGGGTATTGTGTCCA
GTCCACTGGTCCTCGTTTCCTTGTTTACGAGTTCATTCATAACGGCTCGT
TGGATAATTGGATTTTCCCCAAGGGGGAAAGATTTGGTCGACGTAGTGGT
TGTTTGACATGGGATTCGAGATGTAGAGTTGCTCTTGATGTAGCGAGAGC
ACTTTCTTACTTGCACCACGATTGTCGATCTTGTATACTGCATCTAGATG
TGAAGCCGGAAAATATACTTCTCGACCATGATTATCGCGCACTCGTGTCA
GATTTCGGGCTCTCGAAACTAAAAGGAAGAGACGAGAGTCGAGTTGTGAC
AACGATCCGGGGGACTAGAGGTTACTTGGCTCCTGAATGGCTCCTGGAGA
ATGGAGTTTCTGAGAAATGTGATGTGTACAGTTATGGAATGGTGCTGTTA
GAGATTATCGGTGGACGAAGAAACGTCCGTGTTCTCGAAAATGGCAACGG
TGAATCGAAAAAAAAGTTTCAATACTTCCCAAAGATTGTGAGTGACAAAT
TTAAAGATGGGAAACTTATGGAAATTGTTGATCCAAGGTTGGTTGAAGAT
GGAGGGGTTAATGAGAGGCAATTAAAGAGACTGGTTTGTGCAGCTTTATG
GTGCATACAAGAGAAGGCCAAGCTTAGGCCAAGCATGGCTACGGTCGTTG
AAATGCTTGAGGGGCGTGTACCGGTTGAAGACCCGCCCAACACACAAATG
CTTATAGTTGATTTGTTATCAATTGATAAAGATGCAGCTGTTGTACTCCC
AGGCCTAGATTTGGTATAGT-GGAAAATTACCAAATGAATAGTGACATTC
CTTCCACGTCGAGTTACTCGGTTACAATGTCGATACTCTCAGGCCGGTAG
>FRAEX38873_v2_000292250
ATGGAAGACAAAAAAGCAAATTTGATTGCCTTTTCCATTGTAATTGTACT
CATAATTGTCATTATCATTGCTCGTGTATCTCTGAAACTTTCCAAGACAT
TTTTTCTGATATGTGGAGCTGATATTGCAGCAATTCTAGCAGTTTTTGCA
GTTATAGCGATCCGGGTTCGTTTTACCGCTCGACGAAAACAACTCGAACG
ACAGTTTGATTCAGAAGGCCGAGAGCTTCGAATCGAGTACAGTTTTCTGA
GGAAAGTTGCCGGAGTTCCGATAAAGTTCCGGTATCGGGACTTGGAAGTA
GCCACGGATGGCTTTCGATCTATGGTGGGACGTGGGGCGTCAGCTGCAGT
CTTTAAAGGGATACTCAATGATGGGACGGCAGTGGCAGTAAAAAGGATCG
AAGGGGATGATCAAGGAGAGAAGGAATTCAAATCAGAAGTTGCAGCTATT
GCTAGCGTGCAACACGTAAACCTCGTACGCCTTCTCGGGTTTTGTGTCCA
GTCCACTGGTCCTCGTTTCCTTGTTTACGAGTTCATTCATAACGGCTCGT
TGGATAATTGGATTTTCCCCAAGGGGGAAAGATTTGGTCGACGTAGTGGT
TGTTTGACATGGGATTCGAGATGTAGAGTTGCTCTTGATGTAGCGAGAGC
GCTTTCTTACTTGCACCACGATTGTCGATCTTGTATACTGCATCTAGATG
TGAAGCCGGAAAATATACTTCTCGACCATGATTATCGCGCACTCGTGTCA
GATTTCGGGCTCTCGAAACTAAAAGGAAGAGACGAGAGTCGAGTTGTGAC
AACGATCCGGGGGACTAGAGGTTACTTGGCTCCTGAATGGCTCCTGGAGA
ATGGAGTATCTGAGAAATGTGATGTGTACAGTTATGGAATGGTGCTGTTA
GAGATTATTGGTGGACGAAGAAACGTCCGTGTTCTCGAAAATGGCAACGG
TGAGTCGAAAAAAAAGTTTCAATACTTCCCAAAGATTGTGAGTGACAAAT
TTAAAGATGGGAAACTTATGGAAATTGTTGATCCAAGGTTGGTTGAAGAT
GGAGGGGTTAATGAGAGGCAATTAAAGAGACTGGTTTGTGCAGCTTTATG
GTGCATACAAGAGAAGGCCAAGCTTAGGCCAAGCATGGCTACGGTCGTTG
AAATGCTTGAGGGGCGTGTACCGGTTCAAGACCCGCCCAACACACAAATG
CTTATAGTTGATTTGTTATCAATTGATGAAGAGGCAGCTGTTGTACTCCC
AGGCCTAGATTTGGTATAGTGGGAAAATTACCAAATGAATAG--------
--------------------------------------------------
>FRAX01_FRAEX38873_V2_000292250.1_R0
ATGGAAGACAAAAAAGCAAATTTGATTGCCTTTTCCGTTGTAATTGTACT
CATAATTGTCATTATCATTGCTCGTCTATCTCTGAAACTTTCCAAGACGT
TTTTTCTGATATGTGGAGCTGATATTGCAGCAATTCTAGCAGTTTTTGCA
GTTATAGCGATCCGGGTTCGTTTTACCGCTCGACGAAAACAACTCGAACG
ACAGTTCGATTCAGAAGGCCGAGAGCTTCGAATCGAGTACAGTTTTCTGA
GGAAAGTTGCCGGAGTTCCGATAAAGTTCCGGTATCGGGACTTGGAAGTA
GCCACGGATGGCTTTCGATCTATGGTAGGACGTGGGGCGTCAGCTGCAGT
CTTTAAAGGGATACTCAATGATGGGACGGCAGTGGCAGTAAAAAGGATCG
AAGGGGATGATCAAGGAGAGAAGGAATTCAAATCAGAAGTCGCAGCTATT
GCTAGCGTGCAACACGTAAACCTCGTACGCCTTCTCGGGTATTGTGTCCA
GTCCACTGGTCCTCGTTTCCTTGTTTACGAGTTCATTCATAACGGCTCGT
TGGATAATTGGATTTTCCCCAAGGGGGAAAGATTTGGTCGACGTAGTGGT
TGTTTGACATGGGATTCGAGATGTAGAGTTGCTCTTGATGTAGCGAGAGC
GCTTTCTTACTTGCACCACGATTGTCGATCTTGTATACTGCATCTAGATG
TGAAGCCGGAAAATATACTTCTCGACCATGATTATCGCGCACTCGTGTCA
GATTTCGGGCTCTCGAAACTAAAAGGAAGAGACGAGAGTCGAGTTGTGAC
AACGATCCGGGGGACTAGAGGTTACTTGGCTCCTGAATGGCTCCTGGAGA
ATGGAGTTTCTGAGAAATGTGATGTGTACAGTTATGGAATGGTGCTGTTA
GAGATTATTGGTGGACGAAGAAACGTCCGTGTTCTTGAAAATGGCAACGG
CGAATCGAAAAAAAAGTTTCAATACTTCCCAAAGATTGTGAGTGACAAAT
TTAAAGATGGGAAACTTATGGAAATTGTTGATCCAAGGTTGGTTGAAGAT
GGAGGGGTTAATGAGAGGCAATTAAAGAGACTGGTTTGTGCAGCTTTATG
GTGCATACAAGAGAAGGCCAAGCTTAGGCCAAGCATGGCTACGGTCGTTG
AAATGCTTGAGGGGCGTGTACCGGTTCAAGACCCGCCCAACACACAAATG
CTTATAGTTGATTTGTTATCAATTGATGAAGAGGCAGCTGTTGTACTCCC
AGGCCTAGATTTGGTATAGT-GGAAAATTACCAAATGAATAGTGACATTC
CTTCCACGTCGAGTTACTCGGTTACAATGTCGATACTCTCAGGCCGGTAG
>FRAX15_FRAEX38873_V2_000292250.1_R0
ATGGAAGACAAAAAAGCAAATTTGATTGCCTTTTCCGTTGTAATTGTACT
CATAATTGTCATTATCATTGCTCGTCTATCTCTGAAACTTTCCAAGACGT
TTTTTCTGATATGTGGAGCTGATATTGCAGCAATTCTAGCAGTTTTTGCA
GTTATAGCGATCCGGGTTCGTTTTACCGCTCGACGAAAACAACTCGAACG
ACAGTTCGATTCAGAAGGCCGAGAGCTTCGAATCGAGTACAGTTTTCTGA
GGAAAGTTGCCGGAGTTCCGATAAAGTTCCGGTATCGGGACTTGGAAGTA
GCCACGGATGGCTTTCGATCTATGGTAGGACGTGGGGCGTCAGCTGCAGT
CTTTAAAGGGATACTCAATGATGGGACGGCAGTGGCAGTAAAAAGGATCG
AAGGGGATGATCAAGGAGAGAAGGAATTCAAATCAGAAGTCGCAGCTATT
GCTAGCGTGCAACACGTAAACCTCGTACGCCTTCTCGGGTATTGTGTCCA
GTCCACTGGTCCTCGTTTCCTTGTTTACGAGTTCATTCATAACGGCTCGT
TGGATAATTGGATTTTCCCCAAGGGGGAAAGATTTGGTCGACGTAGTGGT
TGTTTGACATGGGATTCGAGATGTAGAGTTGCTCTTGATGTAGCGAGAGC
GCTTTCTTACTTGCACCACGATTGTCGATCTTGTATACTGCATCTAGATG
TGAAGCCGGAAAATATACTTCTCGACCATGATTATCGCGCACTCGTGTCA
GATTTCGGGCTCTCGAAACTAAAAGGAAGAGACGAGAGTCGAGTTGTGAC
AACGATCCGGGGGACTAGAGGTTACTTGGCTCCTGAATGGCTCCTGGAGA
ACGGAGTTTCTGAGAAATGTGATGTGTACAGTTATGGAATGGTGCTGTTA
GAGATTATTGGTGGACGAAGAAACGTCCGTGTTCTCGAAAATGGCAACGG
TGAATCGAAAAAAAAGTTTCAATACTTCCCAAAGATTGTGAGTGACAAAT
TTAAAGATGGGAAACTTATGGAAATTGTTGATCCAAGGTTGGTTGAAGAT
GGAGGGGTTAATGAGAGGCAATTAAAGAGACTGGTTTGTGCAGCTTTATG
GTGCATACAAGAGAAGGCCAAGCTTAGGCCAAGCATGGCTACGGTCGTTG
AAATGCTCGAGGGGCGTGTACCGGTTGAAGACCCGCCCAACACACAAATG
CTTATAGTTGATTTGTTATCAATTGATGAAGAGGCAGCTATTGTACTCCC
AGGCCTAGATTTGGTATAGT-AGAAAATTACCAAATGAATAGTGACATTC
CTTCCACGTCGAGTTACTCGGTTACAATGTCGATACTCTCAGGCCGGTAG
>FRAX03_FRAEX38873_V2_000292250.1_R0
ATGGAAGACAAAAAAGCAAATTTGATTGCATTTTCCATAGTAATTGTACT
CATAATTGTCATTATCATTGCTCGTTTATCTCTGAAACTCTCCAAGACAT
TTTTTCTGATATGTGGAGCTGATATTGCAGCAATTCTAGCAGTTTTTGCA
GTTATAGCGATCCGGGTTCGTTTTACTGCTCGACGAAAACAACTCGAACA
ACGGTTCGATTCAGAAGGCCGAGAGCTTCGAATCGAGTACAGTTTTCTGA
GGAAAGTTGCTGGAGTTCCGACAAAGTTCCGGTATCGGGACTTGGAAGTA
GCCACGGATGGCTTTCGATCTATGGTAGGACGTGGGTCGTCGGCTTCAGT
CTTTAAAGGGATACTCAGTGATGGGACAGCAGTTGCAGTAAAAAGGATCG
AAGGGGATGATCGAGGAGAGAAGGAATTCAAATCAGAAGTTGCAGCTATT
GCTAGCGTGCAACACGTAAACCTCGTACGCCTTCTCGGGTATTGTGTCCA
GTCGACTGGTCCTCGTTTCATTGTTTACGAGTTCATTCATAACGGCTCGT
TGGATAATTGGATTTTCCCCAAGGGGGAAAGGGGTGGTCAACGCAGTGGT
TGTTTGACATGGGATTCGAGATGTAGAGTTGCTCTTGATGTAGCGAGAGC
GCTTTCTTACTTGCACCACGATTGTCGATCTTGTATACTGCATCTAGATG
TGAAGCCGGAAAATATACTTCTCGACCATGATTATCGTGCACTCGTGTCA
GACTTTGGGCTCTCGAAAATAAAAGGAAGAGACGAGAGTCGAGTTGTGAC
AACGATCCGGGGGACTAGAGGTTACTTGGCTCCTGAATGGCTCCTGGAGA
ATGGAGTTTCTGAGAAATGTGATGTGTACAGTTATGGAATGGTGCTGTTA
GAGATTATTGGTGGACGAAGAAACGTCCGTGTTCTCGAAAATGGCAATGG
TGAGTCGAAAAAAAAGTTTCAATACTTCCCAAAGATTGTGAGCGACAAAT
TTAAAGATGGGAAACTTATGGAAATTGTTGATCCAAGGTTGGTTGAAGAT
GGAGGGATTAATGAGAGGCAATTAAAGAGACTGGTTTGTGCAGCTTTATG
GTGCATACAAGAGAAGGCCAAGCTTAGGCCAAGCATGGCTATGGTCGTTG
AAATGCTCGAGGGGCGTGTACCGGTCGAAGACCCGCCCAACACACAAATG
CTTATTGTTGATTTCTTATCAATTGATGAAGAGGCAGCTGTTGTACTCCC
AAGCCTAGATTTGGTATAGT-GGAAAATTACCAAATGAATAGTGACATTC
CTTCCACGTCAAGTTACTCGGTTACAATGTCGATACTCTCAGGCCGGTAG
>FRAX14_FRAEX38873_V2_000292250.1_R0
ATGGAAGACAAAAAAGCAAATTTGATTGCATTTTCCATAGTAATTGTACT
CATAATTGTCATTATCATTGCTCGTTTATCTCTGAAACTTTCCAAGACAT
TTTTTCTGATATGTGGAGCTGATATTGCAGCAATTCTAGCAGTTTTTGCA
GTTATAGCGATCCGGGTTCGTTTTACTGCTCGACGAAAACAACTCGAACA
ACGGTTCGATTCAGAAGGCCGAGAGCTTCGAATCGAGTACAGTTTTCTGA
GGAAAGTTGCTGGAGTTCCGACAAAGTTCCGGTATCGGGACTTGGAAGTA
GCCACGGATGGCTTTCGATCTATGGTAGGACGTGGGTCGTCGGCTTCAGT
CTTTAAAGGGATACTCAGTGATGGGACGGCAGTTGCAGTAAAAAGGATCG
AAGGGGATGATCGAGGAGAGAAGGAATTCAAATCAGAAGTTGCAGCTATT
GCTAGCGTGCAACACGTAAACCTCGTACGCCTTCTCGGGTATTGTGTCCA
GTCGACTGGTCCTCGTTTCATTGTTTACGAGTTCATTCATAACGGCTCGT
TGGATAATTGGATTTTCCCCAAGGGGGAAAGGGGTGGTCAACGTAGTGGT
TGTTTGACATGGGATTCGAGATGTAGAGTTGCTCTTGATGTAGCGAGAGC
GCTTTCTTACTTGCACCACGATTGTCGATCTTGTATACTGCATCTAGATG
TGAAGCCGGAAAATATACTTATCGACCATGATTATCGTGCACTCGTGTCA
GATTTTGGGCTCTCGAAAATAAAAGGAAGAGACGAGAGTCGAGTTGTGAC
AACGATCCGGGGGACTAGAGGTTACTTGGCTCCTGAATGGCTCCTGGAGA
ATGGAGTTTCTGAGAAATGTGATGTGTACAGTTATGGAATGGTGCTGTTA
GAGATTATTGGTGGACGAAGAAACGTCCGTGTTCTCGAAAATGGCAATGG
TGAGTCGAAAAAAAAGTTTCAATACTTCCCAAAGATCGTGAGCGACAAAT
TTAAAGCTGGGAAACTTATGGAAATTGTTGATCCAAGGTTGGTTGAAGAT
GGAGGGATTAATGAGAGGCAATTAAAGAGACTGGTTTGTGCAGCTTTATG
GTGCATACAAGAGACGGCCAAGCTTAGGCCAAGCATGGCTATGGTCGTTG
AAATGCTCGAGGGGCGTGTACCGGTCGAAGACCCTCCCAACACACAAATG
CTTATTGTTGATTTCTTATCAATTGATGAAGAGGCAGCTGTTGTACTCCC
AAGCCTAGATTTGGTATAGT-GGAAAATTACCAAATGAATAGTGACATTC
CTTCCACGTCAAGTTACTCGGTTACAATGTCGATACTCTCAGGCCGGTAG
>FRAX26_FRAEX38873_V2_000292250.1_R0
ATGGAAGACAAAAAAGCAAATTTGATTGCATTTTCCATAGTAATTGTACT
CATAATTGTCATTATCATTGCTCGTTTATCTCTGAAACTTTCCAAGACAT
TTTTTCTGATATGTGGAGCTGATATTGCAGCAATTCTAGCAGTTTTTGCA
GTTATAGCGATCCGGGTTCGTTTTACTGCTCGACGAAAACAACTCGAACA
ACGGTTCGATTCAGAAGGCCGAGAGCTTCGAATCGAGTACAGTTTTCTGA
GGAAAGTTGCTGGAGTTCCGACAAAGTTCCGGTATCGGGACTTGGAAGTA
GCCACGGATGGCTTTGGATCTATGGTAGGACGTGGGTCGTCGGCTTCAGT
CTTTAAAGGGATACTCAGTGATGGGACGGCAGTTGCAGTAAAAAGGATCG
AAGGGGATGATCGAGGAGAGAAGGAATTCAAATCAGAAGTTGCAGCTATT
GCTAGCGTGCAACACGTAAACCTCGTACGCCTTCTCGGGTATTGTGTCCA
GTCGACTGGTCCTCGTTTCATTGTTTACGAGTTCATTCATAACGGCTCGT
TGGATAATTGGATTTTCCCCAAGGGGGAAAGGGGTGGTCAACGTAGTGGT
TGTTTGACATGGGATTCGAGATGTAGAGTTGCTCTTGATGTAGCGAGAGC
GCTTTCTTACTTGCACCACGATTGTCGATCTTGTATACTGCATCTAGATG
TGAAGCCGGAAAATATACTTATCGACCATGATTATCGTGCACTCGTGTCA
GATTTTGGGCTCTCGAAAATAAAAGGAAGAGACGAGAGTCGAGTTGTGAC
AACGATCCGGGGGACTAGAGGTTACTTGGCTCCTGAATGGCTCCTGGAGA
ATGGAGTTTCTGAGAAATGTGATGTGTACAGTTATGGAATGGTGCTGTTA
GAGATTATTGGTGGACGAAGAAACGTCCGTGTTCTCGAAAATGGCAATGG
TGAGTCGAAAAAAAAGTTTCAATACTTCCCAAAGATTGTGAGCGACAAAT
TTAAAGATGGGAAACTTATGGAAATTGTTGATCCAAGGTTGGTTGAAGAT
GGAGGGATTAATGAGAGGCAATTAAAGAGACTGGTTTGTGCAGCTTTATG
GTGCATACAAGAGAAGGCCAAGCTTAGGCCAAGCATGGCTATGGTCGTTG
AAATGCTCGAGGGGCGTGTACCGGTCGAAGACCCTCCCAACACACAAATG
CTTATTGTTGATTTCTTATCAATTGATGAAGAGGCAGCTGTTGTACTCCC
AAGCCTAGATTTGGTATAGT-GGAAAATTACCAAATGAATAGTGACATTC
CTTCCACGTCAAGTTACTCGGTTACAATGTCGATACTCTCAGGCCGGTAG
>FRAX05_FRAEX38873_V2_000292250.1_R0
--------------------------------------------------
--------------------------------------------------
--------------------------------------------------
--------------------------------------------------
--------------------------------------------------
--------------------------------------------------
---------------------ATGGTAGGACGTGGGTCGTCGGCTTCAGT
CTTTAAAGGGATACTCAGTGATGGGACGGCAGTTGCAGTAAAAAGGATCG
AAGGGGATGATCGAGGAGAGAAGGAATTCAAATCAGAAGTTGCAGCTATT
GCTAGCGTGCAACACGTAAACCTCGTACGCCTTCTCGGGTATTGTGTCCA
GTCGACTGGTCCTCGTTTCATTGTTTACGAGTTCATTCATAACGGCTCGT
TGGATAATTGGATTTTCCCCAAGGGGGAAAGGGGTGGTCAACGTAGTGGT
TGTTTGACATGGGATTCGAGATGTAGAGTTGCTCTTGATGTAGCGAGAGC
GCTTTCTTACTTGCACCACGATTGTCGATCTTGTATACTGCATCTAGATG
TGAAGCCGGAAAATATACTTCTCGACCAAGATTATCGTGCACTCGTGTCA
GATTTCGGGCTCTCGAAAATAAAAGGAAGAGACGAGAGTCGAGTTGTGAC
AACGATCCGGGGGACTAGAGGTTACTTGGCTCCTGAATGGCTCCTGGAGA
ATGGAGTTTCTGAGAAATGTGATGTGTACAGTTATGGAATGGTGCTGTTA
GAGATTATTGGTGGACGAAGAAACGTCCGTGTTCTCGAAAATGGCAATGG
TGAGTCGAAAAAAAAGTTTCAATACTTCCCAAAGATTGTGAGCGACAAAT
TTAAAGATGGGAAACTTATGGAAATTGTTGATCCAAGGTTGGTTGAAGAT
GGAGGGGTTAATGAGAGGCAATTAAAGAGACTGGTTTGTGCAGCTTTATG
GTGCATACAAGAGAAGGCCAAGCTTAGGCCAAGCATGGCTATGGTTGTTG
AAATGCTCGAGGGGCGTGTACCGGTTGAAGACCCGCCCAACACACAAATG
CTTATTGTTGATTTGTTAACAATTGGTGAAGAGGCAGCTGTTGTACTCCC
AGGCCTAGATTTGGTATAGT-GGAAAATTACCAAATGAATAGTGACATTC
CTTCCACGTCAAGTTACTCGGTTACAATGTCGATACTCTCAGGCCGGTAG
>FRAX09_FRAEX38873_V2_000292250.1_R0
ATGGAAGACAAAAAAGCAAATTTGATTGCATTTTCCATAGTAATTGTACT
CATAATTGTCATTATCATTGCTCGTTTATCTCTGAAACTTTCCAAGACAT
TTTTTCTGATATGTGGAGCTGATATTGCAGCAATTCTAGCAGTTTTTGCA
GTTATAGCGATCCGGGTTCGTTTTACTGCTCGACGAAAACAACTCGAACA
ACGGTTCGATTCAGAAGGCCGAGAGCTTCGAATCGAGTACAGTTTTCTGA
GGAAAGTTGCTGGAGTTCCGACAAAGTTCCGGTATCGGGACTTGGAAGTA
GCCACGGATGGCTTTCGATCTATGGTAGGACGTGGGTCGTCGGCTTCAGT
CTTTAAAGGGATACTCAGTGATGGGACGGCAGTTGCAGTAAAAAGGATCG
AAGGGGATGATCGAGGAGAGAAGGAATTCAAATCAGAAGTTGCAGCTATT
GCTAGCGTGCAACACGTAAACCTCGTACGCCTTCTCGGGTATTGTGTCCA
GTCGACTGGTCCTCGTTTCATTGTTTACGAGTTCATTCATAACGGCTCGT
TGGATAATTGGATTTTCCCCAAGGGGGAAAGGGGTGGTCAACGTAGTGGT
TGTTTGACATGGGATTCGAGATGTAGAGTTGCTCTTGATGTAGCGAGAGC
GCTTTCTTACTTGCACCACGATTGTCGATCTTGTATACTGCATCTAGATG
TGAAGCCGGAAAATATACTTCTCGACCATGATTATCGTGCACTCGTGTCA
GATTTCGGGCTCTCGAAAATAAAAGGAAGAGACGAGAGTCGAGTTGTGAC
AACGATCCGGGGGACTAGAGGTTACTTGGCTCCTGAATGGCTCCTGGAGA
ATGGAGTTTCTGAGAAATGTGATGTGTACAGTTATGGAATGGTGCTGTTA
GAGATTATTGGTGGACGAAGAAACGTCCGTGTTCTCGAAAATGGCAATGG
TGAGTCGAAAAAAAAGTTTCAATACTTCCCAAAGATTGTGAGTGACAAAT
TTAAAGATGGGAAACTTATGGAAATTGTTGATCCAAGGTTGGTTGAAGAT
GGAGGGGTTAATGAGAGGCAATTAAAGAGACTGGTTTGTGCAGCTTTATG
GTGCATACAAGAGAAGGCCAAGCTTAGGCCAAGCATGGCTATGGTTGTTG
AAATGCTCGAGGGGCGTGTACCGGTTGAAGACCCGCCCAACACACAAATG
CTTATTGTTGATTTGTTAACAATTGGTGAAGAGGCAGCTGTTGTACTCCC
AGGCCTAGATTTGGTATAGT-GGAAAATTACCAAATGAATAGTGACATTC
CTTCCACGTCGAGTTACTCGGTTACAATGTCGACACTCTCAGGCCGGTAG
>FRAX10_FRAEX38873_V2_000292250.1_R0
ATGGAAGACAAAAAAGCAAATTTGATTGCATTTTCCATAGTAATTGTACT
CATAATTGTCATTATCATTGCTCGTTTATCTCTGAAACTTTCCAAGACAT
TTTTTCTGATATGTGGAGCTGATATTGCAGCAATTCTAGCAGTTTTTGCA
GTTATAGCGATCCGGGTTCGTTTTACTGCTCGACGAAAACAACTCGAACA
ACAGTTCGATTCAGAAGGCCGAGAGCTTCGAATCGAGTACAGTTTTCTGA
GGAAAGTTGCTGGAGTTCCGACAAAGTTCCGGTATCGGGACTTGGAAGTA
GCCACGGATGGCTTTCGATCTATGGTAGGACGTGGGTCGTCGGCTTCAGT
CTTTAAAGGGATACTCAGTGATGGGACGGCAGTTGCAGTAAAAAGGATTG
AAGGGGATGATCGAGGAGAGAAGGAATTCAAATCAGAAGTTGCAGCTATT
GCTAGCGTGCAACACGTAAACCTCGTACGCCTTCTCGGGTATTGTGTCCA
GTCGACTGGTCCTCGTTTCATTGTTTACGAGTTCATTCATAACGGCTCGT
TGGATAATTGGATTTTCCCCAAGGGGGAAAGGGGTGGTCAACGTAGTGGT
TGTTTGACATGGGATTCGAGATGTACAGTTGCTCTTGATGTAGCGAGAGC
GCTTTCTTACTTGCACCACGATTGTCGATCTTGTATACTGCATCTAGATG
TGAAGCCAGAAAATATACTTCTCGACCATGATTATCGTGCACTCGTGTCA
GATTTCGGGCTCTCGAAAATAAAAGGAAGAGACGAGAGTCGAGTTGTGAC
AACGATCCGGGGGACTAGAGGTTACTTGGCTCCTGAATGGCTCCTGGAGA
ATGGAGTTTCTGAGAAATGTGATGTGTACAGTTATGGAATGGTGCTGTTA
GAGATTATTGGTGGACGAAGAAACGTCCGTGTTCTCGAAAATGGCAATGG
TGAGTCGAAAAAAAAGTTTCAATACTTCCCAAAGATTGTGAGTGACAAAT
TTAAAGATGGGAAACTTATGGAAATTGTTGATCCAAGGTTGGTTGAAGAT
GTAGGGGTTAATGAGAGGCAGTTAAAGAGACTGGTTTGTGCAGCTTTATG
GTGCATACAAGAGAAGGCCAAGCTTAGGCCAAGCATGGCTATGGTCGTTG
AAATGCTCGAGGGGCGTGTACCGGTCGAAGACCCGCCCAACACACAAATG
CTTATTGTTGATTTGTTATCAATTGATGAGGAGGCAGCTGTTGTACTCCC
AGGCCTAGATTTGGTATAGT-GGAAAATTACCAAATGAATAGTGACATTC
CTTCCACGTCGAGTTACTCGGTTACAATGTCGATACTCTCAGGCCGGTAG
>FRAX13_FRAEX38873_V2_000292250.1_R0
ATGGAAGACAAAAAAGCTAATTTGATTGCATTTTCCATAGTAATTGTACT
CATAATTGTCATTATCATTGCTCGTTTATCTCTGAAACTTTCCAAGACAT
TTTTTCTGATATGTGGAGCTGATATTGCAGCAATTCTAGCAGTTTTTGCA
GTTATAGCGATCCGGGTTCGTTTTACTGCTCGACGAAAACAACTCGAACA
ACGGTTCGATTCAGAAGGCCGAGAGCTTCGAATCGAGTACAGTTTTCTGA
GGAAAGTTGCTGGAGTTCCGACAAAGTTCCGGTATCGGGACTTGGAAGTA
GCCACGGATGGCTTTCGATCTATGGTAGGACGTGGGTCGTCGGCTTCAGT
CTTTAAAGGGATACTCAGTGATGGGACGGCAGTTGCAGTAAAAAGGATCG
AAGGGGATGATCGAGGAGAGAAGGAATTCAAATCAGAAGTTGCAGCTATT
GCTAGCGTGCAACACGTAAACCTCGTACGCCTTCTTGGGTATTGTGTCCA
GTCGACTGGTCCTCGTTTCATTGTTTACGAGTTCATTCATAACGGCTCGT
TGGATAATTGGATTTTCCCCAAGGGGGAAAGGGGTGGTCAACGTAGTGGT
TGTTTGACATGGGATTCGAGATGTACAGTTGCTCTTGATGTAGCGAGAGC
GCTTTCTTACTTGCACCACGATTGTCGATCTTGTATACTGCATCTAGATG
TGAAGCCAGAAAATATACTTCTCGACCATGATTATCGTGCACTCGTGTCA
GATTTTGGGCTCTCGAAAATAAAAGGAAGAGACGAGAGTCGAGTTGTGAC
AACGATCCGGGGGACTAGAGGTTACTTGGCTCCTGAATGGCTCCTGGAGA
ATGGAGTTTCTGAGAAATGTGATGTGTACAGTTATGGAATGGTGCTGTTA
GAGATTATTGGTGGACGAAGAAACGTCCGTGTTCTCGAAAATGGCAATGG
TGAGTCGAAAAAAAAGTTTCAATACTTCCCAAAGATTGTGAGTGACAAAT
TTAAAGATGGGAAACTTATGGAAATTGTTGATCCAAGGTTGGTTGAAGAT
GGAGGGGTTAATGAGAGGCAATTAAAGAGACTGGTTTGTGCAGCTTTATG
GTGCATACAAGAGAAGGCCAAGCTTAGGCCAAGCATGGCTATGGTCGTTG
AAATGCTCGAGGGGCGTGTACCGGTCGAAGACCCGCCCAACACACAAATG
CTTATTGTTGATTTGTTATCAATTGATGAGGAGGCAGCTGTTGTACTCCC
AGGCCTAGATTTGGTATAGT-GGAAAATTACCAAATGAATAGTGACATTC
CTTCCACGTCGAGTTACTCGGTTACAATGTCGATACTCTCAGGCCGGTAG
>FRAX33_FRAEX38873_V2_000292250.1_R0
ATGGAAGACAAAAAAGCAAATTTGATTGCATTTTCCATAGTTATTGTACT
CATAATTGTCATTATCATTGCTCGTTTATCTCTGAAACTTTCCAAGACAT
TTTTTCTGATATGTGGAGCTGATATTGCAGCAATTCTAGCAGTTTTTGCA
GTTATAGCGATCCGGGTTCGTTTTACTGCTCGACGAAAACAACTCGAACG
ACAGTTCGATTCAGAAGGCCGAGAGCTTCGAATCGAGTACAGTTTTCTGA
GGAAAGTTGCCGGAGTTCCGATAAAATTCCGGTATCGGGACTTGGAAGTA
GCCACGGATGGCTTTCGATCTATGGTAGGACGTGGGGCCTCGGCTTCAGT
CTTTAAAGGGATACTCAACGATGGGACGGCAGTTGCAGTAAAAAGGATCG
AAGGGGATGATCGAGGAGAGAAGGAATTCAAATCAGAAGTTGCAGCTATT
GCTAGCGTGCAACACGTAAACCTCGTTCGCCTTCTCGGGTACTGTGTCGC
GTCGACTGGTCCTCGTTTCCTTGTTTACGAGTTCATTCATAACGGCTCGT
TGGATAATTGGATTTTCCCCAAGAGGGAAAGTTGTGGTCGACGTAGTGGT
TGTTTGACATGGGATTCGAGATGTAGAGTTGCTCTTGACGTAGCGAGAGC
GCTTTCTTACTTGCACCACGATTGTCGATCTTGTATACTGCATCTAGATG
TGAAGCCGGAAAATATACTTCTCGACCATGATTATCGCGCACTCGTGTCA
GATTTCGGGCTCTCGAAACTAAAAGGAAGAGACGAGAGTCGAGTTGTGAC
AACGATCCGGGGGACTAGAGGTTACTTGGCTCCTGAATGGCTCCTGGAGA
ATGGAGTTTCTGAGAAATGTGATGTGTACAGTTATGGAATGGTGCTGTTA
GAGATTATTGGTGGACGAAAAAACGTCTGTGTTCTCGAAAATGGCAACGG
TGAGTCGAAAAAAAAGTTTCAATACTTCCCAAAGATTGTGAGTGACAAAT
TTAAAGATGGGAAACTTATGGAAATTGTTGATCCAAGGTTGGTTGAAGAT
GGAGGGGTTAATGAGAGGCAATTAAAGAGACTGGTTTGTGCAGCTTTATG
GTGCATACAAGAGAAGGCCAAGCTTAGGCCAAGCATGGCTATGGTCGTTG
AAATGCTCGAGGGGCGTGTACCGGTTGAAGACCCGCCCAACACACAAATG
CTTATTATTGATTTGTTATCAATTGATGAAGAGGCAGCTGTTGTACTCCC
AGGCCTAGATATGGTATAGT-GGAAAATTACCAAATGAATAGTGACATTC
CTTCCACGTCGAGTTACTCGGTTACAATGTCGATACTGTCAGGCCGGTAG
>FRAX11_FRAEX38873_V2_000292250.1_R0
ATGGAAGACAAAATAGCAAATTTGATTGCATTTTCCATAGTAATTGTACT
CATAATTGTCATTATCATTGCTCGTATATCTCTGAAACTTTCCAAGACAT
TTTTTCTGATATGTGGAGCTGATATTGCAGCAATTCTAGCAGTTTTTGCA
GTTGTGGCGATCCGGGTTCGTTTTACCGCTCGACGAAAACAACTCGAACG
ACAGTTCGATTCAGAAGGCCGAGAGCTTCGAATCGAGTACAGTTTTCTGA
GGAAAGTTGCCGGAGTTCCGATAAAGTTCCGGTATCGGGACTTGGAAGTA
GCCACGGATGGCTTTCGATCTATGGTAGGACGTGGGGCGTCGGCTTCAGT
CTTTAAAGGGATACTCAATGATGGGACGGCTGTTGCAGTAAAAAGGATCG
AAGGGGATGATCAAGGAGAGAAGGAATTCAAATCAGAAGTTGCAGCTATT
GCTAGCGTGCAACACGTAAACCTCGTACGCCTTCTCGGGTATTGTGTCCC
GTCGACTGGTCCTCGTTTCATTGTTTACGAGTTCATTCATAACGGCTCGT
TGGATAATTGGATTTTCCCCAAGAGGGAAAGTCTTGGTCGACGTAGTGGT
TGTTTGACATGGGATTCGAGATGTAGAGTTGCTCTTGATGTAGCGAGAGC
GCTTTCTTACTTGCACCACGATTGTCGATCTTGTATACTGCATCTAGATG
TGAAGCCGGAAAATATACTTCTCGACCATGATTATCGCGCGCTCGTGTCA
GATTTCGGGCTCTCGAAACTTAAAGGAAGAGACGAGAGTCGAGTTGTGAC
AACTATCCGGGGGACTAGAGGTTACTTGGCTCCTGAATGGCTCCTGGAGA
ATGGAGTTTCTGAGAAATGTGATGTGTACAGTTATGGAATGGTGCTGTTA
GAGATTATTGGTGGACGAAGAAACGTCTGTGTTCTCGAAAATGGCAAAGG
TGAGTCGAAAAAAAAGTTTCAATACTTCCCAAAGATTGTGAGTGAGAAAT
TTAAAGATGGGAAACTTATGGAAATTGTTGATCCAAGGTTGGTTGAAGAT
GGAGGGGTTAATGAGAGGCAATTAAAGAGACTGGTTTGTGCAGCTTTATG
GTGCATACAAGAGAAGGCCAAGCTTAGGCCAAGCATGGCTATGGTCGTTG
AAATGCTCGAGGGGCGTGTACCAGTTGAAGACCCGCCCAACACACAAATG
CTTATTGTTGATTTATTATCACTTGATGAAGAGGAAGCTGTTGTACTCCC
AGGCCTAGATTTGGTATAGT-GGAAAATTACCAAATGAATAGTGACATTC
CTTCCACGTCGAGTTACTCGGTTACAATGTCGATAGTCTCGGGCCGGTAG
>FRAX04_FRAEX38873_V2_000292250.1_R0
ATGGAAGACAAAATAGCAAATTTGATTGCATTTTCCATAGTAATTGTACT
CATAATTGTCATTATCATTGCTCGTATATCTCTGAAACTTTCCAAGACAT
TTTTTCTGATATGTGGAGCTGATATTGCAGCAATTCTAGCAGTTTTTGCA
GTTGTGGCGATCCGGGTTCGTTTTACCGCTCGACGAAAACAACTCGAACT
ACAGTTCGATTCAGAAGGCCGAGAGCTTCGAATCGAGTACAGTTTTCTGA
GGAAAGTTGCCGGCGTTCCGATAAAGTTCCGGTATCGGGACTTGGAAGTA
GCCACGGATGGCTTTCGATCTATGGTAGGACGTGGGGCGTCGGCTTCAGT
CTTTAAAGGGATACTCAATGATGGGACGGCAGTTGCAGTAAAAAGGATCG
AAGGGGATGATCAAGGAGAGAAGGAATTCAAATCAGAAGTTGCAGCTATT
GCTAGCGTGCAACACGTAAACCTTGTACGCCTTCTCGGGTATTGTGTCCC
GTCGACTGGTCCTCGTTTCATTGTTTACGAGTTCATTCATAACGGCTCGT
TGGATAATTGGATTTTCCCCAAGAGGGAAAGTCGTGATCGACGTAGTGGT
TGTTTGACATGGGATTCGAGATGTAGAGTTGCTCTTGATGTAGCGAGAGC
GCTTTCTTACTTGCACCACGATTGTCGATCTTGTATACTGCATCTAGATG
TGAAGCCGGAAAATATACTTCTCGACCATGATTATCGCGCGCTCGTGTCA
GATTTCGGGCTCTCGAAACTTAAAGGAAGAGACGAGAGTCGAGTTGTGAC
AACTATCCGGGGGACTAGAGGTTACTTGGCTCCTGAATGGCTCCTGGAGA
ATGGAGTTTCTGAGAAATGTGATGTGTACAGTTATGGAATGGTGCTGTTA
GAGATTATTGGTGGACGAAGAAACGTCAGTGTTCTCGAAAATGGCAAAGG
TGAGTCGAAAAAAAAGTTTCAATACTTCCCAAAGATTGTGAGTGAGAAAT
TTAAAGATGGGAAACTTATGGAAATTGTTGATCCAAGGTTGGTTGAAGAT
GGAGGGGTTAATGAGAGGCAATTAAAGAGACTGGTTTGTGCAGCTTTATG
GTGCATACAAGAGAAGGCCAAGCTTAGGCCAAGCATGGCTATGGTCGTTG
AAATGCTCGAGGGGCGTGTACCGGTCGAAGACCCGCCCAACACACAAATG
CTTATTGTTGATTTATTATCACTTGATGAAGAGGAAGCTGTTGTACTCCC
AGGCCTAGATTTGGTATAGT-GGAAAATTACCAAATGAATAGTGACATTC
CTTCCACGTCGAGTTACTCGGTTACAATGTCGATACTCTCGGGCCGGTAG
>FRAX27_FRAEX38873_V2_000292250.1_R0
ATGGAAGACAAAATAGCAAATTTGATTGCATTTTCCATAGTAATTGTACT
CATAATTGTCATTATCATTGCTCGTATATCTCTGAAACTTTCCAAGACAT
TTTTTCTGATATGTGGAGCTGATATTGCAGCAATTCTAGCAGTTTTTGCA
GTTGTGGCGATCCGGGTTCGTTTTACCGCTCGACGAAAACAACTCGAACG
ACAGTTCGATTCAGAAGGCCGAGAGCTTCGAATCGAGTACAGTTTTCTGA
GGAAAGTTGCCGGAGTTCCGATAAAGTTCCGGTATCGGGACTTGGAAGTA
GCCACGGATGGCTTTCGATCTATGGTAGGACGTGGGGCGTCGGCTTCAGT
CTTTAAAGGGATACTCAATGATGGGACGGCAGTTGCAGTAAAAAGGATCG
AAGGGGATGATCAAGGAGAGAAGGAATTCAAATCAGAAGTTGCAGCTATT
GCTAGCGTGCAACACGTAAACCTCGTACGCCTTCTCGGGTATTGTGTCCC
GTCGACTGGTCCTCGTTTCATTGTTTACGAGTTCATTCATAACGGCTCGT
TGGATAATTGGATTTTCCCCAAGAGGGAAAGTCGTGATCGACGTAGTGGT
TGTTTGACATGGGATTCGAGATGTAGAGTTGCTCTTGATGTAGCGAGAGC
GCTTTCTTACTTGCACCACGATTGTCGATCTTGTATACTGCATCTAGATG
TGAAGCCGGAAAATATACTTCTCGACCATGATTATCGCGCGCTCGTGTCA
GATTTCGGGCTCTCGAAACTTAAAGGAAGAGACGAGAGTCGAGTTGTGAC
AACTATCCGGGGGACTAGAGGTTACTTGGCTCCTGAATGGCTCCTGGAGA
ATGGAGTTTCTGAGAAATGTGATGTGTACAGTTATGGAATGGTGCTGTTA
GAGATTATTGGTGGACGAAGAAACGTCCGTGTTCTCGAAAATGGCAAAGG
TGAGTCGAAAAAAAAGTTTCAATACTTCCCAAAGATTGTGAGTGAGAAAT
TTAAAGATGGGAAACTTATGGAAATTGTTGATCCAAGGTTGGTTGAAGAT
GGAGGGGTTAATGAGAGGCAATTAAAGAGACTGGTTTGTGCAGCTTTATG
GTGCATACAAGAGAAGGCCAAGCTTAGGCCAAGCATGGCTATGGTCGTTG
AAATGCTCGAGGGGCGTGTACCGGTTGAAGACCCGCCCAACACACAAATG
CTTATTGTTGATTTATTATCACTTGATGAAGAGGAAGCTGTTGTACTCCC
AGGCCTAGATTTGGTATAGT-GGAAAATTACCAAATGAATAGTGACATTC
CTTCCACGTCGAGTTACTCGGTTACAATGTCGATACTCTCGGGCCGGTAG

In [28]:
from DNASkittleUtils.Contigs import read_contigs, write_contigs_to_file

# Parse the alignment file into a list of contig records (each record's
# `.seq` and `.name` are used further down).  The bare `len(...)` displays how
# many records were read.
consensus_contigs = read_contigs(consensus_file)
len(consensus_contigs)


Out[28]:
30

In [12]:
# Sequence of the first record.  In the file printed at the top of the notebook
# that is the `>CON` entry, which mixes plain A/C/G/T with other letters
# (M, W, R, Y, ... -- presumably IUPAC ambiguity codes marking columns where
# the aligned samples disagree; confirm with whoever built the alignment).
con = consensus_contigs[0].seq
con


Out[12]:
'ATGGAAGACMAAAWWGCWAATTTGWTWGCVTTTTYCRTWGTWAYTSTACTCATARTTGYCATTATCATTGCTCGTNTWTYTCTGAAACTYTCCARGACDTTTTTTCTKATATKTGGAGCTGATATTGCAGCAATTCTAGCAGTTTTTGCAKTWRTRGCKATCCGGVYTCGTTTYRCYGCTCGRMGAAAACAACTYGAACDRCRGTWYGATTCAGAWGGCCGWGAGCTTMGAATMGAGTACAGTTTTCTGAGGAAAGTTGCYGGMGTTCCSAYAAARTTCMGGTATMGGGAYYTRGAWRTAGCCACRGATGGCTTTSGATCWATGGTRGGACGTGGGKCSTCRGCTKYARTCTTTAAAGGGATMCTCARYGAYGGGACRGCWGTKGCAGTAAAAMGGATYGAAGGGGRTGATCRAGGASRGAAGGAATTCAAATCAGAAGTYGCAGCTATTGCTAGCGTGCAACACGTMAACCTYGTHCGYCTTCTYGGGTWYTGTKTCBMGTCSACTGGTCCTCGWYTCMTYGTTTACGABTTCATTCAYAAYGGCTCGTTGGATAATTGGATTTTCCCCARGVGSGWAMKDBKTGRYCRAYKYAVTGGTTGTTTGACATGGGATTYGAGATGTRSAGTTGCTCTYGAYGTAGCKARAGCRCTWTCTTACTTGCAYCRYGATTGTCGRTCTTGYATACTGCATCTAGATGTKAAGCCRGAAAATATACTTMTMGACCAWGATTATCGYGCRCTYGTGTCRGAYTTYGGGCTCTCRAAAMTDAAAGGAAKAGASGAGAGTCGAGTTGTGACAACDATYCGDGGGACTAGAGGTTAYTTGGCTCCTGAATGGMTCCTGGAGAAYGGAGTWTCHGAGAAATGTGAYGTGTACAGTTATGGAATGGTGCTBTTAGAGATTATYGGTGGACRAARAARYGTCNGTGTTCTYGAMAAWGGYAWHSGYGARTCGAAAARAAAGTTTCARTWCTTCCCRAAGATYGTGAGYGASAAATWKAAAGMTGGGAAACTTAYGGAAATTGTTGATCCAAGGYTRGTTGAAGATKKWGGGRTTAAYGAGAGRCARTTAAARAGACTGGTTTGTGCAGCTTTATGGTGCATACAAGAGAMGRCCAAGCKTAGGCCAASCATGGCTAYGGTYGTTGAAATGCTYGAGGGGCGTGTACYDGTYSAAGACCCKCCCRACACRCAAATGCTTRTWRTTGATWTVTTAWCAMTTGRYRARGAKSMRGCTRTYRTRCTCCCARGCSTAGATWTGGTRTAGTGRGAWRRWTACSAAATGAATAGTGACATTCCTTCMWCRTCRAGTTACTCGGTTACAATGTCRRYASTSTCRGGYCGGTAG'

In [13]:
# Show, in order, every consensus character that is not a plain A, C, G or T.
''.join(filter(lambda base: base not in 'ACGT', con))


Out[13]:
'MWWWWWVYRWWYSRYNWYYRDKKKWRRKVYYRYRMYDRRWYWWMMYMSYRMMYYRWRRSWRKSRKYRMRYYRWKMYRRSRYMYHYYWYKBMSWYMYBYYRVSWMKDBKRYRYKYVYRSYYKRRWYRYRYKRMMWYRYRYYRMDKSDYDYMYWHYBYRRRYNYMWYWHSYRRRWRYYSWKMYYRKKWRYRRRMRKSYYYYDYSKRRRWRWVWMRYRRKSMRRYRRRSWRRWRRWSMWRRRRYSSRY'

In [17]:
# 0-based indices of every consensus character that is not a plain A, C, G or T.
informative_positions = [index for index in range(len(con)) if con[index] not in 'ACGT']
informative_positions


Out[17]:
[9,
 13,
 14,
 17,
 24,
 26,
 29,
 34,
 36,
 38,
 41,
 43,
 45,
 54,
 58,
 75,
 77,
 79,
 89,
 94,
 98,
 107,
 112,
 150,
 152,
 153,
 155,
 158,
 165,
 166,
 173,
 174,
 176,
 182,
 183,
 194,
 199,
 200,
 202,
 205,
 206,
 215,
 221,
 228,
 233,
 260,
 263,
 269,
 271,
 275,
 279,
 285,
 290,
 291,
 293,
 296,
 297,
 305,
 315,
 320,
 326,
 336,
 338,
 341,
 345,
 346,
 348,
 362,
 367,
 368,
 371,
 377,
 380,
 383,
 393,
 398,
 406,
 412,
 417,
 418,
 440,
 467,
 473,
 476,
 479,
 485,
 490,
 491,
 495,
 498,
 499,
 503,
 515,
 516,
 519,
 521,
 530,
 539,
 542,
 571,
 573,
 575,
 577,
 579,
 580,
 581,
 582,
 583,
 586,
 587,
 589,
 591,
 592,
 593,
 595,
 616,
 624,
 625,
 635,
 638,
 644,
 646,
 650,
 653,
 665,
 667,
 668,
 677,
 683,
 701,
 707,
 720,
 722,
 728,
 737,
 740,
 743,
 749,
 752,
 755,
 764,
 768,
 770,
 778,
 782,
 803,
 806,
 809,
 824,
 840,
 851,
 857,
 860,
 872,
 896,
 908,
 916,
 919,
 922,
 923,
 927,
 935,
 938,
 941,
 944,
 946,
 947,
 948,
 950,
 953,
 961,
 971,
 973,
 980,
 986,
 992,
 995,
 1000,
 1001,
 1006,
 1018,
 1038,
 1040,
 1050,
 1051,
 1052,
 1056,
 1061,
 1067,
 1070,
 1076,
 1114,
 1116,
 1123,
 1132,
 1141,
 1145,
 1157,
 1171,
 1172,
 1175,
 1176,
 1184,
 1188,
 1193,
 1203,
 1205,
 1206,
 1212,
 1214,
 1218,
 1221,
 1225,
 1226,
 1227,
 1229,
 1232,
 1233,
 1234,
 1235,
 1239,
 1241,
 1242,
 1244,
 1251,
 1254,
 1260,
 1265,
 1271,
 1274,
 1275,
 1276,
 1277,
 1281,
 1304,
 1305,
 1307,
 1310,
 1331,
 1332,
 1333,
 1335,
 1337,
 1340,
 1343]

In [18]:
def informative_bases(seq, informative_positions):
    """Return the characters of ``seq`` found at ``informative_positions``.

    :param seq: indexable sequence of strings (a DNA string in this notebook).
    :param informative_positions: iterable of indices into ``seq``; the result
        follows the order of this iterable, repeats included.
    :return: a single ``str`` made of ``seq[i]`` for each index ``i``.
    :raises IndexError: if an index lies outside ``seq``.
    """
    picked = []
    for position in informative_positions:
        picked.append(seq[position])
    return ''.join(picked)

# Apply the positions to the consensus itself; the displayed string should be
# exactly the non-ACGT characters of `con`, in order.
informative_bases(con, informative_positions)


Out[18]:
'MWWWWWVYRWWYSRYNWYYRDKKKWRRKVYYRYRMYDRRWYWWMMYMSYRMMYYRWRRSWRKSRKYRMRYYRWKMYRRSRYMYHYYWYKBMSWYMYBYYRVSWMKDBKRYRYKYVYRSYYKRRWYRYRYKRMMWYRYRYYRMDKSDYDYMYWHYBYRRRYNYMWYWHSYRRRWRYYSWKMYYRKKWRYRRRMRKSYYYYDYSKRRRWRWVWMRYRRKSMRRYRRRSWRRWRRWSMWRRRRYSSRY'

In [25]:
# Sanity check: none of A, C, G, T may appear among the consensus characters
# selected by `informative_positions`.
assert not set('ACGT').intersection(informative_bases(con, informative_positions))

In [26]:
# Preview the same positions for one non-consensus record (index 2): this is
# the reduced sequence that record would contribute.
informative_bases(consensus_contigs[2].seq, informative_positions)


Out[26]:
'AAAAATACAAATGATTATTAAGGGTAAGCTTACACCGAATCAACCCACTGCCTTAAGGCAAGGGTCGAATTGAGACAAGACACACCATGCCGTTCTGTCAGGAATTTGGTGCGTGCAGTTGGGTCACATGGCATCACATCGCAGGGCGCCCAATGTAGACCCATCTCGTGAGAATTCTGATTGTGTGTGAGAGGGTCCCTCGGAAATGTATAATGAGGAAGTGAGCTAGTAATCCTGGAGTCCAC'

In [38]:
from DNASkittleUtils.Contigs import read_contigs, write_contigs_to_file, Contig
from os.path import splitext

def barcoding_sequences(input_fasta_path):
    """Reduce every aligned sequence to the columns where the consensus is not A/C/G/T.

    The first contig read from ``input_fasta_path`` is treated as the consensus.
    Every position whose consensus character is not one of ``ACGT`` is kept.
    Each remaining contig is cut down to those positions, renamed with a
    ``__reduced`` suffix and written to ``<input path without extension>__reduced_consensus.fa``.
    A companion file ``<that path>.csv`` lists each kept 0-based position with
    its consensus character, below a one-line header.

    Relies on ``informative_bases`` being defined in the notebook namespace.

    :param input_fasta_path: path of the alignment file to read.
    :return: None; the results are the two files written.
    """
    all_contigs = read_contigs(input_fasta_path)
    con = all_contigs[0].seq
    kept_columns = [column for column, base in enumerate(con) if base not in 'ACGT']

    # Everything after the leading consensus entry is a sample to be reduced.
    reduced_contigs = [
        Contig(sample.name + '__reduced', informative_bases(sample.seq, kept_columns))
        for sample in all_contigs[1:]
    ]

    stem, _extension = splitext(input_fasta_path)
    out_path = stem + '__reduced_consensus.fa'
    write_contigs_to_file(out_path, reduced_contigs)

    # Side-car listing of which columns were kept and what the consensus held there.
    with open(out_path + '.csv', 'w') as outfile:
        outfile.write('List of ambiguous bases output (0-index based)\n')
        outfile.writelines("%i,%s\n" % (column, con[column]) for column in kept_columns)

    
# NOTE(review): this rebinds `consensus_file` to a different file (the `.fa`
# under Barcoding-Fraxinus\data2) than the `.txt` path assigned at the top of
# the notebook, and both are absolute paths on one machine -- re-running
# earlier cells after this one will read this file instead.
# The call writes `consensus align__reduced_consensus.fa` and
# `consensus align__reduced_consensus.fa.csv` next to the input.
consensus_file = r"D:\josiah\Documents\Research\Colleagues\Will Plumb\Barcoding-Fraxinus\data2\consensus align.fa"
barcoding_sequences(consensus_file)


Done writing  29 contigs and 7,105bp

In [ ]: