In [12]:
import os, os.path
import shutil
import glob
import sys
from subprocess import check_call, check_output
# Make the Phred project directory the working directory; the relative
# paths used in later cells (trace-file glob, 'align_data.fasta') resolve
# against it.
os.chdir('/home/will/Dropbox/PhredDirectory/')
# Directory holding the Staden package executables (trailing slash included).
staden_path = '/home/will/staden-2.0.0b9.x86_64/bin/'
# Add the local PySeqUtils checkout to the import search path.
# NOTE(review): presumably this is what makes GeneralSeqTools / HIVTransTool
# importable in later cells - confirm.
sys.path.append('/home/will/PySeqUtils/')
In [13]:
from GeneralSeqTools import call_muscle, fasta_reader, fasta_writer
In [43]:
#from Bio import SeqIO
from Bio.SeqIO.AbiIO import AbiIterator
# Collect every ABI trace (.ab1) for this run. The pattern is relative to the
# working directory set by os.chdir() in the first cell.
files = glob.glob('../Wigdahl Trace files/2:11:11/*.ab1')

# Build a list of (record id, sequence string) pairs, one per trace file.
seqs = []
for f in files:
    # Open in binary mode and close the handle as soon as the record has been
    # read, rather than leaking one open file per trace.
    with open(f, mode='rb') as handle:
        # Only the first record produced by the iterator is used.
        # NOTE(review): trim=True presumably enables Biopython's quality
        # trimming of the read - confirm against the AbiIO documentation.
        rec = next(AbiIterator(handle, trim=True))
    # str(seq) replaces the deprecated Seq.tostring() and yields the same text.
    seqs.append((rec.id, str(rec.seq)))
In [57]:
# Shell escape: print the usage text of convert_trace, which lives in the
# same bin directory that staden_path points to.
!/home/will/staden-2.0.0b9.x86_64/bin/convert_trace --help
Usage: convert_trace [options] [informat outformat] < in > out
Or convert_trace [options] -fofn file_of_filenames
Options are:
-in_format format Format for input (defaults to any
-out_format format Format for output (default ztr)
-fofn file_of_filenames Get "Input Output" names from a fofn
-passed fofn Output fofn of passed names
-error errs Redirect stderr to file "errs"
-failed fofn Output fofn of failed names
-name id ID line for experiment file output
-subtract_background Auto-subtracts the trace background
-subtract amount Subtracts a specified background amount
-normalise Normalises peak heights
-min_normalise Minimum trace amp for normalising
-scale range Downscales peaks to 0-range
-compress mode Compress file output (not if stdout)
-abi_data counts ABI DATA lanes to copy: eg 9,10,11,12
-signed Apply global shift to avoid negative values
-noneg Shift each channel independently to avoid -ve
-- Explicitly state end of options
In [45]:
# Pass the (id, sequence) pairs loaded from the trace files to call_muscle.
# NOTE(review): presumably this returns the aligned records in a form that
# fasta_writer accepts - confirm against GeneralSeqTools.
res = call_muscle(seqs)

# Write the result to 'align_data.fasta' in the current working directory;
# the with-block guarantees the file is flushed and closed.
with open('align_data.fasta', 'w') as handle:
    fasta_writer(handle, res)
In [47]:
# HIVTransTool is a project-local module.
# NOTE(review): presumably importable because of the sys.path entry added in
# the first cell - confirm.
from HIVTransTool import process_seqs
# Run only the first 50 reads and materialise the results into a list.
# The displayed output further down shows each element is a dict with keys
# such as 'Name', 'RegionName' and 'QueryNuc'.
# NOTE(review): the exact meaning of extract_regions and known_names is not
# visible in this notebook - check HIVTransTool.process_seqs before changing.
results = list(process_seqs(seqs[:50], extract_regions = True, known_names = 50))
WARNING:root:Started ThreadPool with 5 workers
Processed 1 Sequences of 50
Processed 2 Sequences of 50
Processed 3 Sequences of 50
Processed 4 Sequences of 50
In [52]:
# Print the name and query nucleotide sequence of every result row whose
# RegionName is 'LTR5', one row per line, separated by a single space.
for row in results:
    if row['RegionName'] == 'LTR5':
        # A single pre-formatted argument prints identically under the
        # Python 2 print statement and the Python 3 print function.
        print('%s %s' % (row['Name'], row['QueryNuc']))
A0109-R04-Primer7 ATTGGCAGACTACACACCAGGGCCAGGGGTCAGATATCCACTGACCTTTGGATGGTGCTACAAGCTAGTACCAGTTGAGCCAGATAAGGTAGAAGAGGCCAATAAAGGAGAGAACACCAGCTTGTTACACCCTGTGAGCCTGCATGGAATGGATGACCCTGAGAGAGAAGTGTTAGAGTGGAGGTTTGACAGCCGCCTAGCATTTCATCACGTGGCCCGAGAGCTGCATCCGGAGTACTTCAAGAACTGCTGACATCGAGCTTGCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGAGGCGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATTTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCT
8-Primer7 ANGGCAGACTACACACCAGGGCNAGGNNTCAGATACCCACTGTGTTTTGGTTGGTGCTTTAAGCTAGTACCAGTTGAGCCAGAGGATGTAGAAAAGGCCAACGAAGGAGAGAACAACAGCCTGTTACACCCTATGAGCCTGCATGGGATGGAGGACACGGAGAAAGAAGTGTTAGTGTGGAGGTTTGACAGCCGCCTAGCATTTCATCACGTGGCCCGAGAGAAGCATCCGGAATACTACCAGAACTGCTGACATCGAGATTGCTACAAGGGACTTTCCGCTGGGGACTTTCCACGGGGGTGGGGNCTGGGCGGGAATGGGGAATGGCNAACCC
A0343-R02-Primer7 TACACACCAGGGCCNNGNNNCAGATATCCACTGACCTTTGGATGGTGCTTCAAGCTAGTCCCAGTGGATCCAGAGAAGATAGAAGAGGCCAATGAAGGGGAGAACAACTGCTTGTTACACCCTATGAGCCAGCATGGGATGGATGACCCAGAGAAAGAAGTGCTAGAGTGGAGGTTTGACAGCCGCCTAGCATTCCATCACATGGCCCGAGAGCTGCATCCGGAGTACTACAAGGACTGCTGACACCGAGCTTTCTACAAAGGACTTTCCGCTGGNGACTTTCCAGGGGAGGCGTGGCCTGNGCAAGGTTAGGGAGTGGCGAGCCCTCANATGCTGCATATAAGCAGCTGCTCTTTGCCTGTACTAAGTCTCTCTGGTTAGACCAGATCAGAGCCTAGGAGCTCTCTAGCTANCTAAGGAAC
A0141-R01-Primer7 TTGGCAGACTACACACCAGGGCNNNNNNCTAGATGGTCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCAGAGAAGATAGAAGAGGCCAATGCAGGAGAGAACAACTGCTTGTTACACCCTATGAGCCAGCATGGAATGGATGACCCGGAGAGAGAAGGGTTAGAGTGGAGGTTTGACAGCCGCCTAGCATTTCATCACGTGGCCCGAGAGCTGCATCCGGAGTACTACAAGAACTGATGACCTCGAGCTTTCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGAAGGCGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAGCTAGGGAACCCACTGCTTAAGCCTCAATAAAGCNNGNCTGGAGTGCT
A0145-R04-Primer7 GNNACTNCNCACCAGTGGNNNNNNNNCCAGATATCCCCTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTGGAGCCAGAGAAGGTAGAAGAGGCCAATGAAGGAGAGAACAATTGCCTGTTACACCCTATGAGCCAGCATGGGATGGACGACCCGGAGAGAGAAGTGTTAGCATGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAGTACTACAAGGACTGCTGACACCGAGCTTTCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGAGGTGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTCTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGA
A0025-R04-Primer7 GGCAGATTACNCACCAGGGCNNNGNANCAGATANCCACTGACCTTTGGATGGTGCTTCAAGCTNNTACCAGTTAAGCCAGAGGATGTAGAAGAGGCCAATACGGGAGAGAACAACAGCTTGCTACACCCTATGAGCCTGCATGGGATGGAAGACCCGGAGAGGGAAGTGTTAGTGTGGAAGTTTGACAGCAAACTAGCATTTCATCACATGGCCCGAGAGCTGCATCCGGACTACTACAAGAACTGCTGATATCGAGCTTTCTACAAGGGACTTTCCGCTGGGGACTTTCCAGAGGAGGCGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTCGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTGACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTTAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACT
6-Primer7 ATTGGCANATTACNCACCAGGGCCAGGNATCAGATATCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGATCCAGAGAAAGTAGAAGAGGCCAATGAAGGAGAGAACAACTGCTTGTTACACCCCATAAGCCAGCATGGGATGGGGGACCCGGAGAGAGAAGTGTTAATGTGGAAGTTTGACAGCACCCTAGCATTTCACCACAGGGCCCGAGAGCTACATCCGGAGTACTACAAAAACTGATGACATTGATCTTTCTACAAGGGACTTTCCGCTGGGACTTTCCGGGGAGGCGCGGCCTGGGCGGGACAGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCCGAGCCTGGGAGCTCTCTGGCTGACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAAC
A0266-R03-Primer7 TTGGCAGACTACACACCAGGGCCAGGNNCCAGATTTCCACTGACCTTTGGATGGTGCTTNAANNNNNNNNNNNNTGATCCAGATCANGTAGAAAAGGCTAATGAAGGANAANACAACANCTTGTTACACCCTATGAGCCTGCATGGGATAGAGGACACGGAGAGAGAAGTGTTAGTGTGGAAGTTTGACTCCAAGCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAGAACTGCTGACATCGAGCTTTCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGAGGCGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATGANCAGCTGCTTTTTGCCGGNCCGGGGGTCTCTGGGGNNANCNNAAATGAACCCGGGGGCTCTCTGGGTAACTTAGGGAACCNACGGNTAAACCCTCATTAAACCTGGCCTGGATTGTTTCAAGTATGGNGGGCCCTCCGGTTGTGGGATTTGGGTACTAAAAAA
A0105-R04-Primer7 TNGNAGACTACNCACCAGGGNCNNNNNNCCAGATATCCCCTGACCTTTGGATGGTGCTTTAANNNNNNNCCAGTTGAGCCAGAGCAGGTAGAAGAGGCCACGAGAGGAGAGAACACCACTTTGTTACACCCTGTAAGCCTGCATGGGATGGAGGACCCGGAGAAAGAAGTGCTGATGTGGAAGTTTGATAGCCGCCTCGCATTCCGTCACGTGGCCCGAGAGCTGCATCCGGAGTACTTCAAAAACTGATGACATTGAGCTTCTCTAAGGGACTTTCCGTTGGGGACTTTCCAGGGGAGGCGCGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATAAAAGCAGCCGCTTTTCGCTTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAGCTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTNGAGTGCTTAAAGTANTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGANAT
A0332-Primer7 TNNNNACTACNCNCCAGGGCCAGNNGNGNTCAGATATCCACTGACCTTTGGATGGTGCTACAAGCTAGTACCAGTTGAGCCAGATAAGGTAGAAGAGGCCAATAAAGGAGAGAACACCAGCTTGTTACACCCTGTGAGCCTGCATGGAATGGATGACCCTGAGAGAGAAGTGTTAGAGTGGAGGTTTGACAGCCGCCTAGCATTTCATCACGTGGCCCGAGAGCTGCATCCGGAGTACTTCAAGAACTGCTGACATCGAGCTTGCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGAGGCGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATTTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTANTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCT
A0235-R01-Primer7 TGGCANACTACNCACCAGGGCCAGGNACCAGATTTCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGATCCAGATCAGGTAGAAAAGGCTAATGAAGGAGAAGACAACAACTTGTTACACCCTATGAGCCTGCATGGGATGGAGGACCCGGAGAGAGAAGTGTTAGTGTGGAAGTTTGACTCCAAGCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAGAACTGCTGACATCGAGCTTTCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGAGGCGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCGGACTGGGTCTCTTCTGGTAAAACAAAATTGAACCCGGGAACTTCTTGGGTTACTTAGGAAACCCCTGGTTAAACCCTCATAAAACTTGGCTTGGNTGATTTCAGTAATGGGGGG
A0161-R02-P5-Primer5 GCTACTTCNNTGATTGNNNNNNNNNNCNCCAGGGCCAGGGACAAGATTTCCACNNNNNNNNGGNNGGGGAATTCAAACTAGTACCAGTTGAGCAAGAGAAGATAGAGGACAATGAAAGAGAAAACAGCAGCCTGTTACACCCCATGAGCCAGCATGGGATGGATGACCCAGAGAAAGAAGTATTACAGTGGAAGTTTGACAGCCGCCTAGCCTTCCATCACGTGGCCCGAGAGCTGCATCCGGAGTACTACAAGAATTGATGACACCGAGCTTTCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGAGGTGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCCGCTTTGCGCTTGTACAGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTGACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTGTGTGCCCGTCTGTTG
A0389_R01-Primer7 TTGCAGACTACNCACCAGNNNNNNNNNNNCAGATTTCCACTGACCTTTGGATGGTGCTTCAAGCTNNTNCCAGTTGAGCCAGAGGAGGTAGAAAAAGCCAATGAAGGAGAAAACAACTGCTTGTTGCACCCTATGAGCCAGCATGGGATGGATGACCCAGAGAAAGAAGTGTTAGTATGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGATACATCCGGAGTACTACAAGGACTGCTGACATTGAGCTTTCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGAGGCGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAGCTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTTAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGAT
A0392-Primer7 ATGNGACTACNCACCAGGGCNNNGNNNCAGATATCCACTGACCTTTGGATGGTGCTACAAGCTAGTACCAGTTGAGCCAGATAAGGTAGAAGAGGCCAATAAAGGAGAGAACACCAGCTTGTTACACCCTGTGAGCCTGCATGGAATGGATGACCCTGAGAGAGAAGTGTTAGAGTGGAGGTTTGACAGCCGCCTAGCATTTCATCACGTGGCCCGAGAGCTGCATCCGGAGTACTTCAAGAACTGCTGACATCGAGCTTGCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGAGGCGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATTTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGA
A0431-Primer7 TGNAACTACNCACCAGGGCNNNNNNNNANATTTCCACTGACCTTTGGGTGGTGCTTCNNGNNNNTACCAGTTGATCCAGATCAGGTAGAAAAGGCTAATGAAGGAGAGATAAATAGCTTGCTACACCCTATGAGCCTGCATGGAATGGAGGACCCGGACGGAGAAGGAGAAGTGCTAATGTGGAAGTTTGACAGCCTCCTAGCAGTTCGTCACATGGCCCGAGAGATGCATCCGGAATACTACAAGGACTGCTGACATCGAGCTTTCTACAAGGGACTTTCCGCTGGGGACTTTCCANGGGAGGCNTGACATGGNCGGGACTGGGGANTGNCGACNCCTCANATGCAGCATATAAACGCCGGCTTTTTGCCTGTGCTG
A0176-Primer7 ATTGGCAGACTACACACCAGGGCCAGGGGTCAGATATCCACTGACCTTTGGATGGTGCTACAAGCTAGTACCAGTTGAGCCAGATAAGGTAGAAGAGGCCAATAAAGGAGAGAACACCAGCTTGTTACACCCTGTGAGCCTGCNNGNNATGGATGACCCTGAGAGAGAAGTGTTAGAGTGGAGGTTTGACAGCCGCCTAGCATTTCATCACGTGGCCCGAGAGCTGCATCCGGAGTACTTCAAGAACTGCTGACATCGAGCTTGCTACAAGGGACTTTCCGCTGGGGACTTTCCAAGGAGGTGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAAC
A0339-R01-Primer7 TGNNACTNCNCACCAGGNNNNNNNNNCAGATTCCAATAACCTTTGGGTGGTGCTTCAAGTTAGTANNNGTTGAGCCAGANAAGGTAGAAGAGGCCACTGAACAGGAGAACACCACCTTGTTGCACCCTATAAGCCAGCATGGGATAGAGGACCCGGAGAGAGAAGTGTTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAGGACTGCTGACATCGAGCTTTCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGGAGGCGTGGACTGGGCGGGACAGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTTGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTGTGTGCCCATCTGTTGTGTGACTCTGGTAACTAGAGAT
A0305-R03-Primer7 TNNAGACTACNCACCAGGCNNNNNNNNCTAGATTCCCACTGACCTTTGGATGGTGCTTCAAGCTNNTNCCAGTTGAGCCAGAGGAGGTAGAAAAGGCCAATGAAGGAGAAAACAACAGCCTGTTGCACCCTATGAGCCAGCATGGGATGGATGACCCGGAGAAAGAAGTGTTAGTATGGAGATTTGACAGCCGCCTAGCATTTCATCACGTGGCCCGAGAGATGCATCCGGAGTTCTACAAGGACTGCTGACATTGAGCTTTCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGAGGTGTGGCGGGAGGTGTGGCTTGGGCGTGGCGATCCCTCAGATGCTGCATATAAGCAGCTGCTTTCTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAGCTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACT
A0310-Primer7 TGGCAGACTACACACCAGGGCCAGGNNGTCAGATATCCACTGACCTTTGGATGGTGCTACAAGCTAGTACCAGTTGAGCCAGATAAGGTAGAAGAGGCCAATAAAGGAGAGAACACCAGCTTGTTACACCCTGTGAGCCTGCATGGAATGGATGACCCTGAGAGAGAAGTGTTAGAGCGGAGGTTTGACAGCCGCCTAGCATTTCATCACGTGGCCCGAGAGCTGCATCCGGAGTACTTCAAGAACTGCTGACATCGAGCTTGCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGAGGTGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATTTGAACCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACT
A0095-R01-Primer7 ATTGGCAGACTACACACCAGGGCCAGGGNANNANATANGCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCAGATAAGGTAGAAGAGGCCAATGNAGGAGAGAACACCTGCTTGTTACACCCTATGAGCCTGCATGGAATGGATGACCCGGAGAGAGAAGGGTTAGAGTGGAGGTTTGACAGCCGCCTAGCATTTCATCACGTGGCCCGAGAGCTGCATCCGGAGTACTTCAAGAACTGATGACATCGAGCTTTCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGAAGGCTGGCCTGGGCCGGAATTGGGAATGGCCAACCCTTCAAATCTGGAAATTAACCGCCGGTTTTTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTTAAGTAGTGTGTGCCCGTCTGTTGTGTGACT
A0245-R01-Primer7 ATTGGCAGACTACACACCAGGGCCAGGGATCAGATATCCACTGACCTTTGGATGGTGCTACAAGCTAGTACCAGTTGAGCCAGAGAAGATAGAAGAAGCCAATAAAGGAGAGAACACCAGCTTGTTACACCCTGTGAGCCTGCATGGGATGGATGACCCTGAGAGAGAAGTGTTAGAGTGGAGGTTTGACAGCCGCCTAGCATTTCATCACGTGGCCCGAGAGCTGCATCCGGAGTACTTCAAGAACTGCTGATATCGAGCTTGCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGAGGCGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAGCTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTGTGTGCCCGTCTGTTGTATGAC
A0120_R02-Primer7 TNNNTACTACNCNCCAGGGCCNNNNATCAGATATCCACTGACCTTTGGATGGTGCTTCAAGCTANTACCAAGGGAACCAGAGGACAATGAAAAAGAGAACAGCAGCTTATTGCACCCTGCGAGTCTGCATGGGATGGAGGACCCGGAGAAAGAAGAGTTAATATGGAAGTTTGACAGCCACCTAGCATTTCGTCACATGGCCCGAGAACTGCATCCGGAGTACTTCAAGAACTGCTGACATTGAGCTTCCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGAGGCGTGGCCGGGGCGTGGTCTGGGCGGGACTGGGGAGTGGANAGCCCTCAGATGCTGCATATAATCAGCTGCTTTTGCCTGTAACTGGGTCTCTCTGGTTAAACCAGATCTGACCCTGGGAGCTCTCTGGCTAACAAGGGAACCCACTGCTTAAGCCTCANTAAAGCTTGCCTTGAGTGCTTCGAGTANNGGGTGCCCGTCTGTTGTGTGACTCT
A0385-R01-Primer7 GNNNNNNNNANNNNNNGANGGCAGACTACNCACCAGGGCCAGGGGTCAGATATCCACTGACCTTCGGATGGTGCTTCAAGTTAGTACCAGTTGATCCAGAGCAGGTGGAAAAGGCCAATGAAGGAGAGAACAACAGCTTGCTACACCCTATGAGCCAGCATGGGATGGATTCAGAAGGAGAAGTGTTAATGTGGCAGTTTGACAGTAAACTGGCATTTCATCACGTAGCCCGAGAGCTGCATCCGGAGTACTACAAGAACTGATGACATTGAGAACTGCTGACATTGAGCTTTCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGAGGCGTGGCCTGGGCGGGACATGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTGCCTGTACTGGGTCTCTCTGGTTAAACCANATCTGAACCTGGGAACTCTCTGGCTGAATANGGAACCCANTGNNTAANCCTCAATAAANCTTGGCTTGANTGNTTTAANTANTGTGTGCCCNTCTGTTGTGTGACTCTGGTAAC
27-Primer7 GNNGACTNCNNCNANGNNNNNNNNNNNANTCCACTGACCTTTGGATGGTGCTCANNNNNNNNCCAGTTGAGCCAGANAGGTAGAAGAGGCCAATAAAGGAGAGAACAAAAGCTTGTTACACCCTGTGAGCCTGCATGGAATGGATGACCCTGAGAGAGAAGTGTTAGAGTGGAGGTTTGACAGCCGCCTAGCATTTCATCACGTGGCCCGAGAGCTGCATCCGGANTACTTCAAGAACTGCTGACATCGAGCTTGCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGAGGTGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAGACCAGANNTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTT
A0262-R01-Primer7 ATTNGCAGACTACACACCAGGGCCAGGGGNTCAGATATCCACTGACCTTTGGATGGTGCTACAAGCTAGTACCAGTTGAGCCAGATAAGGTAGAAGAGGCCAATAAAGGAGAGAACACCAGCTTGTTACACCCTGTGAGCCTGCATGGGATGGATGACCCGGAGAGAGAAGTGTTAGAGTGGAGGTTTGACAGCCGCCTAGCATTTCATCACGTGGCCCGAGAGCTGCATCCGGAGTACTTCAAGAACTGCTGATATCGAGCTTGCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGAGGCGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATCCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGG
A0430-Primer7 ANNNNNNNNNNNNNATNNNNACTNCNCACCAGGGCCAGNNNNAAGATTTCCACTGACCTTTGGATGGTGCTTNNAANANNGGACCAGTTGAGCAAGAGAAGATAGAGGACAATGAAAGAGAAAACAGCAGCCTGTTACACCCCATGAGCCAGCATGGGATGGATGACCCAGAGAAAGAAGTATTACAGTGGAAGTTTGACAGCCGCCTAGCCTTCCATCACGTGGCCCGAGAGCTGCATCCGGAGTACTACAAGAATTGATGACACCGAGCTTTCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGAGGTGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCANATGCTGCATATAAGCAGCCGCTTTGCGCTTGTNCAGGGTCTCTCTGGNTAGANCGTATCTGAGCCTGGNAGCTCTCTGGCTGANTAGNGAACCCACTGCTTGGNCCACAATGAAGCTTGCCGTGAATGCTTCAANTAGTGTGGGCCCGAG
A0305-R02-Primer7 CNNNNGGCAGACTACACACCAGGGCNNNGNNCCAGATATCCACTGTGTTTTGGATGGTGCTTCAAGCTCGTACCAGTTGAGCCAGAGGAGGTAGAAAAGGCCAATGAAGGAGAAAACAACATCTTGTTGCACCCTATGAGCCTGCATGGGATGGATGACCCGGAGAAAGAAGTGTTAGTATGGAGGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTTCTACAAGGACTGCTGACACTGAGCTTTCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGAGGTGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAGCTGGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTTAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAAC
A0095-R03-Primer7 GATTGGNAGACTACACACCAGGGCCANGNNTTAGATACCCACTGTGTTTTGGATGGTGCTTCAAGCTAGTACCAGTTGATCCAGAGAAGGTAGAAGAGGCCAATGAAGCAGAGAACAACTGCTTGCTACACCCTATGAGCCTGCATGGGATGGATGACCCGGAGAAAGAAGTGTTAGTGTGGAGATTTGACAGTCATCTAGCATTTCGTCACCTGGCCCGAGAGAAACATCCGGAATACTTTAAAGACTGCTGACATCGAGATTTCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGGAGGCGTAACCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAAATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGTTTAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAA
A0384-R01-Primer7 CNNNTTGGCAGACTACACACCAGGGCCAGGGGTCAGATATCCACTGACCTTTGGATGGTGCTACAAGCTAGTACCAGTTGAGCCAGATAAGGTAGAAGAGGCCAATAAAGGAGAGAACACCAGCTTGTTACACCCTGTGAGCCTGCATGGAATGGATGACCCTGAGAGAGAAGTGTTAGAGTGGAGGTTTGACAGCCGCCTAGCATTTCATCACGTGGCCCGAGAGCTGCATCCGGAGTACTTCAAGAACTGCTGACATCGAGCTTGCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGAGGCGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGG
A0184-R03-Primer7 TGGCAGACTACACGCCAGGGCNNNNNNTCAGATATCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTGGAGCCAGAGGAGGTAGAAAAGGCCAATGAAGGAGAAAACAACTGCTTGTTACACCCTATGAGCCAGCATGGGATGGATGACCCGGAGAAAGAAGTGTTAATATGGAGGTTTGACAGCCGCCTAGCATTTCATCATGTGGCCCGAGAGAAGCATCCGGATTACTACAAGAACTGCTGACATCCTACAATAACTGCTGACACCGAGCTTCCTTCAAGGGACTTTCCGCTGGGGACTTTCCATAAGGCGTGGCCTGGGCGGGACGGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAAC
A0451-Primer7 TGNAAACTACNCACCAGGGCCNGGNNTAAGATATCCACTGACCTTTGGATGGTGCTTCAAGTTNNGTACCGGTAGAGAAAGAGCAGGTAGAAGAGGCCAATGCAGGAGAGAACAACTGCTTATTACACCCTATGAGCCTGCATGGGATGGAGGACTCGGAGAAAGAAGTGTTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACGTGGCCAAAGAGCTGCATCCGGAGTACTACAAAGACTGCTGACATCGAGCTTTCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGGGCGCGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCCGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCC
A0432-Primer7 TGNNANTACNCACCAGGGCCNGGGGTCAGATATCCACTGACCTTTGGATGGTGCTTCNNGCTNGTACCAGTGGATCCAGAGAAGGTAGAAGAGGCCACTGAAGGAGAGAACATCAATCTGCTACACCCTATAAGCCTGCATGGGATGGAAGACTCGGAGGGAGAAGTGCTGCAGTGGAAGTTTGACAGCCGCCTAGCATTTCGGCATGTTGCCCAAGAGATACATCCGGAGTACTACGAGAATCGCTGACACCGAGCTTTCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGAGGTGTGGCCTGGGCGGGACCGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTCTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAGCTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATC
A0048-R02-Primer7 GATTACACACCAGGGCCAGGNAANNNGATTTCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTAAGCCAGAGGATGTAGAAGAGGCCAATACAGGGGAGAACAACAGCTTGTTACACCCTATGAGCCTGCATGGGATGGAAGACCCGGAGAAGGAAGTGTTAGTGTGGAAGTTTGACAGCAAACTAGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAGTACTACAAGAACTGCTGACATCGAGCTTTCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGGAGGCGTGACCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTCTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTANTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACT
A0312-R01-Primer7 GGNAGATTACACACCAGGGCNNNNNNCCAGATACCCACTGTGTTTTGGCTGGTGCTTCAAGCTAGTACCAGTAAAGCCAGACACTAAAAGAGAAGAAAACAATTGCTTGTTACACCCTATAAACCAGCATGAAATGAATAACTCGGAAAAAGAAGTATTACAGTGAAAGTTTAACAGCTACCTAGCCTACCGTCACGTGGCCCGAGAGCTGCATCCGGAGTACTTCAAAGACTGCTGACACTAAGCTTTCTACAAAAGACTTTCCGCTAGGAACTTTCCAGAANAGGCGTAACCTGAGCAGGACTGAAAAGTGGCGAGCCCTCAGAAGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGAGTCTCTCTGGTTAAACCAGATCTAAGCCTAAAAGCTCTCTAGCTAGCTAGAGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTAAGTGCTTCAAGTAGTGTGTGCCCATCTGTTGTGTAACTCTGGTAGTGTAACTCTGGTAACAANAGATC
A0280-Primer7 GGNANACTACNCACCAGGGCNANNNNNNCAGATATCCATTGACCTTTGGATGGTGCTACAAGCTAGTACCAGTTGAGCCAGATAAGGTAGAAGAGGCCAATAAAGGAGAGAACACCAGCTTGTTACGCCCTGTGAGGCTGNGTCAAATGGATGACCCTGAGAGAGAAGTGTTAGAGTGGAGGTTTGACAGCCGCCTAGCATTTCATCACGTGGCCCGAGAGCTGCATCCGGAGTACTTCAAGAACTGCTGACATCGAGCTTGCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGAGGCGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGTTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTGTGTGCCCGTCTGTTGTATGACTCTGGTAACTAANAT
20-Primer7 AGATTACNCNCCAGGGCCAGNGNANCAGATTTCCACTAACCTTTGGGTGGTGCTTCAAGCTAGTACCAGTTAAGCCAGAGGATGTAGAAGAGGCCAATACAGGAGAGAACAACAGCCTGTTACATCCTATGAGCCTACATGGGATGGAAGACCCAGAGAAGGAAGTGCTAGTGTGGAAGTTTGACAGCAAACTAGCATTTCATCACGTGGCCCGAGAGCTGCATCCGGAGTACTACAAGAACTGCTGACACTGAAGATCTATAAGGGACTTTCCGCTGGGGACTTTCCAGGGGAGGCGTGGACTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCTTTGAGTGCTTCAAGTAGTGTGTGCCCGTCTGTTGTATGACTCTGGTAA
A0249-Primer7 GATTGGCAGACTACACACCAGGGCCAGGGGTCAGATATCCACTGACCTTTGGATGGTGCTACAAGCTAGTACCAGTTGAGCCAGATAAGGTAGAAGAGGCCAATAAAGGAGAGAACACCAGCTTGTTACACCCTGTGAGCCTGCATGGAATGGATGACCCTGAGAGAGAAGTGTTAGAGTGGAGGTTTGACAGCCGCCTAGCATTTCATCACGTGGCCCGAGAGCTGCATCCGGAGTACTTCAAGAACTGCTGACATCGAGCTTGCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGAGGCGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATTTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTC
A0148-R02-Primer7 TGGNAGACTACACACCAGGGCCAGGGGTCAGATATCCACTGACCTTTGGATGGTGCTACAAGCNAGTACCAGTTGAGCCAGATAAGGTAGAAGAGGCCAATAAAGGANANAACACCAGCTTGTTACACCCTGTGAGCCTGCATGGAATGGATGACCCTGAGAGAGAAGTGTTAGAGTGGAGGTTTGACAGCCGCCTAGCATTTCATCACGTGGCCCGAGAGCTGCATCCGGAGTACTTCAAGAACTGCTGACATCGAGCTTGCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGAGGCGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGAT
A0428-Primer7 ATTGGCAGANTACNCNCCAGGGCCAGGGATCAAGATATCCACTGACCTTTGGGTGGTGCTTCAAGTTAGTACCAGTTGAGCCAGAGGAGGTAGAAAAGGCTAATGAAGGAGAGAACAATTGCTTGTTACACCCTATGAGCCAGCATGGGATGGACGACTCAGAGAAAGAAGTGTTAGTGTGGAAGTTTGACAGCCGCCTCGCATTTCATCACGTGGCCCGAGAGCTGCATCCGGATTACTACAAGGACTGCTGACATCGAGCGTTCTACATGCTGACACTGAGCTTTCTACAAGGGACTTTCCGCTGGGACTTTCCGGGGAGGCGCGGCCTGGGCGGGACAGGGGAGTGGCGAGCCCTCANATGCTGCATATAAGCAGCTGCTTTCTGCCTGTACAGGGTCTCTCTGGTTAGACCAGATCTGAACCTGGGAGCTCTCTGGCTAGCTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTACAGTAGTGTGTGCCCGTCTGTTGTGTGACANTGGTAACT
A0080-R04-Primer7 CCNCTGACCTTTGGATGGTGCTTCNNNNNNNNNNNNTTGAGCCAGATCACAATGAAGGAGAGAACACCAGCCTGTTACACCCTGTGAGCCTGCATGGGATGGAGGACACAGAGAGAGAAGTGTTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACGTACCCCGAGAGAAGCATCCAGAGTTCTACAAGAACTGCTGACACCGACACAAGAACTGCTGACATTGAGCTTTCTACAGGGACTTTCCGCTGGGGACTTTCCAGGGGAGGCGTGGCCTGGGCGGGACTGGGGAGTGGNNAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCCGGGAGCTCTCTGGCTAGCTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTC
A0001-R06-Primer7 CNGATTGGNNNNCTACACACCAGGGCCAGGNATCAGATATCCACTGACCTTTGGATGGTGCTTCAAACTAGTACCAGTTGAGCAAGAGAAGGTAGAAGAGGCCAATGCAGGGGAGAACAACAAATTGTTACACCCTATGAGCCTGCATGGGATGGATGACCCGGAGAAAGAAGTGCTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACGTGGCCCGAGAGCTGCATCCGGAGTACTACAAGAACTGCTGACATCGGAATTGCTGACAGGGAGCTTTCTATGGGGGATTTTCCGGTGGGGACTTTCCGGGGAGGTGTGGCCTGGGCGGGACCGGGGAATGGCGAGCCCTCACATGCTGCTTATAACCGTCTGCTTTCTGCCTGGTCTGGGTCTCTCTGGTTATACCAGATCTGAGCCTGGGAGCTCTCTGGCTAGCTAAGGAACCCACTGCTTAAGCCTCG
A0284-R03-Primer7 GGCAGACTACNCACCAGGACCAGGGGTTAGATACCCACTGTGTTTTGGCTGGTGTGTGACTCTGGTAACTAGAGATCCCTCANNAGTAGAGAAGAGTGAGAAAGNAGACAGCTGCTTGTTACACCCTGCAAGCCAGCATGGGATGGATGACCCAGAGAAAGAAGTGCTGCAGTGGAAGTTTGACAGCCGCCTAGCCTTCCATCACGTGGCCCGAGAGCTGCATCCGGAGTACTTCAAGAACTGCTGACACCGAGCTTCATAACGGGGACTTTCCGCTGGGGACTTTCCAGGGGAGGTGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTTGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAGCTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAA
A0412-R01-Primer7 CNNNTTGGNAGACTACACACCAGGGCCAGGGGTCAGATATCCACTGACCTTTGGATGGTGCTACAAGCTAGTACCAGTTGAGCCAGATAAGGTAGAAGAGGCCAATAAAGGAGAGAACACCAGCTTGTTACACCCTGTGAGCCTGCATGGAATGGATGACCCTGAGAGAGAAGTGTTAGAGTGGAGGTTTGACAGCCGCCTAGCATTTCATCACGTGGCCCGAGAGCTGCATCCGGAGTACTTCAAGAACTGCTGACATCGAGCTTGCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGAGGCGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTG
A0402-R01-Primer7 ATGNNACTACNCGCCAGGGCCAGGGACCAGATATCCCCTGACCTTTGGATGGTGCTTCNNGCTAGTACCGGTTGAGCCAGAGGAGGTAGAAAAGGCCAATGAAGGAGAGAACAACTGCTTGTTACACCCTATGAGCCAGCATGGGATGGATGACCCGGAGAAAGAAGTATTAGTATGGAAGTTTGACAGCAGCCTAGCATTTCATCACGTGGCCCGAGAGCTGCATCCGGAGTACTACAAGAACAGCTGACATCGAACTTTCTACAAGGGACTTTCCGCTGGGGACTTTCCATGAGAGGCGTGCCCTGGGGGGGAGGGGGGAGTGGAGACCCCTCANANGCTGCATATAANCATCNGCTTTTTGCCTGTACTGGGTCTCTGTGGTTAGACCAGATCTGACCGGGGGAGCTCTCTGGNTAGCTGGGAAACCCAGTGCTTAANCCTCAATAAANCTNGCCTTGAGTGCTTCAAGTAGTGTGTGCCCGTCTGTTGTG
A0067_R06-Primer7 GNANANTACACATCAGGGCCAGNGGGTCAGATACCCACTGTGCTTTGGCTGGTGCTTCAAGCNNNTACCAGCTGAGCCAGAGGAGGTAGAAAAGGCCAATGAAGGAGAAAAGAACAGCTTGTTACACCCTGCGAGCCTGCATGGAATGGATGACCCTGAGGGAGAAGTGTTAGTGTGGAGATTTGACAGCCGCCTGGCGTTCCATCACGTGGCCCGAGAGCTGCATCCGGAGTACTTCAAGAACTGATGACACTGAACTTTCTACAAGGGACTTTCCACTGGGGACTTTCCAGAGAGGGCGTGGACTGGGCGGGACTGGGAATGGCGAACCCTCANATGCTGCATATAAACAGCTGCTCTCTGCTTGNACTGGGTCTCTCTGGTTANACCANATCANAACCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAANCCTCCATAAAGCTTGCCTT
A0427-Primer7 ATTGCANACTACNCACCAGGGCCAGGGATCAGATATCCACTGACCCTTGGATGGTGCTTCANGCTNGTGCCAGTTGAGCCAGGGAAGGTAGAAGAGGCCAATGAAGGAGAGAACTACGGCTTGCTACACCCTATGAGCCTGCATGGGATGGATGACCCGGAGAGAGAAGTGTTAGAGTGGAGGTTTGACAGCCGCCTGGCATTTCATCACGTGGCCCGAGAGCTGCATCCGGAGTACTTCAAGGACTGCTGACACCGAGCTTTCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGGAGGCGTGACCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTCTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCAGAGCCTGGGAGCTCTCTGGCTAGCTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTTAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATC
A0072-R02-Primer7 TNNNTNNNNACTACNCNCCAGGNNNNNNNNNNNNNAGATATCCACTGACCTTTGNATGGTGCTTCANGNNNNNNNNCNGNTAATCCAGAACAAGTAAAAAAGGCCAATAAAGGAAAGAACAACTGCTTGTTACACCCTATAAGCCTGCATAGAATGAAGGACTCAAAAGAAAAAGTGCTAATGTGGAAGTTTAACAGCCGCCTGGCATTTCACCACATAGCCAAAGAGCTACATCCGAAGTACTACAAGAACTAATAACACCAAGCTTTCTACAAGAGACTTTCCGCTGGGAACTTTCCAGGGGAGGCGTGGCCTGGGCGGGACTGGGGAGTGGCAAGCCCTCAAATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCGGGTCAGACCAGATCAGAGCCTGGAAGCTCTCTGGTTAACTAGGGAACCCACTGCTTAANCCTCNNNAAAGCTTGCCTTAAGTGCTTCNAGTAGTGTGTGCCCATCTGTTG
A0183-R02-Primer7 GNANANTACACACCAGGNCCAGGNATCAGATATCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTAAGCCAGAAGATGTAGAAGAGGCCAATACAGGAGAGAACAACAGCTTGTTACACCCTATGAGCCTGCATGGGATGGAAGACTCGGAGAAGGAAGTGTTACAGTGGAGGTTTGACAGCAAACTAGCCTTCCATCACGTGGCCCAAGAGCTGCATCCGGAGTTTTACAAGAACTGCTGACATCGAGCTTTCTACAAGGGACTTTCCGCCGGGGACTTTCCAGGGGAGGCGTGACCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTCGCTTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTANGGAT
A0192-R03-Primer7 TGGCAGANTTACACACCANGGGNCCANNNGATCAGATATCCACTGACCTTTGGATGGTGCTTCAAGCTGGTACCAGTTGAGAAAGAGGTGGTAGAAGAGGCCAATACGGGAGAGAACAACAGCTTGTTACACCCTATGAGCCTGCATGGAATGGAAGACCCGGAGGGGGAAGTGTTAGTGTGGAAGTTTGACAGCAAACTAGCATTTCATCACGTGGCCCGAGAGGTACATCCGGAGTACTACAAGAACTGCTGACATCGAGCTCTCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGGAGGCGCGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTAGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTGACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTA
A0426-Primer7 ANGGCAGACTACACACCAGGGCCAGGNACCAGATATCCAATAACCTTTGGATGGTGCTTCAAGTTAGTACCAGTGGATCAAGAGAAGGTGGAACAGGCCAACGAAGGAGAGAACAACTGCCTGCTACACCCTATGAGCCAGCATGGGATGGATGACCCAGAGAAAGAAGTGTTAATGTGGAAGTTTGACAGCAGCCTAGCATTTCATCACGTTGCCCGAGAGATGCATCCGGAGTACTATAAAGACTGCTGACACTGAGTTTCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGAAGGCGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAAATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTAGTTAAACCANATCTGANCCTGGGANCTCTCTGGCTAGCTAGGGAAC
In [51]:
# Display the first five result dicts to inspect their structure.
results[:5]
Out[51]:
[{'Name': u'A0109-R04-Primer7',
'QueryAA': u'XWQTTHQGQGSDIH*PLDGATS*YQLSQIR*KRPIKERTPACYTL*ACMEWMTLREKC*SGGLTAA*HFITWPESCIRSTSRTAX',
'QueryNuc': u'ATTGGCAGACTACACACCAGGGCCAGGGGTCAGATATCCACTGACCTTTGGATGGTGCTACAAGCTAGTACCAGTTGAGCCAGATAAGGTAGAAGAGGCCAATAAAGGAGAGAACACCAGCTTGTTACACCCTGTGAGCCTGCATGGAATGGATGACCCTGAGAGAGAAGTGTTAGAGTGGAGGTTTGACAGCCGCCTAGCATTTCATCACGTGGCCCGAGAGCTGCATCCGGAGTACTTCAAGAACTGCTG',
'QueryNucStart': 1,
'QueryNucStop': 253,
'RegionAAStart': 123,
'RegionAAStop': 207,
'RegionName': u'Nef',
'RegionNucStart': 368,
'RegionNucStop': 621},
{'Name': u'A0109-R04-Primer7',
'QueryAA': None,
'QueryNuc': u'ATTGGCAGACTACACACCAGGGCCAGGGGTCAGATATCCACTGACCTTTGGATGGTGCTACAAGCTAGTACCAGTTGAGCCAGATAAGGTAGAAGAGGCCAATAAAGGAGAGAACACCAGCTTGTTACACCCTGTGAGCCTGCATGGAATGGATGACCCTGAGAGAGAAGTGTTAGAGTGGAGGTTTGACAGCCGCCTAGCATTTCATCACGTGGCCCGAGAGCTGCATCCGGAGTACTTCAAGAACTGCTGACATCGAGCTTGCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGAGGCGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATTTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCT',
'QueryNucStart': 1,
'QueryNucStop': 504,
'RegionAAStart': None,
'RegionAAStop': None,
'RegionName': u'LTR3',
'RegionNucStart': 79,
'RegionNucStop': 583},
{'Name': u'A0109-R04-Primer7',
'QueryAA': None,
'QueryNuc': u'ATTGGCAGACTACACACCAGGGCCAGGGGTCAGATATCCACTGACCTTTGGATGGTGCTACAAGCTAGTACCAGTTGAGCCAGATAAGGTAGAAGAGGCCAATAAAGGAGAGAACACCAGCTTGTTACACCCTGTGAGCCTGCATGGAATGGATGACCCTGAGAGAGAAGTGTTAGAGTGGAGGTTTGACAGCCGCCTAGCATTTCATCACGTGGCCCGAGAGCTGCATCCGGAGTACTTCAAGAACTGCTGACATCGAGCTTGCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGAGGCGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATTTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCT',
'QueryNucStart': 1,
'QueryNucStop': 504,
'RegionAAStart': None,
'RegionAAStop': None,
'RegionName': u'LTR5',
'RegionNucStart': 79,
'RegionNucStop': 583},
{'Name': u'8-Primer7',
'QueryAA': u'XXQTTHQGXXSDTHCVLVGALS*YQLSQRM*KRPTKERTTACYTL*ACMGWRTRRKKC*CGGLTAA*HFITWPERSIRNTTRTAX',
'QueryNuc': u'ANGGCAGACTACACACCAGGGCNAGGNNTCAGATACCCACTGTGTTTTGGTTGGTGCTTTAAGCTAGTACCAGTTGAGCCAGAGGATGTAGAAAAGGCCAACGAAGGAGAGAACAACAGCCTGTTACACCCTATGAGCCTGCATGGGATGGAGGACACGGAGAAAGAAGTGTTAGTGTGGAGGTTTGACAGCCGCCTAGCATTTCATCACGTGGCCCGAGAGAAGCATCCGGAATACTACCAGAACTGCTG',
'QueryNucStart': 1,
'QueryNucStop': 252,
'RegionAAStart': 124,
'RegionAAStop': 207,
'RegionName': u'Nef',
'RegionNucStart': 369,
'RegionNucStop': 621},
{'Name': u'8-Primer7',
'QueryAA': None,
'QueryNuc': u'ANGGCAGACTACACACCAGGGCNAGGNNTCAGATACCCACTGTGTTTTGGTTGGTGCTTTAAGCTAGTACCAGTTGAGCCAGAGGATGTAGAAAAGGCCAACGAAGGAGAGAACAACAGCCTGTTACACCCTATGAGCCTGCATGGGATGGAGGACACGGAGAAAGAAGTGTTAGTGTGGAGGTTTGACAGCCGCCTAGCATTTCATCACGTGGCCCGAGAGAAGCATCCGGAATACTACCAGAACTGCTGACATCGAGATTGCTACAAGGGACTTTCCGCTGGGGACTTTCCACGGGGGTGGGGNCTGGGCGGGAATGGGGAATGGCNAACCC',
'QueryNucStart': 1,
'QueryNucStop': 335,
'RegionAAStart': None,
'RegionAAStop': None,
'RegionName': u'LTR3',
'RegionNucStart': 80,
'RegionNucStop': 415}]
In [ ]:
Content source: JudoWill/ResearchNotebooks
Similar notebooks: