In [1]:
from classy import *


Version:  0.0.15

In [2]:
sequence_data=bio.load_sequences('data/small sequence dataset.xlsx')


Target Column Found
Sequences
88 sequences of median length 288
Unique letters: [ 'MRKFNKPLLALLIGSTLCSAAQAAAPGKPTIAWGNTKFAIVEVDQAATAYNNLVKVKNAADVSVSWNLWNGDAGTTAKILLNGKEAWSGPSTGSSGTANFKVNKGGRYQMQVALCNADGCTASDATEIVVADTDGSHLAPLKEPLLEKNKPYKQNSGKVVGSYFVEWGVYGRNFTVDKIPAQNLTHLLYGFIPICGGNGINDSLKEIEGSFQALQRSCQGREDFKVSIHDPFAALQKAQKGVTAWDDPYKGNFGQLMALKQAHPDLKILPSIGGWTLSDPFFFMGDKVKRDRFVGSVKEFLQTWKFFDGVDIDWEFPGGKGANPNLGSPQDGETYVLLMKELRAMLDQLSAETGRKYELTSAISAGKDKIDKVAYNVAQNSMDHIFLMSYDFYGPFDLKNLGHQTALNAPAWKPDTAYTTVNGVNALLAQGVKPGKVVVGTAMYGRGWTGVNGYQNNIPFTGTATGPVKGTWKNGIVDYRQIAGQFMSGEWQYTYDATAEAPYVFKPSTGDLITFDDARSVQAKGKYVLDKQLGGLFSWEIDADNGDILNSMNASLGNSAGVQMSTRKAVIGYYFIPTNQINNYTETDTSVVPFPVSNITPAKAKQLTHINFSFLDINSNLECAWDPATNDAKARDVVNRLTALKAHNPSLRIMFSIGGWYYSNDLGVSHANYVNAVKTPAARTKFAQSCVRIMKDYGFDGVDIDWEYPQAAEVDGFIAALQEIRTLLNQQTIADGRQALPYQLTIAGAGGAFFLSRYYSKLAQIVAPLDYINLMTYDLAGPWEKITNHQAALFGDAAGPTFYNALREANLGWSWEELTRAFPSPFSLTVDAAVQQHLMMEGVPSAKIVMGVPFYGRAFKGVSGGNGGQYSSHSTPGEDPYPNADYWLVGCDECVRDKDPRIASYRQLEQMLQGNYGYQRLWNDKTKTPYLYHAQNGLFVTYDDAESFKYKAKYIKQQQLGGVMFWHLGQDNRNGDLLAALDRYFNAADYDDSQLDMGTGLRYTGVGPGNLPIMTAPAYVPGTTYAQGALVSYQGYVWQTKWGYITSAPGSDSAWLKVGRLAMLSFVKKSIALVAALQAVTALATPISSEAGVEKRGSGFANAVYFTNWGIYGRNFQPADLPASEITHVLYSFMNVRADGTIFSGDTYADYEKHYAGDSWNDVGTNAYGCVKQLYLLKKQNRNMKVMLSIGGWTWSTNFPAAASSAATRKTFAQSAVGFMKDWGFDGIDIDWEYPADATQAQNMVLLLQAVRSELDSYAAQYAKGHHFLLSIAAPAGPDNYNKLKFAELGKVLDYINLMAYDYAGSWSNYTGHDANIYANPQNPNATPYNTDDAVQAYINGGVPANKIVLGMPIYGRSFQQTEGIGKPYNGIGSGSWENGIWDYKALPKAGATVKCDDTAKGCYSYDPSTKELISFDTPAMISTKVSWLKGKGLGGTMFWEASASKKGSDSLISTSHQGLGSQDSTQNYLDYPNSKYDNIKKGMNMILNLIILLAISIVASASNIAAYWGQNAGGDQQTLGDYCSSSPASIIILSFLDGFPNLSLNFANQCSGTFSSGLAHCSQIGSDIKSCQQQGKTILLSLGGATGNYGFSSDSEAVQFAGTLWNKFGGGKDSERPFDDAIVDGFDFDIENKDQTGYAALATQLRKYFSTGTKSYYLSAAPQCPYPDESVGDLMSQVDLDFAFIQFYNNYCSLNQQFNWNSWSNYARGKSIKLYLGLPGSSSSAGSGFVGLSTVQRVVASIKGDSSFGGISIWDISSAENGGYLNQLYQALSGSGSPAAPSNSYQPNTPLTRTYGGSTATASAYISVGFTAGATHGSTTTNDLLAWIDSLFGSSQSSVQQYATPVQSVTATPQPVAATTTSAPKPTASAFNWFGWFDGTTTSTTLQTVYSTVPADQTVYVTLTTTVGSQMLQSLFDKRDVIAEAKSTNLQICWLLFIPLLALICSMAKRTQAILLLLLAISLIMSSSHVDGGGIAIYWGQNGNEGTLTQTCSTRKYSYVNIAFLNKFGNGQTPQINLAGHCNPAAGGCTIVSNGIRSCQIQGIKVMLSLGGGIGSYTLASQADAKNVADYLWNNFLGGKSSSRPLGDAVLDGIDFDIEHGSTLYWDDLARYLSAYSKQGKKVYLTAAPQCPFPDRYLGTALNTGLFDYVWVQFYNNPPCQYSSGNINNIINSWNRWTTSINAGKIFLGLPAAPEAAGSGYVPPDVLISRILPEIKKSPKYGGVMLWSKFYDDKNGYSSSILDSVLFLHSEECMTVLMTKLILLTGLVLILNLQLGSAYQLTCYFTNWAQYRPGLGRFMPDNIDPCLCTHLIYAFAGRQNNEITTIEWNDVTLYQAFNGLKNKNSQLKTLLAIGGWNFGTAPFTAMVSTPENRQTFITSVIKFLRQYEFDGLDFDWEYPGSRGSPPQDKHLFTVLVQEMREAFEQEAKQINKPRLMVTAAVAAGISNIQSGYEIPQLSQYLDYIHVMTYDLHGSWEGYTGENSPLYKYPTDTGSNAYLNVDYVMNYWKDNGAPAEKLIVGFPTYGHNFILSNPSNTGIGAPTSGAGPAGPYAKESGIWAYYEICTFLKNGATQGWDAPQEVPYAYQGNVWVGYDNIKSFDIKAQWLKHNKFGGAMVWAIDLDDFTGTFCNQGKFPLISTLKKALGLQSASCTAPAQPIEPITAAPSGSGNGSGSSSSGGSSGGSGFCAVRANGLYPVANNRNAFWHCVNGVTYQQNCQAGLVFDTSCDCCNWAMKKFINQFSASLKNNILVFLAFPFVWTSCARDNPLSSENSNISPNAAARAAVTGTTKANIKLFSFTEVNDTNPLNNLNFTLKNSGKPLVDMVVLFSANINYDAANDKVFVSNNPNVQHLLTNRAKYLKPLQDKGIKVILSILGNHDRSGIANLSTARAKAFAQELKNTCDLYNLDGVFFDDEYSAYQTPPPSGFVTPSNNAAARLAYETKQAMPNKLVTVYVYSRTSSFPTAVDGVNAGSYVDYAIHDYGGSYDLATNYPGLAKSGMVMSSQEFNQGRYATAQALRNIVTKGYGGHMIFAMDPNRSNFTSGQLPALKLIAKELYGDELVYSNTPYSKDWMKLNIFTKSMIGMGLVCSALPALAMEAWNNQQGGNKYQVIFDGKIYENAWWVSSTNCPGKAKANDATNPWRLKRTATAAEISQFGNTLSCEKSGSSSSSNSNTPASNTPANGGSATPAQGTVPSNSSVVAWNKQQGGQTWYVVFNGAVYKNAWWVASSNCPGDAKSNDASNPWRYVRAATATEISETSNPQSCTSAPQPSPDVKPAPDVKPAPDVQPAPADKSNDNYAVVAWKGQEGSSTWYVIYNGGIYKNAWWVGAANCPGDAKENDASNPWRYVRAATATEISQYGNPGSCSVKPDNNGGAVTPVDPTPETPVTPTPDNSEPSTPADSVNDYSLQAWSGQEGSEIYHVIFNGNVYKNAWWVGSKDCPRGTSAENSNNPWRLERTATAAELSQYGNPTTCEIDNGGVIVADGFQASKAYSADSIVDYNDAHYKTSVDQDAWGFVPGGDNPWKKYEPAKAWSASTVYVKGDRVVVDGQAYEALFWTQSDNPALVANQNATGSNSRPWKPLGKAQSYSNEELNNAPQFNPETLYASDTLIRFNGVNYISQSKVQKVSPSDSNPWRVFVDWTGTKERVGTPKKAWPKHVYAPYVDFTLNTIPDLAALAKNHNVNHFTLAFVVSKDANTCLPTWGTAYGMQNYAQYSKIKALREAGGDVMLSIGGANNAPLAASCKNVDDLMQHYYDIVDNLNLKVLDFDIEGTWVADQASIERRNLAVKKVQDKWKSEGKDIAIWYTLPILPTGLTPEGMNVLSDAKAKGVELAGVNVMTMDYGNAICQSANTEGQNIHGKCATSAIANLHSQLKGLHPNKSDAEIDAMMGTTPMVGVNDVQGEVFYLSDARLVMQDAQKRNLGMVGIWSIARDLPGGTNLSPEFHGLTKEQAPKYAFSEIFAPFTKQMSTPRAAASLAKKAALVALAVLAAALATAARAEQCGAQAGGARCPNCLCCSRWGWCGTTSDFCGDGCQSQCSGCGPTPTPTPPSPSDGVGSIVPRDLFERLLLHRNDGACPARGFYTYEAFLAAAAAFPAFGGTGNTETRKREVAAFLGQTSHETTGGWPTAPDGPFSWGYCFKQEQNPPSDYCQPSPEWPCAPGRKYYGRGPIQLSFNFNYGPAGRAIGVDLLSNPDLVATDATVSFKTALWFWMTPQGNKPSSHDVITGRWAPSPADAAAGRAPGYGVITNIVNGGLECGHGPDDRVANRIGFYQRYCGAFGIGTGGNLDCYNQRPFNSGSSVGLAEQMPPQKENHRTLNKMKTNLFLFLIFSLLLSLSSAEQCGRQAGGALCPNGLCCSEFGWCGNTEPYCKQPGCQSQCTPGGTPPGPTGDLSGIISSSQFDDMLKHRNDAACPARGFYTYNAFITAAKSFPGFGTTGDTATRKKEVAAFFGQTSHETTGGWATAPDGPYSWGYCFKQEQNPASDYCEPSATWPCASGKRYYGRGPMQLSWNYNYGLCGRAIGVDLLNNPDLVANDAVIAFKAAIWFWMTAQPPKPSCHAVIAGQWQPSDADRAAGRLPGYGVITNIINGGLECGRGQDGRVADRIGFYQRYCNIFGVNPGGNLDCYNQRSFVNGLLEAAIMRLCKFTALSSLLFSLLLLSASAEQCGSQAGGARCPSGLCCSKFGWCGNTNDYCGPGNCQSQCPGGPTPTPPTPPGGGDLGSIISSSMFDQMLKHRNDNACQGKGFYSYNAFINAARSFPGFGTSGDTTARKREIAAFFAQTSHETTGGWATAPDGPYAWGYCWLREQGSPGDYCTPSGQWPCAPGRKYFGRGPIQISHNYNYGPCGRAIGVDLLNNPDLVATDPVISFKSALWFWMTPQSPKPSCHDVIIGRWQPSAGDRAANRLPGFGVITNIINGGLECGRGTDSRVQDRIGFYRRYCSILGVSPGDNLDCGNQRSFGNGLLVDTMMRSLAVVVAVVATVAMAIGTARGSVSSIVSRAQFDRMLLHRNDGACQAKGFYTYDAFVAAAAAFPGFGTTGSADAQKREVAAFLAQTSHETTGGWATAPDGAFAWGYCFKQERGASSDYCTPSAQWPCAPGKRYYGRGPIQLSHNYNYGPAGRAIGVDLLANPDLVATDATVGFKTAIWFWMTAQPPKPSSHAVIAGQWSPSGADRAAGRVPGFGVITNIINGGIECGHGQDSRVADRIGFYKRYCDILGVGYGNNLDCYSQRPFAMGAFALFAVLAMAVTMAVAEQCGSQAGGATCPNCLCCSRFGWCGSTSDYCGDGCQSQCAGCGGGGTPVTPTPTPSGGGGVSSIVSRALFDRMLLHRNDGACQAKGFYTYDAFVAAAGAFPGFGTTGSTDTRKREVAAFLAQTSHETTGGWATAPDGAFAWGYCFKQERGATSNYCTPSAQWPCAPGKSYYGRGPIQLSHNYNYGPAGRAIGVDLLRNPDLVATDPTVSFKTAMWFWMTAQAPKPSSHAVITGQWSPSGTDRAAGRVPGFGVITNIVNGGIECGHGQDSRVADRIGFYKRYCDILRVGYGNNLDCYNQRPFAMRLSEFTTLFLLFSVLLLSASAEQCGSQAGGALCASGLCCSKFGWCGNTNEYCGPGNCQSQCPGGPGPSGDLGGVISNSMFDQMLNHRNDNACQGKNNFYSYNAFVTAAGSFPGFGTTGDITARKREIAAFLAQTSHETTGGWPTAPDGPYAWGYCFLREQGSPGDYCTPSSQWPCAPGRKYFGRGPIQISHNYNYGPCGRAIGVDLLNNPDLVATDPVISFKSAIWFWMTPQSPKPSCHDVITGRWQPSGADQAANRVPGFGVITNIINGGLECGHGSDSRVQDRIGFYRRYCGILGVSPGENLDCGNQRSFGNGLLVDIMQNCQCDTTIYCCSQHGYCGNSYDYCGPGCQAGPCWDPCEGDGTLTVSDIVTQEFWDGIASQAAANCPGKSFYTRSNFLEAVSAYPGFGTKCTDEDRKREIAAYFAHVTHETGHLCYIEERDGHANNYCQESQQYPCNPNKEYFGRGPMQLSWNYNYIDAGKELHFDGLNDPDIVGRDPIISFKTSLWFWIRKGVQYVILDPNQGFGATIRIINGGQECDGHNTAQMMARVGYYQEYCAQLGVSPGNNLPCMKKNRMMMMIWSVGVVWMLLLVGGSYGEQCGRQAGGALCPGGNCCSQFGWCGSTTDYCGPGCQSQCGGPSPAPTDLSALISRSTFDQMLKHRNDGACPAKGFYTYDAFIAAAKAYPSFGNTGDTATRKREIAAFLGQTSHETTGGWATAPDGPYAWGYCFVRERNPSTYCSATPQFPCAPGQQYYGRGPIQISWNYNYGQCGRAIGVDLLNKPDLVATDSVISFKSALWFWMTAQSPKPSSHDVITSRWTPSSADVAARRLPGYGTVTNIINGGLECGRGQDSRVQDRIGFFKRYCDLLGVGYGNNLDCYSQTPFGNSLLLSDLVTSQMRSLLILVLCFLPLAALGKVFGRCELAAAMKRHGLDNYRGYSLGNWVCAAKFESNFNTQATNRNTDGSTDYGILQINSRWWCNDGRTPGSRNLCNIPCSALLSSDITASVNCAKKIVSDGNGMNAWVAWRNRCKGTDVQAWIRGCRLMKALIVLGLVLLSVTVQGKVFERCELARTLKRLGMDGYRGISLANWMCLAKWESGYNTRATNYNAGDRSTDYGIFQINSRYWCNDGKTPGAVNACHLSCSALLQDNIADAVACAKRVVRDPQGIRAWVAWRNRCQNRDVRQYVQGCGVMKAFIVLVALACAAPAFGRTMDRCSLAREMSNLGVPRDQLNKWACIAEHESSYRTGVVGPENYNGSNDYGIFQINDYYWCAPPSGRFSYNECGLSCNALLTDDITHSVRCAQKVLSQQGWSAWSTWHYCSGWLPSIDDCFKIFSKCELARKLKSMGMDGFHGYSLANWVCMAEYESNFNTQAFNGRNSNGSSDYGIFQLNSKWWCKSNSHSSANACNIMCSKFLDDNIDDDIACAKRVVKDPNGMSAWVAWVKHCKGKDLSKYLASCNLMTKYVILLAVLAFALHCDAKRFTRCGLVQELRRLGFDETLMSNWVCLVENESGRFTDKIGKVNKNGSRDYGLFQINDKYWCSKGTTPGKDCNVTCNQLLTDDISVAATCAKKIYKRHKFDAWYGWKNHCQHGLPDISDCKVYDRCEFARILKKSGMDGYRGVSLANWVCLAKWESDFNTKAINRNVGSTDYGIFQINSRYWCNDGKTPKAVNACHISCKVLLDDDLSQDIECAKRVVRDPQGIKAWVAWRTHCQNKDVSQYIRGCKLMKAVIILGLVLLSVTVQGKIFERCELARTLKRLGLDGYRGISLANWVCLAKWESDYNTQATNYNPGDQSTDYGIFQINSHYWCNNGKTPGAVNACRISCNALLQDNIADAVTCAKRVVRDPQGIRAWVAWRNHCQNRDVSQYVQGCGVKIYEQCEAAREMKRLGLDGYDGYSLGDWVCTAKHESNFNTGATNYNRGDQSTDYGIFQINSRWWCNDGKTPNAKNACGIECSELLKADITAAVICAKRVVRDPNGMGAWVAWTKYCKGKDVSQWIKGCKLMSALWLLLGLLALMDLSESSNWGCYGNIQSLDTPGASCGIGRRHGLNYCGVRASERLAEIDMPYLLKYQPMMQTIGQKYCMDPAVIAGVLSRKSPGDKILVNMGDRTSMVQDPGSQAPTSWISESQVSQTTEVLTTRIKEIQRRFPTWTPDQYLRGGLCAYSGGAGYVRSSQDLSCDFCNDVLARAKYLKRHGFRTDCYGNVNRIDTTGASCKTAKPEGLSYCGVSASKKIAERDLQAMDRYKTIIKKVGEKLCVEPAVIAGIISRESHAGKVLKNGWGDRGNGFGLMQVDKRSHKPQGTWNGEVHITQGTTILINFIKTIQKKFPSWTKDQQLKGGISAYNAGAGNVRSYARMDIGTTHDDYANDVVARAQYYKQHGYMVPSVVFWGLIALVGTAKGSYTHSVHSMNPHVHPRLYHGCYGDIMTMETFGAPCDINNLMNCGIHGSEMFAEMDLKAIKPYRILIKEVGQRHCIDPALIAAIISRESHGGAVLQNGWDHKGQRFGLMQLDKNMYHPIGSWDSKEHLLQSVGILTERIKAMKRKFPTWNTAQQLKGGLTAFKSGMETIVTPADIDGDLVDDVLARAKFYKRHGFMGYGNIMNVETTGASWQTAQQDKLGYSGVRASHTMANTDSGRMERYRSKINSVGAKYGIDPALIAAIISEESRAGNVLHDGWGDYDSNRGAYNAWGLMQVDVNPNGGGHTARGAWDSEEHLSQGAEILVYFIGRIRNKFPGWNTEQQLKGGIAAYNMGDGNVHSYDNVDGRTTGGDYSNDVVARAQWYKTQKGFMPYGKIEDIKTSGASDVTAAQDGLKEGGWKSSHRMAEIDSNRMENYRTIINEAGRQCDVDPAVIAGIISRESRAGNQLINGWGDHGKAFGLMQIDVTPPPNGGGHTPVGTWDSLEHLIQATEILVEFIERIKTKFPRWNADQHLKGALAAYNKGEKNVESYASVDAKTTGKDYSNDVVARAQWYKSNMGFMKCLVALFLSLSLVACQYDDYDTERKNNNMLSSMNILDLLDSFGLNIKARIAHVRRVAGRIRLTLDIGLGNGDVERESEEAEGEGTDGRGGGEGEREGWGGEREGGEGEREGGEGEREGREGEREGKSSESNESPEDFIGPPVDMCAGESRRGSPSIGCIAAECCQHSFYINSLCPGSSVCCFSMDVCDRLPVPVIPPFPTDPGTLPPPPPIPDSQTTVSPNQPSSYMCHGDFMKLMPKGADQRTARQDNLAYAGVRASNKLVDNDLAELNKRKDCYVQAGKNHCIHPAVIAAIASRETRGGKLLYSTNGYGDGGRAYGIMQCDGGASGLGDICKKYPWDSCEHINQLTDIILLNYVNQMKTKHPSWPAHYQLKGGVSAYNAGVGNVQTIAGMDAGTTNDDYSNDVIARAQRLVNAHGWMLGKNDPMCLVLVLLGLTALLGICQGGTGCYGSVSRIDTTGASCRTAKPEGLSYCGVRASRTIAERDLGSMNKYKVLIKRVGEALCIEPAVIAGIISRESHAGKILKNGWGDRGNGFGLMQVDKRYHKIEGTWNGEAHIRQGTRILIDMVKKIQRKFPRWTRDQQLKGGISAYNAGVGNVRSYERMDIGTLHDDYSNDVVARAQYFKQHGYMHLMLVLLGLAALLGTSQSRTGCYGDVNRVDTTGASCKSAKPEKLNYCGVAASRKIAERDLQSMDRYKALIKKVGQKLCVDPAVIAGIISRESHAGKALRNGWGDNGNGFGLMQVDRRSHKPVGEWNGERHLMQGTEILISMIKAIQKKFPRWTKEQQLKGGISAYNAGPGNVRSYERMDIGTTHDDYANDVVARAQYYKQHGYMNIFEMLRIDEGLRLKIYKDTEGYYTIGIGHLLTKSPSLNAAKSELDKAIGRNCNGVITKDEAEKLFNQDVDAAVRGILRNAKLKPVYDSLDAVRRCALINMVFQMGETGVAGFTNSLRMLQQKRWDEAAVNLAKSRWYNQTPNRAKRVITTFRTGTWDAYKNLMEMISNNLNWFVGVVEDRMDPLKLGRVRVRVVGLHPPQRAQGDVMGIPTEKLPWMSVIQPITSAAMSGIGGSVTGPVEGTRVYGHFLDKWKTNGIVLGTYGGIVREKPNRLEGFSDPTGQYPRRLGNDTNVLNQGGEVGYDSSSNVIQDSNLDTAINPDDRPLSEIPTDDNPNMSMAEMLRRDEGLRLKVYWDTEGYPTIGIGHLIMKQPVRDMAQINKVLSKQVGREITGNPGSITMEEATTLFERDLADMQRDIKSHSKVGPVWQAVNRSRQMALENMAFQMGVGGVAKFNTMLTAMLAGDWEKAYKAGRDSLWYQQTKGRASRVTMIILTGNLESYGVEVKTPARSLSAMAATVAKSSDPADPPIPNDSRILFKEPVSSYKGEYPYVHTMETESGHIQEFDDTPGQERYRLVHPTGTYEEVSPSGRRTRKTVDNLYDITNADGNFLVAGDKKTNVGGSEIYYNMDNRLHQIDGSNTIFVRGDETKTVEGNGTILVKGNVTIIVEGNADITVKGDATTLVEGNQTNTVNGNLSWKVAGTVDWDVGGDWTEKMASMSSISSGQYTIDGSRIDIGMPPSLRKAVAAAIGGGAIAIASVLITGPSGNDGLEGVSYIPYKDIVGVWTVCHGHTGKDIMLGKTYTKAECKALLNKDLATVARQINPYIKVDIPETTRGALYSFVYNVGAGNFRTSTLLRKINQGDIKGACDQLRRWTYAGGKQWKGLMTRREIEREVCLWGQQMVEINNQRKAFLDMLAWSEGTDNGRQKTRNHGYDVIVGGELFTDYSDHPRKLVTLNPKLKSTGAGRYQLLSRWWDAYRKQLGLKDFSPKSQDAVALQQIKERGALPMIDRGDIRQAIDRCSNIWASLPGAGYGQFEHKADSLIAKFKEAGGTVREIDVMKGKTAAGGGAICAIAVMITIVMGNGNVRTNQAGLELIGNAEGCRRDPYMCPAGVWTDGIGNTHGVTPGVRKTDQQIAADWEKNILIAERCINQHFRGKDMPDNAFSAMTSAAFNMGCNSLRTYYSKARGMRVETSIHKWAQKGEWVNMCNHLPDFVNSNGVPLRGLKIRREKERQLCLTGLVNEMMQISSNGITRLKREEGERLKAYSDSRGIPTIGVGHTGKVDGNSVASGMTITAEKSSELLKEDLQWVEDAISSLVRVPLNQNQYDALCSLIFNIGKSAFAGSTVLRQLNLKNYQAAADAFLLWKKAGKDPDILLPRRRRERALFLSMQISQAGINLIKSFEGLQLKAYKAVPTEKHYTIGYGHYGSDVSPRQVITAKQAEDMLRDDVQAFVDGVNKALKVSVTQNQFDALVSFAYNVGLGAFRSSSLLEYLNEGRTALAAAEFPKWNKSGGKVYQGLINRRAQEQALFNSGTPKNVSRGTSSTKTTPKYKVKSGDNLTKIAKKHNTTVATLLKLNPSIKDPNMIRVGQTINVTGSGGKTHKVKSGDTLSKIAVDNKTTVSRLMSLNPEITNPNHIKVGQTIRLSMKVSQNGLNLIKEFEGCRLTAYKPVPWEQMYTIGWGHYGVTAGTTWTQAQADSQLEIDINNKYAPMVDAYVKGKANQNEFDALVSLAYNCGNVFVADGWAPFSHAYCASMIPKYRNAGGQVLQGLVRRRQAELNLFNKPVSSNSNQNNQTGGMIKMYLIIGLDNSGKAKHWYVSDGVSVRHVRTIRMLENYQNKWAKLNLPVDTMFIAEIEAEFGRKIDMASGEVKMVKKNDLFVDVSSHNGYDITGILEQMGTTNTIIKISESTTYLNPCLSAQVEQSNPIGFYHFARFGGDVAEAEREAQFFLDNVPMQVKYLVLDYEDDPSGDAQANTNACLRFMQMIADAGYKPIYYSYKPFTHDNVDYQQILAQFPNSLWIAGYGLNDGTANFEYFPSMDGIRWWQYSSNPFDKNIVLLDDEEDDKPKTAGTWKQDSKGWWFRRNNGSFPYNKWEKIGGVWYYFDSKGYCLTSEWLKDNEKWYYLKDNGAMATGWVLVGSEWYYMDDSGAMVTGWVKYKNNWYYMTNERGNMVSNEFIKSGKGWYFMNTNGELADNPSFTKEPDGLITVATVQGFDISSYQPSVNFAGAYSAGARFVIIKATEGTSYTNPSFSSQYNGATTATGNYFIRGGYHFAHPGETTGAAQADYFIAHGGGWSGDGITLPGMLDLESEGSNPACWGLSAASMVAWIKAFSDRYHAVTGRYPMLYTNPSWWSSCTGNSNAFVNTNPLVLANRYASAPGTIPGGWPYQTIWQNSDAYAYGGSNNFINGSIDNLKKLATGMKGIDIYSGQGSVDFNAVKESGVEVVYIKATEGLTYTDSTYKDFYDGAKNAGLKIGFYHYLRANDPTSEAEHFFNTISGLSLDCKCAIDVEVTLGQSIDQISSNVRKFADYLINKGLDVCVYTYTNFYKDNLNSTVKDLPLWIAEYGVSKPNIDASYVGFQYSDSGSVNGISGSADLDEFSEGILVGGTVVIDPGQGGDDNIKAIQQDLNILLKRGLEVDGIEGPETEAAIKDFQSIMGLTVDGIWGTNTSGAAQQIFSRPLDGVAYPHYEYATRYIQYRVGASVDGTFGSGTKAKVAAWQSNQGLMADGVVGSATWSKLLDENKLGIDVSQPTSTSSFTCLRNKGFTTMVIVRAWKSTGSFDTNAPQTLKNANAAGFSIENSDVYYYPCISCGNMAGQVRTFWQKVGQYSLKVKRVWFDIEGTWTSSVSTNQNYLMQMMNEARAIGIVHGIYGSKYYWGNLFGSSYKYRYRSSTPLWYPHYDNSPSFSDFSSFGGWTSPSMKQYRGDVSVCSAGVDYNYKPMPAYSSLARRGRRPAVVLLGGLVSASLALTLAPTAAAAPLAPPPGKDVGPGEAYMGVGTRIEQGLGAGPDERTIGPADTSGVQGIDVSHWQGSINWSSVKSAGMSFAYIKATEGTNYKDDRFSANYTNAYNAGIIRGAYHFARPNASSGTAQADYFASNGGGWSRDNRTLPGVLDIEHNPSGAMCYGLSTTQMRTWINDFHARYKARTTRDVVIYTTASWWNTCTGSWNGMAAKSPFWVAHWGVSAPTVPSGFPTWTFWQYSATGRVGGVSGDVDRNKFNGSAARLLALANNTAMTKTYGVDVAVYQPIDLAAYHKAGASFAIVKLTEGVDYVNRRGPSRWTAPGLTTSTLMPTISRSFGSSVSRAKKEAAYFLKEAKKQDISKKRMLWLDWEAGSGNVVTGSKSSNTAAILDFMDAIKAAGWRPGLYSGASLMRTAIDTKQVVKKYGTCLWVASYPTMAAVSTADFGYFRQWTGSPSGSLPVTAWPGRRRERCSGMQLRITSRKKLTSLLCALGLISIVAIYPRQTVNFFYSTAVQITDYIHFYGYRPVKSFAIRIPASYTIHGIDVSRWQERIDWQRVAKMRDNGIRLQFAFIKATEGEKLVDPYFSRNWQLSRENGLLRGAYHYFSPSVSASVQARLFLQTVDFSQGDFPAVLDVEERGKLSAKELRKRVSQWLKMVEKSTGKKPIIYSGAVFYHTNLAGYFNEYPWWVAHYYQRRPDNDGMAWRFWQHSDRGQVDGINGPVDFNVFNGTVEELQAFVDGIKETPMRFIALLISFFALLKVISAISGVDISSASTIESFTCLKSAGYDFAIIRAYESLGQVDPNGPHSVYNARDAGIEYVDVYMFPCPTCGNGAGQAETMVNYLKGYNANYGMVWLDIEGPQYWMSQSENVAFFESLVAGLKAEGAHIGVYTSASQWEPIMGGYTGGSEFPLWYAHYDGNPSFSDFSPFNGWSTPSVKQYDDTGDSCGLGFDLNWYPMHCAPSWKSSDERRTMLDQINTLDPNSLTALKRMSKDNSPAAIKGAAQQFEALFLQNMLKSMRDATVTSDAMGSETTRFYQGLYDQQLAAMMAQRGGIGLADVMEKQMGAQAASAQNAAAAGASSAGNVPLSLDAARAAAAHTASGDKVPTTPQAFVDATWPQAAKAAQSLGVPAHFLVAQAALETGWGKSQIRNKDGTPSYNLFNIKAGSNWTGKVVEARTVEYENGQRKVRVERFRAYDSYEQAFQDYADLVGNSPRYAKVAGKTDGHAFARALQEGGYATDPSYADKLARVINGNALRQRLMASAASARGMINKKWMKIVMIPMLVVPMYGLTSVSGQIQDSLTGENSFVKDAEAATTASQQAFIDKIAPAAQASQEQYHLLSSITLAQAILESGWGKSGLATKGYNLFGIKGKYNGQSVIMSTSEYVNGQWIKIDAEFRKYPSWNESVTDHTLLLVNGTSWNKNLYKKVVDATDYKVAAMELQKAGYASPTYGASLIQVIENYDLAKYDVLYDKILTQKSTSGKATVTSPTGNGVWTLPYKVKGVQSVSPASTYANKDIDLVSVATTKRGTYYQFKYNGKVVGWVDAKALTIYDSVNYDKVNVGRAKITSPVSNGIWSKPYNVYGREFVTNATTYAQQEIKLLREAQTAKGTYYQFSINNKTIGWIDKRALTIYPYDSIVSSKNVSLDGQITNPTGNGIWTKAYKLEGTTSVAQATKYANKDVKISQQVETQHGTYYNISIDGKAIGWLDKNAITLYDQAEYNKTVAFDAAIRNVQGNAVWTEPYRTVGTKLIGPAETYLNKEVEVVREAKTPKGTYYQFKSGGKVIGWLDKKAFEVYDNINYNKAVNLDAVVENVTGNAVWTAPYKSKGVKLVTSAATYKGKATKITREAQTSRGTYYEFSVNGKVIGWLDKKAFDVYDSIEYNKAINMTGLLSNAPGNGIWTEPYRVLDTKNIGQATAYANKTVQLVREAKTSHSTYYQMSLNGKVIGWIDKRAFTNVKMVNTQVKRVKKQKFIAGTALLLGMATFGMVGKADDLSSSNTNGGVDNSKVDNDNQESVKTSTEGVSSTTENANTVPESKVTSTVDSESAPSKTISAGTQSNISGTSDGSDSLPKTETSDSSSKPSTSNSSSKPSTSNSSSKPSTSNSSSNNNSATKPSTTTQAPPVAPSTTAPSATPSTTAPSNYYQNSSYNQTSTAAQIPNSSSDSAASVYSGPVLKKIEAAKPIEKIDSSSTEAFIKSIADRVRILAGKNNLYASIILAQAILESGSGQSNMTQQYFNIFNITGAYLGKSISFKTEEFSGNNPYYIEQSFRVYSNYDQALDDYINLMIKGTTWNSEIYAGAWKSHAKTYQEAAQALQGIFATDPEYAQKLIEIIEEYNLNFYDNVDSTTQVLDSNIPESPLVASKLDSSTYPDYNGVEYPGADSYAFGNCTQYVYNRIIQLGGQIGTHMGNGGEWGINAQAQGYFTTTVPTEGYAVSFPPGVAGSSPEYGHVAFVEKVYPDNSILVSEMNVKGNNIVSERHISAGVAALATYIQPKMNRNRLSCLIVGAVIGAGAIVCTTNTKVHAKPVNEVKNINTSKGNSFGEIISSEDIGLRKGADSSHEIITSIPSGARVNIIDKMSKDWYKVSYKDFTGYLQAKDIRVLGDELNQDNVGLISANQLNVRTSPNENGQVIGTLHKNDKVNVLDKSIDGWYKIDFNGRRAYVSSKYVNLISYKNNEVKTEVKKEPIEGTGKVNINTALNVRQASTTNSRIIGSLKGGEKVNIISESNGFYKIEFNNSYGYVYSKYISKDGDSEKVQVVKQEEVKKEKVDESKKEAKATPKAEPVVLAVRSLNKTGIVNVSSSLNVREGAGTSSKVIGSLSGNTKVTIVGEEGAFYKIEYKGSHGYVAKEYVKDVTESSNSNQGTQTPEKPSTPESTEKTGIVNVSSSLNVREGASTSSKVIGSLSGNTKVIIVGEEGAFYKIEYKGSHGYVAKEYIKDVTESNNSNQGTQTPEKPSTPESTEKTGIVNVSSSLNVREGASTSSKVIGSLSGNTKVTIVGEEGAFYKIEYKGSHGYVAKEYIKDIKDEVVTEPEKPSAPENTEKTGVVNVSSSLNVREGASTSSKVIGSLSGNTKVIIVGEEGAFYKIEYKGSHGYVAKEYIKDVTESNNSNQGTQTPEKPSTPESTEKTGIVNVSSSLNVREGASTSSKVIGSLSGNTKVTIVGEEGAFYKIEYKGSHGYVAKEYVKDVTESNNSNQGTQTPEKPSTPESAEKTGVVNVSSSLNVREGASTSSKVIGSLSGNTKITIVGEEGAFYKIEYKGSHGYVAKEYIKDIKDEVVTEPEKPSTHENSKKTGVVTASKGLNVRKEANTSSQIIGILNSGESVEIIGEENGFYKITYKGQEAYASKNYINIFDGNSNVNPGLDIGNASKTNYGVSLNEYIKLQQRNNPSNYSYSEFEKYINPAKATNKLQFLRIDKFRSVNVSGLSSRLSNKGVLTGQGQAFVNAAKAFNIDPIYLVAQCLHETGNGTSKLAKGVTITEIADESKPIYNGNGQLVGYHMIKLSKPVTVYNLFGIGAKDNSSVFPNRALILGTTYAYNRGWTSIENAIKGAAEFVSLNYVHSSRYSQNTLYKMRYNQNVSNIWHQYATTPWYASSIADIMRSYQDLYLENNFTFDVPVFAGMKKESMSRIERRKAQQRKKTPVQWKKSTTLFSSALIVSSVGTPVALLPVTAEATEEQPTNAEVAQAPTTETGLVETPTTETTPGTTEQPTTDSSTTTESTTESSKETPTTPSTEQPTADSTTPVESGTTDSSVAEITPVAPSATESEAAPAVTPDDEVKVPEARVASAQTFSALSPTQSPSEFIAELARCAQPIAQANDLYASVMMAQAIVESGWGASTLSKAPNYNLFGIKGSYNGQSVYMDTWEYLNGKWLVKKEPFRKYPSYMESFQDNAHVLKTTSFQAGVYYYAGAWKSNTSSYRDATAWLTGRYATDPSYNAKLNNVITAYNLTQYDTPSSGGNTGGGTVNPGTGGSNNQSGTNTYYTVKSGDTLNKIAAQYGVSVANLRSWNGISGDLIFVGQKLIVKKGASGNTGGSGSGGSNNNQSGTNTYYTVKSGDTLNKIAAQYGVSVANLRSWNGISGDLIFVGQKLIVKKGASGNTGGSNNGGSNNNQSGTNTYYTIKSGDTLNKIAAQYGVSVANLRSWNGISGDLIFAGQKIIVKKGTSGNTGGSSNGGSNNNQSGTNTYYTIKSGDTLNKISAQFGVSVANLQAWNNISGSLIFAGQKIIVKKGANSGSTNTNKPTNNGGGATTSYTIKSGDTLNKISAQFGVSVANLRSWNGIKGDLIFAGQTIIVKKGASAGGNASSTNSASGKRHTVKSGDSLWGLSMQYGISIQKIKQLNGLSGDTIYIGQTLKVGMKKRLIAPMLLSAASLAFFAMSGSAQAAAYTDYSLYKVEPSNTFSTESQASQAVAKLEKDTGWDASYQASGTTTTYQISASGIHSESEAKAILSGLAKQTSITGTSSPVGSKQPYVTISSGAISGEKQANTILAKLKQETGVAGAVKAYGAAQPYMNVMTSDIADETKVKALIQSLAKQTGIKSSYQPITHTVSVTTIQSGTIVGDSRAAQIKNAFQKESGLQASLKETVKGQAYYTFTTAAISGEANAKTLLQQLKQSTGITGSYKSINQKTTVESYNVQSAYFKGLSTVKDAISQIKKNTGVSGSYQQVGKSTSYTVNMKGITKQQLQKIDTFFKKKKWHYTSSSVKKTTTSAAYQITTAKILGEQQANKAAAFFAQKKVKAAKTAAGSTAENQYQLISEETSDQAKVTKGLNILKKNQLSASAKSVKKQIADTFKITTESLLDQTKVNQALTFFKSNHISVASQKTGQTAASSYQITTEAIISQEEIDRVLTFFKQNHIAVTTSKTGQTAYTQYKIVTTQLSSKTALNNGLTYLKSKSVTPSYTTKSNTLYKISVNEQFTGNDTAAAASTKLKQLYGWTSSIVKIKNGPQIMKTNYNLSLRDMVQKQMTVSPQTDGAAYVSLTYINTATSTVTADVLNIRSTPEVSPTNVIGQFKKGDKVKVIGQINGWAKINLGWRNASSDEVVQYVDPNNFSRDSKYYFQFLKLSQTAGLSVTEVNQKVLAGKGILTGRAKAFIDAANQYSINELYLISHALLETGNGTSALANGLTYNGKTVYNMYGIGAYDSNPNYYGAKYAYEQGWFTPEAAIIGGAKFIGSSYIHNTAYNQDTLYKMRWSATATHQYATDIGWAYKQVNRMYSLYSLLDGYTLYFDVPEYRMARKKLKKRKLLISLFFLVSIPLALFVLATTLSKPIEISKETEEIDEQQVFIDSLSGHAQILYEKYHVLPSITIAQAILESDWGNSELAAKANNLFGVKGNYKGHHVTMETDEVEKGKRKTIRAKFRKYSTFFESMDDHAQLFVRGTSWNKKKYKPVLEAGNYKEAATALQTSGYATDPDYADKISAIVEKYDLDEYDEVNPSLKSVDLNASIKDSAVQDVWSKPSTDDRSIRLTSAQSYVGKDIKVVSKKQKGQSVWYQFQINDKLIGWIDDSAVEIKEATMARKLIKNLGKSKSVKRVKLLFKKIFITVFIVASIVAIFNITKYFEELYKVRDLKSTKIEYYMDVADEAGDGKVQLSWKALLAIDMVIHDEDLSNIKKKDTLDIGEKFIVEDKNDKGEKVYKVKKFNKVLSELKFDSSQKSRARKYMKDLEYTYLGNKQLDSSDEKIKFIKKLEDSAIREYIDYGILPSITIGQAILESGWGNSKLTKQSNNLFGIKADKAWKGKSVEISTSEHYNEKIVASFRSYNSLQDSVKDHSLFLINNKRYRKHGLFEAKDYISQAQALENAGYSTAEDKKGNRIYAELLIDVIRSYNLQLIDNKVETKMFFLTLPLLLGCTAATTPLTAATPPVDPLPLKVVSTDQLPKGLAKDQQLWNKVNGQKGDYKALLTAIDHSLEYLGTDKAQKDYQDYKVPGITRDRVSRSLRRFRQLVVQAKSPQALETAVKKEFQFYQSIGNDQKGNVDFTGYYEATYPASRQPTTEFRYPLYQAPADLKAWPKPHPTRAELEGADGLQASQGPLKGLELVWLRDRIQAFLVQVQGSARLGLTDGTEMTVGYAGKTAHPYTSIGKALIADGKFTLEELSLPVVLQYFEENPQDLDLYIPKNKSFVFFQETFGSPPMGNLNVPVTDERSIATDKSLMPPGALALIQTNLPYYNASQTLEFKDVSRFVLDHDTGSAIKGPGRVDIFMGTGAKAKERAGVMTGSGQLYYLLLKDNMNTPFSIDEVSFRDLPGWGQDDPRKLFPAMATILSHLRNAKPYRTGALGITAAELVSLLELAERGQVNSPEQARQFFETNSVPFRISPAQGKSGFVTAFYEPELEVSATPDDVWRYPIYRRPPELVDIDNDNRPDGFDPSYAFGKADEEGISYFPDRRAIDEGCLRGRGLEIAWARSKVDLFFVHVQGAARLVFPDGAIKRITYAAKAGHVFSPIGRLLLDRGELDPKTISMQTIRQWLADHPDEVDGVLWHNRSYIFFREADVAGLDMGPIAAAKVPLVAGRALAVDRLIHTFGLPFFIHAPTLTHLDDGKPFARLMLALDTGSAIVGPARGDIFTGSGFEAGELAGTVRNEADFYILLPRIAAERYRRMRKIQVAVFLFVGLLAACSTVPPSSAPTTCAQCQPCPACPAVTPAITPAPAPAFSRSLLPASWGDLPGWAEDDVTAAWPAFMQSCRGIASRGNAAGWRRVCELARAADGKPENDVRRFFERHLKPYAIVNGDGLVSGLVTGYYEPMLRGSRTKAKGYEQPVRGVPDDLLTIDLSAVFPELKDKRVRGRLEGNKVVPYWSRAEIAARGDKLPGKTLLYVDDAVELFFLQVQGSGRVKLADGGMVRLNYADQNGYQYQSIGKALVERGELKLEEASMQGIQAWARANPARLESLLNTNPSYVFFREVANSADGPVGALGVPLTAERSIAIDPRSVPLGSPVFLATTRPNSAVPLNRLVMAQDTGGAIKGGVRADFFWGFGKEAGDQAGRMKQSGRMWILLPTELAPKMKGRWVKYLLMGTVVAMLAACSSKPTDRGQQYKDGKFTQPFSLVNQPDAVGAPINAGDFAEQINHIRNSSPRLYGNQSNVYNAVQEWLRAGGDTRNMRQFGIDAWQMEGADNYGNVQFTGYYTPVIQARHTRQGEFQYPIYRMPPKRGRLPSRAEIYAGALSDKYILAYSNSLMDNFIMDVQGSGYIDFGDGSPLNFFSYAGKNGHAYRSIGKVLIDRGEVKKEDMSMQAIRHWGETHSEAEVRELLEQNPSFVFFKPQSFAPVKGASAVPLVGRASVASDRSIIPPGTTLLAEVPLLDNNGKFNGQYELRLMVALDVGGAIKGQHFDIYQGIGPEAGHRAGWYNHYGRVWVLKTAPGAGNVFSGMKKYLFRAALCGIAAAILAACQSKSIQTFPQPDTSVINGPDRPVGIPDPAGTTVGGGGAVYTVVPHLSLPHWAAQDFAKSLQSFRLGCANLKNRQGWQDVCAQAFQTPVHSVQAKQFFERYFTPWQVAGNGSLAGTVTGYYEPVLKGDDRRTAQARFPIYGIPDDFISVPLPAGLRSGKALVRIRQTGKNSGTIDNTGGTHTADLSQFPITARTTAIKGRFEGSRFLPYHTRNQINGGALDGKAPILGYAEDPVELFFMHIQGSGRLKTPSGKYIRIGYADKNEHPYVSIGRYMADKGYLKLGQTSMQGIKAYMQQNPQRLAEVLGQNPSYIFFRELTGSSNDGPVGALGTPLMGEYAGAVDRHYITLGAPLFVATAHPVTRKALNRLIMAQDTGSAIKGAVRVDYFWGYGDEAGELAGKQKTTGYVWQLLPNGMKPEYRPMKFPFHPWRRLLLCALPFAALLTACDDGKKEPPPTPAEVTTYNSVPWDALPATSDADLLAGFNAWRSACARLAKDPVWGEPCASATTVAADPTAVRAFLQERMQVYSLRSSSNGDQGLITGYYEPVYHGSLSQGEKTPVPVYGVPDDLVVVALESVYPELKGKRLRGRLEGRVLKPYDDAATIRDNGSSAPVLAWLGDPMDLQFLQIQGSGRIQLEDGRQLRIGYGDQNGHPYKPVGRWLVEQGLVPKEEISMKRIRDWAEANPQRVSELLASNPSFVFFSLRPDSDEGPRGSLNVPLTDGYSVAIDRKVIPLGSLMWLSTTRPDDGSAVVRPVAAQDTGGAIVGEVRADLFWGTGDAAGELAGHMKQPGRLWLLWPKGAPLPASMGAMNGTSGRRLSTATRVAAMAGVLLLAACGGPSSRPGLVSRPAGVAGPVSYQRVAIEGLPGWSTDRVADALPVFRRSCERLRAVSPNSMVGPSVWGSRASDWQAACAVAARLPAFDDDAARRFFAERFQAWQVTGAGDPTGLFTGYYEAALDGSLSPSAVYSTPIYGVPLDLRMEGGKGMRVSGGRSLPYPDRAAIEEGAISGVAPVIMWARDPVDVFMLHIQGSGQVRLPDGRIQRIGYAANNGHPFVGIGAIMRDRGLGDGSSMIAIRAWLRANPAEGRALMRENPRFIFFRPIEGEGPIGAQGLPLTGGRSLAVDPSSVPLGAPVWLATSDAHGETVNRLMVAQDTGSAIKGAVRGDFFWGSGEEALYHAGGMKSAGRYWVLVPRGGRNAVAQNMKGRWAKYVATGVMLAMLAACSSKPTDRGQQYKDGKFTQPFSLVNQPDAVGAPINAGDFAEQVNQIRSASPRLYTNQSNVYNAVQNWLRSGGDTRTMRQFGIDAWQMEGTDNYGNVQFTGYYTPVVQARHTRQGAFQYPIYSMPPKRGRLPSRAQIYAGALSDKYILAWSNSLMDNFIMDVQGSGYIDFGDGSPLNFFSYAGKNGWPYRSIGKVLIDRGEVKKEDMSMQAIREWGEKHSEAEVRELLEQNPSFVFFKPQSFAPVKGASAVPLIGRASVASDRSIIPPGTTLLAEVPLLDNNGKFSGQYELRLMVALDVGGAIKGQHFDIYQGIGPDAGHRAGWYNHYGRVWVLKSAPGAGNVFSGMFKRRYVTLLPLFVLLAACSSKPKPTETDTTTGTPSGGFLLEPQHNVMQMGGDFANNPNAQQFIDKMVNKHGFDRQQLQEILSQAKRLDSVLRLMDNQAPTTSVKPPSGPNGAWLRYRKKFITPDNVQNGVVFWNQYEDALNRAWQVYGVPPEIIVGIIGVETRWGRVMGKTRILDALATLSFNYPRRAEYFSGELETFLLMARDEQDDPLNLKGSFAGAMGYGQFMPSSYKQYAVDFSGDGHINLWDPVDAIGSVANYFKAHGWVKGDQVAVMANGQAPGLPNGFKTKYSISQLAAAGLTPQQPLGNHQQASLLRLDVGTGYQYWYGLPNFYTITRYNHSTHYAMAVWQLGQAVALARVQMFALTAYRLRCAAWLLATGIFLLLAGCSEAKAPTALERVQKEGVLRVITRNSPATYFQDRNGETGFEYELAKRFAERLGVELKIETADNLDDLYAQLSREGGPALAAAGLTPGREDDASVRYSHTYLDVTPQIIYRNGQQRPTRPEDLVGKRIMVLKGSSHAEQLAELKKQYPELKYEESDAVEVVDLLRMVDVGDIDLTLVDSNELAMNQVYFPNVRVAFDFGEARGLAWALPGGDDDSLMNEVNAFLDQAKKEGLLQRLKDRYYGHVDVLGYVGAYTFAQHLQQRLPRYESHFKQSGKQLDTDWRLLAAIGYQESLWQPGATSKTGVRGLMMLTNRTAQAMGVSNRLDPKQSIQGGSKYFVQIRSELPESIKEPDRSWFALAAYNIGGAHLEDARKMAEKEGLNPNKWLDVKKMLPRLAQKQWYAKTRYGYARGGETVHFVQNVRRYYDILTWVTQPQMEGSQIAESGLHLPGVNKTRPEEDSGDEKLMIGADTAKECDAMTFKLLPLAVLCAALVGCQSAQSRDARAESPATAESAAPTAEAPVSEAQEADFETWLANFRRQARGEGIDEATLARALDGLRYRPRVIELDGSQPEFVRPIWEYLDSAVSASRVKKGRERLAEYRDTVRQMTERYGVPGEVLVAIWGIESSYGDYLGDFSTLEALATLAYDGRRRDFARGELLAALRIIEAGDISPERMKGSWAGAMGHTQFIPSSFLAHAVDGDGDGRRDIWNSIADVLASTANYLDEAGWREGEPWGTEVSLPQGFDYTLTEPDIRRSSAEWAAAGVRSRDGHALPDFASASVIAPAGAQGPVFLVGHNFRVILRYNNATSYALAVATLSDAIAGRAGIQGEWPREQPALKRSEVREMQQLLDARGFDVGTPDGILGPNTRRGLRAFQREIGVTPDGFATKALLERLRRMPGLPRARMAQWHPLYSVRLAKDTMTDTQRSLRRPLLGAALSAAALGLCGLSPSLLAAGKRRVSLREEEIEPGRYRDNPQARAFIDEMVARHGFDRGMLQDWFGQAVYSATVVRLIMPPATTGRKSWRTYRSRFIEPIRINAGVRFWQDNRDTLRRAEAEFGVPASVIVGIIGVETIYGRDMGSFRVLDSLSTLAFDYPATPNREARSTLFRNQLADYLLWCRDTRTDVYSVLGSYAGAIGIPQFMPTSLREYALDYDNNGHIDLRNSPTDAIGSVARFLQLHGWEPGRPVVWRIAPDDGSLGVATAAADGEPWPTRTLNQLTRAGLRVDEPINLAREGETGVLVVDLPTPDQPTEYLLGLRNFYVLTRYNRSFFYALAVYQLGEAVKAAMGMFGILNRREMLRGTAATLLLPGILTSAHAGQVAEDPLLRYPWLAQWAGADGLDAPWLRGVFQNLKKYPRVIRAMNHQAEAKPFYLYREHVTSPWLYKKGREAWQQHRAMLEAAGARYGVDAPFVLALWGMESRFGRNQGEHPVLRTLFTLAVDYPRRQTFFRQELRHFLILCRQQGWDPMLLKGSYAGAMGHVQMIPSSLRYYAVDGDGDGRLDVFNNPMDATASIAHYLGKHGWELGGPYLIPVYGITDLSAIKSAKVKEMQPWSSWYALGVRTRGEPPPAERAMALIALEEQDGLRYYGVFNNFRVILDWNRSTRFAKVVGELAEGFVLMPTPATRASLIGLALASGLLAGPARADFQSCLAGIQAQAAGAGVSAQTFRAATANIAYDDKVIELSQAQPEFKTPIWDYMSALVDEERVEDGRAAMRQHAQALANAEARYGVDRHTIAAVWGVESNFGKNLGKMPLVQSLATLACSSNRRRDFFRSELIATLKIIERGDIEASRLTGSWAGAFGQTQFMPTTYQRLAVDGDGDGRRDVVDSVADAVASTANFLRVAKWSNGQPWGYEVRLPRGFNVAAAGRKNKHAVGHWASLGVTRVDGKALTGDGPAGIIAPAGINGPAFLVTKNFDAIYSYNAAESYGLAIAVLSDRLRGRPGVQADWPTDDPPLSRAERRDLQTRLTARGYDVGEPDGKVGSKTREAIKEIERQLGMPATGRPGGKVLEALRRGMFKYSFIAVIVSTVLLSACADSHQKSAEKKPVTSEIANIATSAPARWKQIDVVSLEQAFPKQSRTPAQFPAYVDALKQKAAELGYKPETINFAFSEIHFIDRVVKSDRNQPEKKITLDVYLPRVVTKGRIAEGAKLYQANQQTLAQISNQYGVPANYIVALWGLESGFGRVQGKEDVISALATLAFEGRREALFSRQLMAALEIIENGHLPVGQRLKGSWAGAMGQTQFMPSSFLTYAADGNGDGNIDIWNSREDAFASAANYLATEGWQRDLPWGEQVSLPANFNQQLEGIKTEQQKTVAQWKALGVQLPANSQLSDDMKVWLIIPDDDLHRSYLVTQNFRTIMHWNSSYFFALSIVTMADGVANKINTLPTQHMKKESRPAFDAAAVFDAAAVPVSDSGFAANANVRRFVDDEVGKGDFSRAEWQDFFDKAAYKADIVKIMHRPSTSRPWYVFRTGNSGKAKFRGARRFYAENRALIDDVAQKYGVPAELIVAVIGIETNYGKNTGSFRVADALATLGFDYPRRAGFFQKELVELLKLAKEEGGDVFAFKGSYAGAMGMPQFMPSSYRKWAVDYDGDGHRDIWGNIGDVAASVANYMKQHGWRTGGKILVSATLAPGADVQAIIGEKTALTRTVADLKAYGIIPGEELADDEKAVLFKLETAPGVFEYYLGLNNFYTVWQYNHSRMYVTAVRDIANSLGGSGLMASSSSSKQAKPIHRMAWRLGVSLTLLLGLGALFVLPKFDPKSLTWPTTEPGRIAPLAMSGGNPYLRALMRTISASESNDASPYTVLYGGSHIENLQEHPDRCIPIRWGPNQGLCTTAAGRYQFITTTWLETAEKYHPAPTGEWMWRRYSFAPEYQDRVVYAWLDDVNYWGTDIPQLLEDGQLQTVLKRLSGTWTSLGYGIESNKVTPHLMHIYERMLAEEIALANGLPTNYLPTVANQSVETTRMIIQHSQPKRKGTKYRLKKPYKLVFNLIIVVGLIGLVYSFKKNTQPLVNPSLVTHLPELEMSGGDPYIRALMLTISASESNHKNSYYLLYGGSHVHNLQQHPDQCIPINIGPNRGNCSTAAGRYQFLNSTWQEKARKYHPNPQKNYRQYIYSFEPKYQDIVVYRWLKDHHQWNVDLLTLLKQDQVEEVLRKLSNVWTSLGGGIEDNSMTPHLPSIYRYFLAQELNRENADQNSLMVEINNQRKAFLDMLAWSEGTDNGRQKTRNHGYDVIVGGELFTDYSDHPRKLVTLNPKLKSTAAGRYQLLSRWWDAYRKQLGLKDFSPKSQDAVALQQIKERGALPMIDRGDIRQAIDRCSNIWASLPGAGYGQFEHKADSLIVKFKEAGGTVREIEVMGYTWKGLAKQYGFTDFSPATQDKAAVALILAKKGAMEAILNGDYEQAVMKLGGIWASFPTAPNEYRQHKRSWGFVHNFFRQRGFMARISAADAGGVNVIAFLDMLAWSEGTSTIKASDYGYDVLVGGKLFSEYSKHPRVKVWLPKYSIYSSAAGRYQFLAGTWDAIVKNYGFKGRFIPEAQDLAAIKLLTECGALPLIKAGRIVEAIAKAAPIWASLPGAGYGQREHKLAALLGIYEAERAAEAKPQDQLLAMFSACGGEMAAMTRYEFALLALAAVGYVVWRDWQRSEEPGAQSPDFIDQAENLFYDATEGNFFGGTEDTDMGQAQLNRAAFLLTIRTGEGTAGNDGYRMLFGGGKFDSFADHPRQVVTALSNGKPISSSAAGAYQFLRRTWDTLAARLGLTDFSPASQDAAALELIREAGALGDVDAGRFALAVRKVRKIWASMPGAGYGQPEVALERLQAAYQAAGGVVNGMPVINTHQNIAAFLDMLAYSEGTANHPLTKNRGYDVIVTSLDGRPEIFTDYSDHPFAHGRPAKVFNRRGEKSTASGRYQQLYMFWPHYKKQLALPDFSPLSQDKLAIQLIRERGAIDDIRAGRIERAVSRCRNIWASLPGAGYGQREHSLEKLVTVWRTAGGVVAMYSQQVQQINQPQKNSDIQLINMWLQQIHPIQQNSHLYIAQMFLKFIKKPLKKVTSADVIAFANVYGVRSHNSHSNQQKRIETINSLLKFGQEAGILPRNQKKTFSPNTTNFKTSVYSQNKIKNYRTTGKQQKKPLNWSQLFNLQLASSVLIVFILLMAILQLFRQVSGSTNANQNKSVTSVVMPKIDPTKNWAYPVNVPRIRAFLDTIAVTEGTTGPKGYYRQYTGSHFLSFEDHPRELKCANSNGKKLCSDAAGRYQFLSTSWDRFAPVVKAQNFSPTYQDRVAIELIRDKNALKDIEEGRVKEAFQKLYMVWPSFGETETDVEQLMPKLVGTYEQKLALYQIKNMDDEFERAFKKILDYEGGYSDEQKDHGGKTKYGITEKLARDYGHEGEMKDLELEKAKEIYYREFWANHLYSWIEDERIATEVFEQAVNMGAKTANKHLQKAYNLLADKEIAVDGIIGQRTLEAVNNFEHNSDLFKLLNILQAKKYINIVKNDASQQKFIRGWLRRVELDIDSRKSMKRNFQTVMPYIFSEEGGYADNPADPGGATNMGITINTLSAWEGRQVSPQDVKELTQATATQIYQVEFWNKIDGNDLPSGVDYALFDFAVNSGPGRAAKTLQKILAMPEDGIIGAQTVAAAAARSPEGIINALCDARAAWLRGLSTAATFGNGWLARVERVRARALALAATPPAITQPADPAGNPSPKARQADIAFTSALKHPEALGTMGSVASGLAAIATGNGPVQYALAIVMVACAGVGLWYFVRRVRSEPMNFDQAFDRLLGHEGGYSNNSADPGGETMWGVTARVARADGYLGEMRDLPRDRAKSIYRRLYWTPVRADELPEVVRFDVFDGAVNSGPAQSIKWLQRAAGAVDDGILGPRTMAAAVAAGPVLAARYNGHRLLFLADRPTWGSFGKGWARRVGKNLLGAMDQPPWLQAAWAEFGVREIPGKEDAPEILRYFRDAGDTNVETEATPWCAAFLGAMLKRAGYAGTGSLLARSYLDWGDRLDDARFGAVAVLSRGDDPNAGHVGFLLSDTNGKLYLLGGNQGDAVTVASFDKARLLGLRWPKENVEAASKGDDAIFSRVLAHVLEMEGGFSNDPYDPGGPTNRGITLEVYAKFRKETLDDGTRARLIAELKRIPDAIVTAIYRQRYFDPASCPVFTAPLALMHFDAAVNHGVGAAIRMLQGVAGVTVDGEIGPETLAAIGAKSLADLLDDYAETRRARYRALPHFWRFGRGWLKRVDATLALARTWAAAEATNRGLIEPQQIAKGEGKMGEKSKTEISSSDDSKWWLNSKTMWGTLITAAATVIPVLGPAVGIVLPADLITSFGDQVVTAAQALAGLFGTALAIYGRLKADTPLVLRKNMSAPLTFQQVFDRVVGHEGGYVNDPHDPGGETNWGITKYTARENGYTGSMKAMTREQAYKIYEKAFWQRYHCEKLPEAVAFQFFDAAVNHGVGNASRMLQRAVNVADDGIIGKVTLSAVEKMPISDLLLRFNAERIRFYTKLKNFPRYGKGWMNRIAGNLAYAAIDNEVMNPIIDGIIALEGGYVFNPKDKGGATHWGITEATARAHGYAGDMRDLTHAEAYAILEEDYWIKPGFDVISTLSWPVSFELCDAAVNIGAYHPSAWLQRWLNVFNHEGKRYPDIHVDGNIGPRTLAALEHYLAWRGQEGEAVLVKALNCSQGTYYLNVAEKNHNNEQFIYGWIKNRVTMDSFEDAFKALIGNEGGYSFNPADPGGETMWGVTARVARSEGYNGAMKDLPLETAHQIAKRRYWDPLHLDELDPRVAFQIFDANYNGGLVVLWMQKASGAKEDGKFGPDTLDAVKNADPMKFVMRFAAYRLRYLRNLHSWPSFSRGWTERMAANLLLGAAMSQTATLSDFNKAFDRVIQHEGGYVNDPRDAGGETKFGITIHTARANGYTGSMFTMTRDDAKQIYLKAFWQRYRCNEFPPELAFQFFDACVNHGSGNASRMLQRAVGVVDDGIIGEITLAAIRKRSTVEVVTLFNAERLEFYTKLSGFQHFGKGWIRRMAGNLRHIADDVGDK']
Target names: '18', '19', '22', '23', '24', '25', '73', '102', '103', '104', '108'

In [ ]:
sequence_data


Out[ ]:
{'DESCR': 'Sequences',
 'data': ['MRKFNKPLLALLIGSTLCSAAQAAAPGKPTIAWGNTKFAIVEVDQAATAYNNLVKVKNAADVSVSWNLWNGDAGTTAKILLNGKEAWSGPSTGSSGTANFKVNKGGRYQMQVALCNADGCTASDATEIVVADTDGSHLAPLKEPLLEKNKPYKQNSGKVVGSYFVEWGVYGRNFTVDKIPAQNLTHLLYGFIPICGGNGINDSLKEIEGSFQALQRSCQGREDFKVSIHDPFAALQKAQKGVTAWDDPYKGNFGQLMALKQAHPDLKILPSIGGWTLSDPFFFMGDKVKRDRFVGSVKEFLQTWKFFDGVDIDWEFPGGKGANPNLGSPQDGETYVLLMKELRAMLDQLSAETGRKYELTSAISAGKDKIDKVAYNVAQNSMDHIFLMSYDFYGPFDLKNLGHQTALNAPAWKPDTAYTTVNGVNALLAQGVKPGKVVVGTAMYGRGWTGVNGYQNNIPFTGTATGPVKGTWKNGIVDYRQIAGQFMSGEWQYTYDATAEAPYVFKPSTGDLITFDDARSVQAKGKYVLDKQLGGLFSWEIDADNGDILNSMNASLGNSAGVQ',
  'MSTRKAVIGYYFIPTNQINNYTETDTSVVPFPVSNITPAKAKQLTHINFSFLDINSNLECAWDPATNDAKARDVVNRLTALKAHNPSLRIMFSIGGWYYSNDLGVSHANYVNAVKTPAARTKFAQSCVRIMKDYGFDGVDIDWEYPQAAEVDGFIAALQEIRTLLNQQTIADGRQALPYQLTIAGAGGAFFLSRYYSKLAQIVAPLDYINLMTYDLAGPWEKITNHQAALFGDAAGPTFYNALREANLGWSWEELTRAFPSPFSLTVDAAVQQHLMMEGVPSAKIVMGVPFYGRAFKGVSGGNGGQYSSHSTPGEDPYPNADYWLVGCDECVRDKDPRIASYRQLEQMLQGNYGYQRLWNDKTKTPYLYHAQNGLFVTYDDAESFKYKAKYIKQQQLGGVMFWHLGQDNRNGDLLAALDRYFNAADYDDSQLDMGTGLRYTGVGPGNLPIMTAPAYVPGTTYAQGALVSYQGYVWQTKWGYITSAPGSDSAWLKVGRLA',
  'MLSFVKKSIALVAALQAVTALATPISSEAGVEKRGSGFANAVYFTNWGIYGRNFQPADLPASEITHVLYSFMNVRADGTIFSGDTYADYEKHYAGDSWNDVGTNAYGCVKQLYLLKKQNRNMKVMLSIGGWTWSTNFPAAASSAATRKTFAQSAVGFMKDWGFDGIDIDWEYPADATQAQNMVLLLQAVRSELDSYAAQYAKGHHFLLSIAAPAGPDNYNKLKFAELGKVLDYINLMAYDYAGSWSNYTGHDANIYANPQNPNATPYNTDDAVQAYINGGVPANKIVLGMPIYGRSFQQTEGIGKPYNGIGSGSWENGIWDYKALPKAGATVKCDDTAKGCYSYDPSTKELISFDTPAMISTKVSWLKGKGLGGTMFWEASASKKGSDSLISTSHQGLGSQDSTQNYLDYPNSKYDNIKKGMN',
  'MILNLIILLAISIVASASNIAAYWGQNAGGDQQTLGDYCSSSPASIIILSFLDGFPNLSLNFANQCSGTFSSGLAHCSQIGSDIKSCQQQGKTILLSLGGATGNYGFSSDSEAVQFAGTLWNKFGGGKDSERPFDDAIVDGFDFDIENKDQTGYAALATQLRKYFSTGTKSYYLSAAPQCPYPDESVGDLMSQVDLDFAFIQFYNNYCSLNQQFNWNSWSNYARGKSIKLYLGLPGSSSSAGSGFVGLSTVQRVVASIKGDSSFGGISIWDISSAENGGYLNQLYQALSGSGSPAAPSNSYQPNTPLTRTYGGSTATASAYISVGFTAGATHGSTTTNDLLAWIDSLFGSSQSSVQQYATPVQSVTATPQPVAATTTSAPKPTASAFNWFGWFDGTTTSTTLQTVYSTVPADQTVYVTLTTTVGSQMLQSLFDKRDVIAEAKSTNLQICWLLFIPLLALICS',
  'MAKRTQAILLLLLAISLIMSSSHVDGGGIAIYWGQNGNEGTLTQTCSTRKYSYVNIAFLNKFGNGQTPQINLAGHCNPAAGGCTIVSNGIRSCQIQGIKVMLSLGGGIGSYTLASQADAKNVADYLWNNFLGGKSSSRPLGDAVLDGIDFDIEHGSTLYWDDLARYLSAYSKQGKKVYLTAAPQCPFPDRYLGTALNTGLFDYVWVQFYNNPPCQYSSGNINNIINSWNRWTTSINAGKIFLGLPAAPEAAGSGYVPPDVLISRILPEIKKSPKYGGVMLWSKFYDDKNGYSSSILDSVLFLHSEECMTVL',
  'MTKLILLTGLVLILNLQLGSAYQLTCYFTNWAQYRPGLGRFMPDNIDPCLCTHLIYAFAGRQNNEITTIEWNDVTLYQAFNGLKNKNSQLKTLLAIGGWNFGTAPFTAMVSTPENRQTFITSVIKFLRQYEFDGLDFDWEYPGSRGSPPQDKHLFTVLVQEMREAFEQEAKQINKPRLMVTAAVAAGISNIQSGYEIPQLSQYLDYIHVMTYDLHGSWEGYTGENSPLYKYPTDTGSNAYLNVDYVMNYWKDNGAPAEKLIVGFPTYGHNFILSNPSNTGIGAPTSGAGPAGPYAKESGIWAYYEICTFLKNGATQGWDAPQEVPYAYQGNVWVGYDNIKSFDIKAQWLKHNKFGGAMVWAIDLDDFTGTFCNQGKFPLISTLKKALGLQSASCTAPAQPIEPITAAPSGSGNGSGSSSSGGSSGGSGFCAVRANGLYPVANNRNAFWHCVNGVTYQQNCQAGLVFDTSCDCCNWA',
  'MKKFINQFSASLKNNILVFLAFPFVWTSCARDNPLSSENSNISPNAAARAAVTGTTKANIKLFSFTEVNDTNPLNNLNFTLKNSGKPLVDMVVLFSANINYDAANDKVFVSNNPNVQHLLTNRAKYLKPLQDKGIKVILSILGNHDRSGIANLSTARAKAFAQELKNTCDLYNLDGVFFDDEYSAYQTPPPSGFVTPSNNAAARLAYETKQAMPNKLVTVYVYSRTSSFPTAVDGVNAGSYVDYAIHDYGGSYDLATNYPGLAKSGMVMSSQEFNQGRYATAQALRNIVTKGYGGHMIFAMDPNRSNFTSGQLPALKLIAKELYGDELVYSNTPYSKDW',
  'MKLNIFTKSMIGMGLVCSALPALAMEAWNNQQGGNKYQVIFDGKIYENAWWVSSTNCPGKAKANDATNPWRLKRTATAAEISQFGNTLSCEKSGSSSSSNSNTPASNTPANGGSATPAQGTVPSNSSVVAWNKQQGGQTWYVVFNGAVYKNAWWVASSNCPGDAKSNDASNPWRYVRAATATEISETSNPQSCTSAPQPSPDVKPAPDVKPAPDVQPAPADKSNDNYAVVAWKGQEGSSTWYVIYNGGIYKNAWWVGAANCPGDAKENDASNPWRYVRAATATEISQYGNPGSCSVKPDNNGGAVTPVDPTPETPVTPTPDNSEPSTPADSVNDYSLQAWSGQEGSEIYHVIFNGNVYKNAWWVGSKDCPRGTSAENSNNPWRLERTATAAELSQYGNPTTCEIDNGGVIVADGFQASKAYSADSIVDYNDAHYKTSVDQDAWGFVPGGDNPWKKYEPAKAWSASTVYVKGDRVVVDGQAYEALFWTQSDNPALVANQNATGSNSRPWKPLGKAQSYSNEELNNAPQFNPETLYASDTLIRFNGVNYISQSKVQKVSPSDSNPWRVFVDWTGTKERVGTPKKAWPKHVYAPYVDFTLNTIPDLAALAKNHNVNHFTLAFVVSKDANTCLPTWGTAYGMQNYAQYSKIKALREAGGDVMLSIGGANNAPLAASCKNVDDLMQHYYDIVDNLNLKVLDFDIEGTWVADQASIERRNLAVKKVQDKWKSEGKDIAIWYTLPILPTGLTPEGMNVLSDAKAKGVELAGVNVMTMDYGNAICQSANTEGQNIHGKCATSAIANLHSQLKGLHPNKSDAEIDAMMGTTPMVGVNDVQGEVFYLSDARLVMQDAQKRNLGMVGIWSIARDLPGGTNLSPEFHGLTKEQAPKYAFSEIFAPFTKQ',
  'MSTPRAAASLAKKAALVALAVLAAALATAARAEQCGAQAGGARCPNCLCCSRWGWCGTTSDFCGDGCQSQCSGCGPTPTPTPPSPSDGVGSIVPRDLFERLLLHRNDGACPARGFYTYEAFLAAAAAFPAFGGTGNTETRKREVAAFLGQTSHETTGGWPTAPDGPFSWGYCFKQEQNPPSDYCQPSPEWPCAPGRKYYGRGPIQLSFNFNYGPAGRAIGVDLLSNPDLVATDATVSFKTALWFWMTPQGNKPSSHDVITGRWAPSPADAAAGRAPGYGVITNIVNGGLECGHGPDDRVANRIGFYQRYCGAFGIGTGGNLDCYNQRPFNSGSSVGLAEQ',
  'MPPQKENHRTLNKMKTNLFLFLIFSLLLSLSSAEQCGRQAGGALCPNGLCCSEFGWCGNTEPYCKQPGCQSQCTPGGTPPGPTGDLSGIISSSQFDDMLKHRNDAACPARGFYTYNAFITAAKSFPGFGTTGDTATRKKEVAAFFGQTSHETTGGWATAPDGPYSWGYCFKQEQNPASDYCEPSATWPCASGKRYYGRGPMQLSWNYNYGLCGRAIGVDLLNNPDLVANDAVIAFKAAIWFWMTAQPPKPSCHAVIAGQWQPSDADRAAGRLPGYGVITNIINGGLECGRGQDGRVADRIGFYQRYCNIFGVNPGGNLDCYNQRSFVNGLLEAAI',
  'MRLCKFTALSSLLFSLLLLSASAEQCGSQAGGARCPSGLCCSKFGWCGNTNDYCGPGNCQSQCPGGPTPTPPTPPGGGDLGSIISSSMFDQMLKHRNDNACQGKGFYSYNAFINAARSFPGFGTSGDTTARKREIAAFFAQTSHETTGGWATAPDGPYAWGYCWLREQGSPGDYCTPSGQWPCAPGRKYFGRGPIQISHNYNYGPCGRAIGVDLLNNPDLVATDPVISFKSALWFWMTPQSPKPSCHDVIIGRWQPSAGDRAANRLPGFGVITNIINGGLECGRGTDSRVQDRIGFYRRYCSILGVSPGDNLDCGNQRSFGNGLLVDTM',
  'MRSLAVVVAVVATVAMAIGTARGSVSSIVSRAQFDRMLLHRNDGACQAKGFYTYDAFVAAAAAFPGFGTTGSADAQKREVAAFLAQTSHETTGGWATAPDGAFAWGYCFKQERGASSDYCTPSAQWPCAPGKRYYGRGPIQLSHNYNYGPAGRAIGVDLLANPDLVATDATVGFKTAIWFWMTAQPPKPSSHAVIAGQWSPSGADRAAGRVPGFGVITNIINGGIECGHGQDSRVADRIGFYKRYCDILGVGYGNNLDCYSQRPFA',
  'MGAFALFAVLAMAVTMAVAEQCGSQAGGATCPNCLCCSRFGWCGSTSDYCGDGCQSQCAGCGGGGTPVTPTPTPSGGGGVSSIVSRALFDRMLLHRNDGACQAKGFYTYDAFVAAAGAFPGFGTTGSTDTRKREVAAFLAQTSHETTGGWATAPDGAFAWGYCFKQERGATSNYCTPSAQWPCAPGKSYYGRGPIQLSHNYNYGPAGRAIGVDLLRNPDLVATDPTVSFKTAMWFWMTAQAPKPSSHAVITGQWSPSGTDRAAGRVPGFGVITNIVNGGIECGHGQDSRVADRIGFYKRYCDILRVGYGNNLDCYNQRPFA',
  'MRLSEFTTLFLLFSVLLLSASAEQCGSQAGGALCASGLCCSKFGWCGNTNEYCGPGNCQSQCPGGPGPSGDLGGVISNSMFDQMLNHRNDNACQGKNNFYSYNAFVTAAGSFPGFGTTGDITARKREIAAFLAQTSHETTGGWPTAPDGPYAWGYCFLREQGSPGDYCTPSSQWPCAPGRKYFGRGPIQISHNYNYGPCGRAIGVDLLNNPDLVATDPVISFKSAIWFWMTPQSPKPSCHDVITGRWQPSGADQAANRVPGFGVITNIINGGLECGHGSDSRVQDRIGFYRRYCGILGVSPGENLDCGNQRSFGNGLLVDIM',
  'QNCQCDTTIYCCSQHGYCGNSYDYCGPGCQAGPCWDPCEGDGTLTVSDIVTQEFWDGIASQAAANCPGKSFYTRSNFLEAVSAYPGFGTKCTDEDRKREIAAYFAHVTHETGHLCYIEERDGHANNYCQESQQYPCNPNKEYFGRGPMQLSWNYNYIDAGKELHFDGLNDPDIVGRDPIISFKTSLWFWIRKGVQYVILDPNQGFGATIRIINGGQECDGHNTAQMMARVGYYQEYCAQLGVSPGNNLPC',
  'MKKNRMMMMIWSVGVVWMLLLVGGSYGEQCGRQAGGALCPGGNCCSQFGWCGSTTDYCGPGCQSQCGGPSPAPTDLSALISRSTFDQMLKHRNDGACPAKGFYTYDAFIAAAKAYPSFGNTGDTATRKREIAAFLGQTSHETTGGWATAPDGPYAWGYCFVRERNPSTYCSATPQFPCAPGQQYYGRGPIQISWNYNYGQCGRAIGVDLLNKPDLVATDSVISFKSALWFWMTAQSPKPSSHDVITSRWTPSSADVAARRLPGYGTVTNIINGGLECGRGQDSRVQDRIGFFKRYCDLLGVGYGNNLDCYSQTPFGNSLLLSDLVTSQ',
  'MRSLLILVLCFLPLAALGKVFGRCELAAAMKRHGLDNYRGYSLGNWVCAAKFESNFNTQATNRNTDGSTDYGILQINSRWWCNDGRTPGSRNLCNIPCSALLSSDITASVNCAKKIVSDGNGMNAWVAWRNRCKGTDVQAWIRGCRL',
  'MKALIVLGLVLLSVTVQGKVFERCELARTLKRLGMDGYRGISLANWMCLAKWESGYNTRATNYNAGDRSTDYGIFQINSRYWCNDGKTPGAVNACHLSCSALLQDNIADAVACAKRVVRDPQGIRAWVAWRNRCQNRDVRQYVQGCGV',
  'MKAFIVLVALACAAPAFGRTMDRCSLAREMSNLGVPRDQLNKWACIAEHESSYRTGVVGPENYNGSNDYGIFQINDYYWCAPPSGRFSYNECGLSCNALLTDDITHSVRCAQKVLSQQGWSAWSTWHYCSGWLPSIDDCF',
  'KIFSKCELARKLKSMGMDGFHGYSLANWVCMAEYESNFNTQAFNGRNSNGSSDYGIFQLNSKWWCKSNSHSSANACNIMCSKFLDDNIDDDIACAKRVVKDPNGMSAWVAWVKHCKGKDLSKYLASCNL',
  'MTKYVILLAVLAFALHCDAKRFTRCGLVQELRRLGFDETLMSNWVCLVENESGRFTDKIGKVNKNGSRDYGLFQINDKYWCSKGTTPGKDCNVTCNQLLTDDISVAATCAKKIYKRHKFDAWYGWKNHCQHGLPDISDC',
  'KVYDRCEFARILKKSGMDGYRGVSLANWVCLAKWESDFNTKAINRNVGSTDYGIFQINSRYWCNDGKTPKAVNACHISCKVLLDDDLSQDIECAKRVVRDPQGIKAWVAWRTHCQNKDVSQYIRGCKL',
  'MKAVIILGLVLLSVTVQGKIFERCELARTLKRLGLDGYRGISLANWVCLAKWESDYNTQATNYNPGDQSTDYGIFQINSHYWCNNGKTPGAVNACRISCNALLQDNIADAVTCAKRVVRDPQGIRAWVAWRNHCQNRDVSQYVQGCGV',
  'KIYEQCEAAREMKRLGLDGYDGYSLGDWVCTAKHESNFNTGATNYNRGDQSTDYGIFQINSRWWCNDGKTPNAKNACGIECSELLKADITAAVICAKRVVRDPNGMGAWVAWTKYCKGKDVSQWIKGCKL',
  'MSALWLLLGLLALMDLSESSNWGCYGNIQSLDTPGASCGIGRRHGLNYCGVRASERLAEIDMPYLLKYQPMMQTIGQKYCMDPAVIAGVLSRKSPGDKILVNMGDRTSMVQDPGSQAPTSWISESQVSQTTEVLTTRIKEIQRRFPTWTPDQYLRGGLCAYSGGAGYVRSSQDLSCDFCNDVLARAKYLKRHGF',
  'RTDCYGNVNRIDTTGASCKTAKPEGLSYCGVSASKKIAERDLQAMDRYKTIIKKVGEKLCVEPAVIAGIISRESHAGKVLKNGWGDRGNGFGLMQVDKRSHKPQGTWNGEVHITQGTTILINFIKTIQKKFPSWTKDQQLKGGISAYNAGAGNVRSYARMDIGTTHDDYANDVVARAQYYKQHGY',
  'MVPSVVFWGLIALVGTAKGSYTHSVHSMNPHVHPRLYHGCYGDIMTMETFGAPCDINNLMNCGIHGSEMFAEMDLKAIKPYRILIKEVGQRHCIDPALIAAIISRESHGGAVLQNGWDHKGQRFGLMQLDKNMYHPIGSWDSKEHLLQSVGILTERIKAMKRKFPTWNTAQQLKGGLTAFKSGMETIVTPADIDGDLVDDVLARAKFYKRHGF',
  'MGYGNIMNVETTGASWQTAQQDKLGYSGVRASHTMANTDSGRMERYRSKINSVGAKYGIDPALIAAIISEESRAGNVLHDGWGDYDSNRGAYNAWGLMQVDVNPNGGGHTARGAWDSEEHLSQGAEILVYFIGRIRNKFPGWNTEQQLKGGIAAYNMGDGNVHSYDNVDGRTTGGDYSNDVVARAQWYKTQKGF',
  'MPYGKIEDIKTSGASDVTAAQDGLKEGGWKSSHRMAEIDSNRMENYRTIINEAGRQCDVDPAVIAGIISRESRAGNQLINGWGDHGKAFGLMQIDVTPPPNGGGHTPVGTWDSLEHLIQATEILVEFIERIKTKFPRWNADQHLKGALAAYNKGEKNVESYASVDAKTTGKDYSNDVVARAQWYKSNMGF',
  'MKCLVALFLSLSLVACQYDDYDTERKNNNMLSSMNILDLLDSFGLNIKARIAHVRRVAGRIRLTLDIGLGNGDVERESEEAEGEGTDGRGGGEGEREGWGGEREGGEGEREGGEGEREGREGEREGKSSESNESPEDFIGPPVDMCAGESRRGSPSIGCIAAECCQHSFYINSLCPGSSVCCFSMDVCDRLPVPVIPPFPTDPGTLPPPPPIPDSQTTVSPNQPSSYMCHGDFMKLMPKGADQRTARQDNLAYAGVRASNKLVDNDLAELNKRKDCYVQAGKNHCIHPAVIAAIASRETRGGKLLYSTNGYGDGGRAYGIMQCDGGASGLGDICKKYPWDSCEHINQLTDIILLNYVNQMKTKHPSWPAHYQLKGGVSAYNAGVGNVQTIAGMDAGTTNDDYSNDVIARAQRLVNAHGW',
  'MLGKNDPMCLVLVLLGLTALLGICQGGTGCYGSVSRIDTTGASCRTAKPEGLSYCGVRASRTIAERDLGSMNKYKVLIKRVGEALCIEPAVIAGIISRESHAGKILKNGWGDRGNGFGLMQVDKRYHKIEGTWNGEAHIRQGTRILIDMVKKIQRKFPRWTRDQQLKGGISAYNAGVGNVRSYERMDIGTLHDDYSNDVVARAQYFKQHGY',
  'MHLMLVLLGLAALLGTSQSRTGCYGDVNRVDTTGASCKSAKPEKLNYCGVAASRKIAERDLQSMDRYKALIKKVGQKLCVDPAVIAGIISRESHAGKALRNGWGDNGNGFGLMQVDRRSHKPVGEWNGERHLMQGTEILISMIKAIQKKFPRWTKEQQLKGGISAYNAGPGNVRSYERMDIGTTHDDYANDVVARAQYYKQHGY',
  'MNIFEMLRIDEGLRLKIYKDTEGYYTIGIGHLLTKSPSLNAAKSELDKAIGRNCNGVITKDEAEKLFNQDVDAAVRGILRNAKLKPVYDSLDAVRRCALINMVFQMGETGVAGFTNSLRMLQQKRWDEAAVNLAKSRWYNQTPNRAKRVITTFRTGTWDAYKNL',
  'MEMISNNLNWFVGVVEDRMDPLKLGRVRVRVVGLHPPQRAQGDVMGIPTEKLPWMSVIQPITSAAMSGIGGSVTGPVEGTRVYGHFLDKWKTNGIVLGTYGGIVREKPNRLEGFSDPTGQYPRRLGNDTNVLNQGGEVGYDSSSNVIQDSNLDTAINPDDRPLSEIPTDDNPNMSMAEMLRRDEGLRLKVYWDTEGYPTIGIGHLIMKQPVRDMAQINKVLSKQVGREITGNPGSITMEEATTLFERDLADMQRDIKSHSKVGPVWQAVNRSRQMALENMAFQMGVGGVAKFNTMLTAMLAGDWEKAYKAGRDSLWYQQTKGRASRVTMIILTGNLESYGVEVKTPARSLSAMAATVAKSSDPADPPIPNDSRILFKEPVSSYKGEYPYVHTMETESGHIQEFDDTPGQERYRLVHPTGTYEEVSPSGRRTRKTVDNLYDITNADGNFLVAGDKKTNVGGSEIYYNMDNRLHQIDGSNTIFVRGDETKTVEGNGTILVKGNVTIIVEGNADITVKGDATTLVEGNQTNTVNGNLSWKVAGTVDWDVGGDWTEKMASMSSISSGQYTIDGSRIDIG',
  'MPPSLRKAVAAAIGGGAIAIASVLITGPSGNDGLEGVSYIPYKDIVGVWTVCHGHTGKDIMLGKTYTKAECKALLNKDLATVARQINPYIKVDIPETTRGALYSFVYNVGAGNFRTSTLLRKINQGDIKGACDQLRRWTYAGGKQWKGLMTRREIEREVCLWGQQ',
  'MVEINNQRKAFLDMLAWSEGTDNGRQKTRNHGYDVIVGGELFTDYSDHPRKLVTLNPKLKSTGAGRYQLLSRWWDAYRKQLGLKDFSPKSQDAVALQQIKERGALPMIDRGDIRQAIDRCSNIWASLPGAGYGQFEHKADSLIAKFKEAGGTVREIDV',
  'MKGKTAAGGGAICAIAVMITIVMGNGNVRTNQAGLELIGNAEGCRRDPYMCPAGVWTDGIGNTHGVTPGVRKTDQQIAADWEKNILIAERCINQHFRGKDMPDNAFSAMTSAAFNMGCNSLRTYYSKARGMRVETSIHKWAQKGEWVNMCNHLPDFVNSNGVPLRGLKIRREKERQLCLTGLVNE',
  'MMQISSNGITRLKREEGERLKAYSDSRGIPTIGVGHTGKVDGNSVASGMTITAEKSSELLKEDLQWVEDAISSLVRVPLNQNQYDALCSLIFNIGKSAFAGSTVLRQLNLKNYQAAADAFLLWKKAGKDPDILLPRRRRERALFLS',
  'MQISQAGINLIKSFEGLQLKAYKAVPTEKHYTIGYGHYGSDVSPRQVITAKQAEDMLRDDVQAFVDGVNKALKVSVTQNQFDALVSFAYNVGLGAFRSSSLLEYLNEGRTALAAAEFPKWNKSGGKVYQGLINRRAQEQALFNSGTPKNVSRGTSSTKTTPKYKVKSGDNLTKIAKKHNTTVATLLKLNPSIKDPNMIRVGQTINVTGSGGKTHKVKSGDTLSKIAVDNKTTVSRLMSLNPEITNPNHIKVGQTIRLS',
  'MKVSQNGLNLIKEFEGCRLTAYKPVPWEQMYTIGWGHYGVTAGTTWTQAQADSQLEIDINNKYAPMVDAYVKGKANQNEFDALVSLAYNCGNVFVADGWAPFSHAYCASMIPKYRNAGGQVLQGLVRRRQAELNLFNKPVSSNSNQNNQTGGMIKMYLIIGLDNSGKAKHWYVSDGVSVRHVRTIRMLENYQNKWAKLNLPVDTMFIAEIEAEFGRKIDMASGEVK',
  'MVKKNDLFVDVSSHNGYDITGILEQMGTTNTIIKISESTTYLNPCLSAQVEQSNPIGFYHFARFGGDVAEAEREAQFFLDNVPMQVKYLVLDYEDDPSGDAQANTNACLRFMQMIADAGYKPIYYSYKPFTHDNVDYQQILAQFPNSLWIAGYGLNDGTANFEYFPSMDGIRWWQYSSNPFDKNIVLLDDEEDDKPKTAGTWKQDSKGWWFRRNNGSFPYNKWEKIGGVWYYFDSKGYCLTSEWLKDNEKWYYLKDNGAMATGWVLVGSEWYYMDDSGAMVTGWVKYKNNWYYMTNERGNMVSNEFIKSGKGWYFMNTNGELADNPSFTKEPDGLITVA',
  'TVQGFDISSYQPSVNFAGAYSAGARFVIIKATEGTSYTNPSFSSQYNGATTATGNYFIRGGYHFAHPGETTGAAQADYFIAHGGGWSGDGITLPGMLDLESEGSNPACWGLSAASMVAWIKAFSDRYHAVTGRYPMLYTNPSWWSSCTGNSNAFVNTNPLVLANRYASAPGTIPGGWPYQTIWQNSDAYAYGGSNNFINGSIDNLKKLATG',
  'MKGIDIYSGQGSVDFNAVKESGVEVVYIKATEGLTYTDSTYKDFYDGAKNAGLKIGFYHYLRANDPTSEAEHFFNTISGLSLDCKCAIDVEVTLGQSIDQISSNVRKFADYLINKGLDVCVYTYTNFYKDNLNSTVKDLPLWIAEYGVSKPNIDASYVGFQYSDSGSVNGISGSADLDEFSEGILVGGTVVIDPGQGGDDNIKAIQQDLNILLKRGLEVDGIEGPETEAAIKDFQSIMGLTVDGIWGTNTSGAAQQIFSRPLDGVAYPHYEYATRYIQYRVGASVDGTFGSGTKAKVAAWQSNQGLMADGVVGSATWSKLLDEN',
  'KLGIDVSQPTSTSSFTCLRNKGFTTMVIVRAWKSTGSFDTNAPQTLKNANAAGFSIENSDVYYYPCISCGNMAGQVRTFWQKVGQYSLKVKRVWFDIEGTWTSSVSTNQNYLMQMMNEARAIGIVHGIYGSKYYWGNLFGSSYKYRYRSSTPLWYPHYDNSPSFSDFSSFGGWTSPSMKQYRGDVSVCSAGVDYNYKP',
  'MPAYSSLARRGRRPAVVLLGGLVSASLALTLAPTAAAAPLAPPPGKDVGPGEAYMGVGTRIEQGLGAGPDERTIGPADTSGVQGIDVSHWQGSINWSSVKSAGMSFAYIKATEGTNYKDDRFSANYTNAYNAGIIRGAYHFARPNASSGTAQADYFASNGGGWSRDNRTLPGVLDIEHNPSGAMCYGLSTTQMRTWINDFHARYKARTTRDVVIYTTASWWNTCTGSWNGMAAKSPFWVAHWGVSAPTVPSGFPTWTFWQYSATGRVGGVSGDVDRNKFNGSAARLLALANNTA',
  'MTKTYGVDVAVYQPIDLAAYHKAGASFAIVKLTEGVDYVNRRGPSRWTAPGLTTSTLMPTISRSFGSSVSRAKKEAAYFLKEAKKQDISKKRMLWLDWEAGSGNVVTGSKSSNTAAILDFMDAIKAAGWRPGLYSGASLMRTAIDTKQVVKKYGTCLWVASYPTMAAVSTADFGYFRQWTGSPSGSLPVTAWPGRRRERCSG',
  'MQLRITSRKKLTSLLCALGLISIVAIYPRQTVNFFYSTAVQITDYIHFYGYRPVKSFAIRIPASYTIHGIDVSRWQERIDWQRVAKMRDNGIRLQFAFIKATEGEKLVDPYFSRNWQLSRENGLLRGAYHYFSPSVSASVQARLFLQTVDFSQGDFPAVLDVEERGKLSAKELRKRVSQWLKMVEKSTGKKPIIYSGAVFYHTNLAGYFNEYPWWVAHYYQRRPDNDGMAWRFWQHSDRGQVDGINGPVDFNVFNGTVEELQAFVDGIKETP',
  'MRFIALLISFFALLKVISAISGVDISSASTIESFTCLKSAGYDFAIIRAYESLGQVDPNGPHSVYNARDAGIEYVDVYMFPCPTCGNGAGQAETMVNYLKGYNANYGMVWLDIEGPQYWMSQSENVAFFESLVAGLKAEGAHIGVYTSASQWEPIMGGYTGGSEFPLWYAHYDGNPSFSDFSPFNGWSTPSVKQYDDTGDSCGLGFDLNWYP',
  'MHCAPSWKSSDERRTMLDQINTLDPNSLTALKRMSKDNSPAAIKGAAQQFEALFLQNMLKSMRDATVTSDAMGSETTRFYQGLYDQQLAAMMAQRGGIGLADVMEKQMGAQAASAQNAAAAGASSAGNVPLSLDAARAAAAHTASGDKVPTTPQAFVDATWPQAAKAAQSLGVPAHFLVAQAALETGWGKSQIRNKDGTPSYNLFNIKAGSNWTGKVVEARTVEYENGQRKVRVERFRAYDSYEQAFQDYADLVGNSPRYAKVAGKTDGHAFARALQEGGYATDPSYADKLARVINGNALRQRLMASAASARG',
  'MINKKWMKIVMIPMLVVPMYGLTSVSGQIQDSLTGENSFVKDAEAATTASQQAFIDKIAPAAQASQEQYHLLSSITLAQAILESGWGKSGLATKGYNLFGIKGKYNGQSVIMSTSEYVNGQWIKIDAEFRKYPSWNESVTDHTLLLVNGTSWNKNLYKKVVDATDYKVAAMELQKAGYASPTYGASLIQVIENYDLAKYDVLYDKILTQKSTSGKATVTSPTGNGVWTLPYKVKGVQSVSPASTYANKDIDLVSVATTKRGTYYQFKYNGKVVGWVDAKALTIYDSVNYDKVNVGRAKITSPVSNGIWSKPYNVYGREFVTNATTYAQQEIKLLREAQTAKGTYYQFSINNKTIGWIDKRALTIYPYDSIVSSKNVSLDGQITNPTGNGIWTKAYKLEGTTSVAQATKYANKDVKISQQVETQHGTYYNISIDGKAIGWLDKNAITLYDQAEYNKTVAFDAAIRNVQGNAVWTEPYRTVGTKLIGPAETYLNKEVEVVREAKTPKGTYYQFKSGGKVIGWLDKKAFEVYDNINYNKAVNLDAVVENVTGNAVWTAPYKSKGVKLVTSAATYKGKATKITREAQTSRGTYYEFSVNGKVIGWLDKKAFDVYDSIEYNKAINMTGLLSNAPGNGIWTEPYRVLDTKNIGQATAYANKTVQLVREAKTSHSTYYQMSLNGKVIGWIDKRAFTNVK',
  'MVNTQVKRVKKQKFIAGTALLLGMATFGMVGKADDLSSSNTNGGVDNSKVDNDNQESVKTSTEGVSSTTENANTVPESKVTSTVDSESAPSKTISAGTQSNISGTSDGSDSLPKTETSDSSSKPSTSNSSSKPSTSNSSSKPSTSNSSSNNNSATKPSTTTQAPPVAPSTTAPSATPSTTAPSNYYQNSSYNQTSTAAQIPNSSSDSAASVYSGPVLKKIEAAKPIEKIDSSSTEAFIKSIADRVRILAGKNNLYASIILAQAILESGSGQSNMTQQYFNIFNITGAYLGKSISFKTEEFSGNNPYYIEQSFRVYSNYDQALDDYINLMIKGTTWNSEIYAGAWKSHAKTYQEAAQALQGIFATDPEYAQKLIEIIEEYNLNFYDNVDSTTQVLDSNIPESPLVASKLDSSTYPDYNGVEYPGADSYAFGNCTQYVYNRIIQLGGQIGTHMGNGGEWGINAQAQGYFTTTVPTEGYAVSFPPGVAGSSPEYGHVAFVEKVYPDNSILVSEMNVKGNNIVSERHISAGVAALATYIQPK',
  'MNRNRLSCLIVGAVIGAGAIVCTTNTKVHAKPVNEVKNINTSKGNSFGEIISSEDIGLRKGADSSHEIITSIPSGARVNIIDKMSKDWYKVSYKDFTGYLQAKDIRVLGDELNQDNVGLISANQLNVRTSPNENGQVIGTLHKNDKVNVLDKSIDGWYKIDFNGRRAYVSSKYVNLISYKNNEVKTEVKKEPIEGTGKVNINTALNVRQASTTNSRIIGSLKGGEKVNIISESNGFYKIEFNNSYGYVYSKYISKDGDSEKVQVVKQEEVKKEKVDESKKEAKATPKAEPVVLAVRSLNKTGIVNVSSSLNVREGAGTSSKVIGSLSGNTKVTIVGEEGAFYKIEYKGSHGYVAKEYVKDVTESSNSNQGTQTPEKPSTPESTEKTGIVNVSSSLNVREGASTSSKVIGSLSGNTKVIIVGEEGAFYKIEYKGSHGYVAKEYIKDVTESNNSNQGTQTPEKPSTPESTEKTGIVNVSSSLNVREGASTSSKVIGSLSGNTKVTIVGEEGAFYKIEYKGSHGYVAKEYIKDIKDEVVTEPEKPSAPENTEKTGVVNVSSSLNVREGASTSSKVIGSLSGNTKVIIVGEEGAFYKIEYKGSHGYVAKEYIKDVTESNNSNQGTQTPEKPSTPESTEKTGIVNVSSSLNVREGASTSSKVIGSLSGNTKVTIVGEEGAFYKIEYKGSHGYVAKEYVKDVTESNNSNQGTQTPEKPSTPESAEKTGVVNVSSSLNVREGASTSSKVIGSLSGNTKITIVGEEGAFYKIEYKGSHGYVAKEYIKDIKDEVVTEPEKPSTHENSKKTGVVTASKGLNVRKEANTSSQIIGILNSGESVEIIGEENGFYKITYKGQEAYASKNYINIFDGNSNVNPGLDIGNASKTNYGVSLNEYIKLQQRNNPSNYSYSEFEKYINPAKATNKLQFLRIDKFRSVNVSGLSSRLSNKGVLTGQGQAFVNAAKAFNIDPIYLVAQCLHETGNGTSKLAKGVTITEIADESKPIYNGNGQLVGYHMIKLSKPVTVYNLFGIGAKDNSSVFPNRALILGTTYAYNRGWTSIENAIKGAAEFVSLNYVHSSRYSQNTLYKMRYNQNVSNIWHQYATTPWYASSIADIMRSYQDLYLENNFTFDVPVFAG',
  'MKKESMSRIERRKAQQRKKTPVQWKKSTTLFSSALIVSSVGTPVALLPVTAEATEEQPTNAEVAQAPTTETGLVETPTTETTPGTTEQPTTDSSTTTESTTESSKETPTTPSTEQPTADSTTPVESGTTDSSVAEITPVAPSATESEAAPAVTPDDEVKVPEARVASAQTFSALSPTQSPSEFIAELARCAQPIAQANDLYASVMMAQAIVESGWGASTLSKAPNYNLFGIKGSYNGQSVYMDTWEYLNGKWLVKKEPFRKYPSYMESFQDNAHVLKTTSFQAGVYYYAGAWKSNTSSYRDATAWLTGRYATDPSYNAKLNNVITAYNLTQYDTPSSGGNTGGGTVNPGTGGSNNQSGTNTYYTVKSGDTLNKIAAQYGVSVANLRSWNGISGDLIFVGQKLIVKKGASGNTGGSGSGGSNNNQSGTNTYYTVKSGDTLNKIAAQYGVSVANLRSWNGISGDLIFVGQKLIVKKGASGNTGGSNNGGSNNNQSGTNTYYTIKSGDTLNKIAAQYGVSVANLRSWNGISGDLIFAGQKIIVKKGTSGNTGGSSNGGSNNNQSGTNTYYTIKSGDTLNKISAQFGVSVANLQAWNNISGSLIFAGQKIIVKKGANSGSTNTNKPTNNGGGATTSYTIKSGDTLNKISAQFGVSVANLRSWNGIKGDLIFAGQTIIVKKGASAGGNASSTNSASGKRHTVKSGDSLWGLSMQYGISIQKIKQLNGLSGDTIYIGQTLKVG',
  'MKKRLIAPMLLSAASLAFFAMSGSAQAAAYTDYSLYKVEPSNTFSTESQASQAVAKLEKDTGWDASYQASGTTTTYQISASGIHSESEAKAILSGLAKQTSITGTSSPVGSKQPYVTISSGAISGEKQANTILAKLKQETGVAGAVKAYGAAQPYMNVMTSDIADETKVKALIQSLAKQTGIKSSYQPITHTVSVTTIQSGTIVGDSRAAQIKNAFQKESGLQASLKETVKGQAYYTFTTAAISGEANAKTLLQQLKQSTGITGSYKSINQKTTVESYNVQSAYFKGLSTVKDAISQIKKNTGVSGSYQQVGKSTSYTVNMKGITKQQLQKIDTFFKKKKWHYTSSSVKKTTTSAAYQITTAKILGEQQANKAAAFFAQKKVKAAKTAAGSTAENQYQLISEETSDQAKVTKGLNILKKNQLSASAKSVKKQIADTFKITTESLLDQTKVNQALTFFKSNHISVASQKTGQTAASSYQITTEAIISQEEIDRVLTFFKQNHIAVTTSKTGQTAYTQYKIVTTQLSSKTALNNGLTYLKSKSVTPSYTTKSNTLYKISVNEQFTGNDTAAAASTKLKQLYGWTSSIVKIKNGPQIMKTNYNLSLRDMVQKQMTVSPQTDGAAYVSLTYINTATSTVTADVLNIRSTPEVSPTNVIGQFKKGDKVKVIGQINGWAKINLGWRNASSDEVVQYVDPNNFSRDSKYYFQFLKLSQTAGLSVTEVNQKVLAGKGILTGRAKAFIDAANQYSINELYLISHALLETGNGTSALANGLTYNGKTVYNMYGIGAYDSNPNYYGAKYAYEQGWFTPEAAIIGGAKFIGSSYIHNTAYNQDTLYKMRWSATATHQYATDIGWAYKQVNRMYSLYSLLDGYTLYFDVPEYR',
  'MARKKLKKRKLLISLFFLVSIPLALFVLATTLSKPIEISKETEEIDEQQVFIDSLSGHAQILYEKYHVLPSITIAQAILESDWGNSELAAKANNLFGVKGNYKGHHVTMETDEVEKGKRKTIRAKFRKYSTFFESMDDHAQLFVRGTSWNKKKYKPVLEAGNYKEAATALQTSGYATDPDYADKISAIVEKYDLDEYDEVNPSLKSVDLNASIKDSAVQDVWSKPSTDDRSIRLTSAQSYVGKDIKVVSKKQKGQSVWYQFQINDKLIGWIDDSAVEIKEAT',
  'MARKLIKNLGKSKSVKRVKLLFKKIFITVFIVASIVAIFNITKYFEELYKVRDLKSTKIEYYMDVADEAGDGKVQLSWKALLAIDMVIHDEDLSNIKKKDTLDIGEKFIVEDKNDKGEKVYKVKKFNKVLSELKFDSSQKSRARKYMKDLEYTYLGNKQLDSSDEKIKFIKKLEDSAIREYIDYGILPSITIGQAILESGWGNSKLTKQSNNLFGIKADKAWKGKSVEISTSEHYNEKIVASFRSYNSLQDSVKDHSLFLINNKRYRKHGLFEAKDYISQAQALENAGYSTAEDKKGNRIYAELLIDVIRSYNLQLIDNKVETK',
  'MFFLTLPLLLGCTAATTPLTAATPPVDPLPLKVVSTDQLPKGLAKDQQLWNKVNGQKGDYKALLTAIDHSLEYLGTDKAQKDYQDYKVPGITRDRVSRSLRRFRQLVVQAKSPQALETAVKKEFQFYQSIGNDQKGNVDFTGYYEATYPASRQPTTEFRYPLYQAPADLKAWPKPHPTRAELEGADGLQASQGPLKGLELVWLRDRIQAFLVQVQGSARLGLTDGTEMTVGYAGKTAHPYTSIGKALIADGKFTLEELSLPVVLQYFEENPQDLDLYIPKNKSFVFFQETFGSPPMGNLNVPVTDERSIATDKSLMPPGALALIQTNLPYYNASQTLEFKDVSRFVLDHDTGSAIKGPGRVDIFMGTGAKAKERAGVMTGSGQLYYLLLKDN',
  'MNTPFSIDEVSFRDLPGWGQDDPRKLFPAMATILSHLRNAKPYRTGALGITAAELVSLLELAERGQVNSPEQARQFFETNSVPFRISPAQGKSGFVTAFYEPELEVSATPDDVWRYPIYRRPPELVDIDNDNRPDGFDPSYAFGKADEEGISYFPDRRAIDEGCLRGRGLEIAWARSKVDLFFVHVQGAARLVFPDGAIKRITYAAKAGHVFSPIGRLLLDRGELDPKTISMQTIRQWLADHPDEVDGVLWHNRSYIFFREADVAGLDMGPIAAAKVPLVAGRALAVDRLIHTFGLPFFIHAPTLTHLDDGKPFARLMLALDTGSAIVGPARGDIFTGSGFEAGELAGTVRNEADFYILLPRIAAERYRR',
  'MRKIQVAVFLFVGLLAACSTVPPSSAPTTCAQCQPCPACPAVTPAITPAPAPAFSRSLLPASWGDLPGWAEDDVTAAWPAFMQSCRGIASRGNAAGWRRVCELARAADGKPENDVRRFFERHLKPYAIVNGDGLVSGLVTGYYEPMLRGSRTKAKGYEQPVRGVPDDLLTIDLSAVFPELKDKRVRGRLEGNKVVPYWSRAEIAARGDKLPGKTLLYVDDAVELFFLQVQGSGRVKLADGGMVRLNYADQNGYQYQSIGKALVERGELKLEEASMQGIQAWARANPARLESLLNTNPSYVFFREVANSADGPVGALGVPLTAERSIAIDPRSVPLGSPVFLATTRPNSAVPLNRLVMAQDTGGAIKGGVRADFFWGFGKEAGDQAGRMKQSGRMWILLPTELAPK',
  'MKGRWVKYLLMGTVVAMLAACSSKPTDRGQQYKDGKFTQPFSLVNQPDAVGAPINAGDFAEQINHIRNSSPRLYGNQSNVYNAVQEWLRAGGDTRNMRQFGIDAWQMEGADNYGNVQFTGYYTPVIQARHTRQGEFQYPIYRMPPKRGRLPSRAEIYAGALSDKYILAYSNSLMDNFIMDVQGSGYIDFGDGSPLNFFSYAGKNGHAYRSIGKVLIDRGEVKKEDMSMQAIRHWGETHSEAEVRELLEQNPSFVFFKPQSFAPVKGASAVPLVGRASVASDRSIIPPGTTLLAEVPLLDNNGKFNGQYELRLMVALDVGGAIKGQHFDIYQGIGPEAGHRAGWYNHYGRVWVLKTAPGAGNVFSG',
  'MKKYLFRAALCGIAAAILAACQSKSIQTFPQPDTSVINGPDRPVGIPDPAGTTVGGGGAVYTVVPHLSLPHWAAQDFAKSLQSFRLGCANLKNRQGWQDVCAQAFQTPVHSVQAKQFFERYFTPWQVAGNGSLAGTVTGYYEPVLKGDDRRTAQARFPIYGIPDDFISVPLPAGLRSGKALVRIRQTGKNSGTIDNTGGTHTADLSQFPITARTTAIKGRFEGSRFLPYHTRNQINGGALDGKAPILGYAEDPVELFFMHIQGSGRLKTPSGKYIRIGYADKNEHPYVSIGRYMADKGYLKLGQTSMQGIKAYMQQNPQRLAEVLGQNPSYIFFRELTGSSNDGPVGALGTPLMGEYAGAVDRHYITLGAPLFVATAHPVTRKALNRLIMAQDTGSAIKGAVRVDYFWGYGDEAGELAGKQKTTGYVWQLLPNGMKPEYRP',
  'MKFPFHPWRRLLLCALPFAALLTACDDGKKEPPPTPAEVTTYNSVPWDALPATSDADLLAGFNAWRSACARLAKDPVWGEPCASATTVAADPTAVRAFLQERMQVYSLRSSSNGDQGLITGYYEPVYHGSLSQGEKTPVPVYGVPDDLVVVALESVYPELKGKRLRGRLEGRVLKPYDDAATIRDNGSSAPVLAWLGDPMDLQFLQIQGSGRIQLEDGRQLRIGYGDQNGHPYKPVGRWLVEQGLVPKEEISMKRIRDWAEANPQRVSELLASNPSFVFFSLRPDSDEGPRGSLNVPLTDGYSVAIDRKVIPLGSLMWLSTTRPDDGSAVVRPVAAQDTGGAIVGEVRADLFWGTGDAAGELAGHMKQPGRLWLLWPKGAPLPAS',
  'MGAMNGTSGRRLSTATRVAAMAGVLLLAACGGPSSRPGLVSRPAGVAGPVSYQRVAIEGLPGWSTDRVADALPVFRRSCERLRAVSPNSMVGPSVWGSRASDWQAACAVAARLPAFDDDAARRFFAERFQAWQVTGAGDPTGLFTGYYEAALDGSLSPSAVYSTPIYGVPLDLRMEGGKGMRVSGGRSLPYPDRAAIEEGAISGVAPVIMWARDPVDVFMLHIQGSGQVRLPDGRIQRIGYAANNGHPFVGIGAIMRDRGLGDGSSMIAIRAWLRANPAEGRALMRENPRFIFFRPIEGEGPIGAQGLPLTGGRSLAVDPSSVPLGAPVWLATSDAHGETVNRLMVAQDTGSAIKGAVRGDFFWGSGEEALYHAGGMKSAGRYWVLVPRGGRNAVAQN',
  'MKGRWAKYVATGVMLAMLAACSSKPTDRGQQYKDGKFTQPFSLVNQPDAVGAPINAGDFAEQVNQIRSASPRLYTNQSNVYNAVQNWLRSGGDTRTMRQFGIDAWQMEGTDNYGNVQFTGYYTPVVQARHTRQGAFQYPIYSMPPKRGRLPSRAQIYAGALSDKYILAWSNSLMDNFIMDVQGSGYIDFGDGSPLNFFSYAGKNGWPYRSIGKVLIDRGEVKKEDMSMQAIREWGEKHSEAEVRELLEQNPSFVFFKPQSFAPVKGASAVPLIGRASVASDRSIIPPGTTLLAEVPLLDNNGKFSGQYELRLMVALDVGGAIKGQHFDIYQGIGPDAGHRAGWYNHYGRVWVLKSAPGAGNVFSG',
  'MFKRRYVTLLPLFVLLAACSSKPKPTETDTTTGTPSGGFLLEPQHNVMQMGGDFANNPNAQQFIDKMVNKHGFDRQQLQEILSQAKRLDSVLRLMDNQAPTTSVKPPSGPNGAWLRYRKKFITPDNVQNGVVFWNQYEDALNRAWQVYGVPPEIIVGIIGVETRWGRVMGKTRILDALATLSFNYPRRAEYFSGELETFLLMARDEQDDPLNLKGSFAGAMGYGQFMPSSYKQYAVDFSGDGHINLWDPVDAIGSVANYFKAHGWVKGDQVAVMANGQAPGLPNGFKTKYSISQLAAAGLTPQQPLGNHQQASLLRLDVGTGYQYWYGLPNFYTITRYNHSTHYAMAVWQLGQAVALARVQ',
  'MFALTAYRLRCAAWLLATGIFLLLAGCSEAKAPTALERVQKEGVLRVITRNSPATYFQDRNGETGFEYELAKRFAERLGVELKIETADNLDDLYAQLSREGGPALAAAGLTPGREDDASVRYSHTYLDVTPQIIYRNGQQRPTRPEDLVGKRIMVLKGSSHAEQLAELKKQYPELKYEESDAVEVVDLLRMVDVGDIDLTLVDSNELAMNQVYFPNVRVAFDFGEARGLAWALPGGDDDSLMNEVNAFLDQAKKEGLLQRLKDRYYGHVDVLGYVGAYTFAQHLQQRLPRYESHFKQSGKQLDTDWRLLAAIGYQESLWQPGATSKTGVRGLMMLTNRTAQAMGVSNRLDPKQSIQGGSKYFVQIRSELPESIKEPDRSWFALAAYNIGGAHLEDARKMAEKEGLNPNKWLDVKKMLPRLAQKQWYAKTRYGYARGGETVHFVQNVRRYYDILTWVTQPQMEGSQIAESGLHLPGVNKTRPEEDSGDEKL',
  'MIGADTAKECDAMTFKLLPLAVLCAALVGCQSAQSRDARAESPATAESAAPTAEAPVSEAQEADFETWLANFRRQARGEGIDEATLARALDGLRYRPRVIELDGSQPEFVRPIWEYLDSAVSASRVKKGRERLAEYRDTVRQMTERYGVPGEVLVAIWGIESSYGDYLGDFSTLEALATLAYDGRRRDFARGELLAALRIIEAGDISPERMKGSWAGAMGHTQFIPSSFLAHAVDGDGDGRRDIWNSIADVLASTANYLDEAGWREGEPWGTEVSLPQGFDYTLTEPDIRRSSAEWAAAGVRSRDGHALPDFASASVIAPAGAQGPVFLVGHNFRVILRYNNATSYALAVATLSDAIAGRAGIQGEWPREQPALKRSEVREMQQLLDARGFDVGTPDGILGPNTRRGLRAFQREIGVTPDGFATKALLERLRR',
  'MPGLPRARMAQWHPLYSVRLAKDTMTDTQRSLRRPLLGAALSAAALGLCGLSPSLLAAGKRRVSLREEEIEPGRYRDNPQARAFIDEMVARHGFDRGMLQDWFGQAVYSATVVRLIMPPATTGRKSWRTYRSRFIEPIRINAGVRFWQDNRDTLRRAEAEFGVPASVIVGIIGVETIYGRDMGSFRVLDSLSTLAFDYPATPNREARSTLFRNQLADYLLWCRDTRTDVYSVLGSYAGAIGIPQFMPTSLREYALDYDNNGHIDLRNSPTDAIGSVARFLQLHGWEPGRPVVWRIAPDDGSLGVATAAADGEPWPTRTLNQLTRAGLRVDEPINLAREGETGVLVVDLPTPDQPTEYLLGLRNFYVLTRYNRSFFYALAVYQLGEAVKAAMG',
  'MFGILNRREMLRGTAATLLLPGILTSAHAGQVAEDPLLRYPWLAQWAGADGLDAPWLRGVFQNLKKYPRVIRAMNHQAEAKPFYLYREHVTSPWLYKKGREAWQQHRAMLEAAGARYGVDAPFVLALWGMESRFGRNQGEHPVLRTLFTLAVDYPRRQTFFRQELRHFLILCRQQGWDPMLLKGSYAGAMGHVQMIPSSLRYYAVDGDGDGRLDVFNNPMDATASIAHYLGKHGWELGGPYLIPVYGITDLSAIKSAKVKEMQPWSSWYALGVRTRGEPPPAERAMALIALEEQDGLRYYGVFNNFRVILDWNRSTRFAKVVGELAEGFVL',
  'MPTPATRASLIGLALASGLLAGPARADFQSCLAGIQAQAAGAGVSAQTFRAATANIAYDDKVIELSQAQPEFKTPIWDYMSALVDEERVEDGRAAMRQHAQALANAEARYGVDRHTIAAVWGVESNFGKNLGKMPLVQSLATLACSSNRRRDFFRSELIATLKIIERGDIEASRLTGSWAGAFGQTQFMPTTYQRLAVDGDGDGRRDVVDSVADAVASTANFLRVAKWSNGQPWGYEVRLPRGFNVAAAGRKNKHAVGHWASLGVTRVDGKALTGDGPAGIIAPAGINGPAFLVTKNFDAIYSYNAAESYGLAIAVLSDRLRGRPGVQADWPTDDPPLSRAERRDLQTRLTARGYDVGEPDGKVGSKTREAIKEIERQLGMPATGRPGGKVLEALRRG',
  'MFKYSFIAVIVSTVLLSACADSHQKSAEKKPVTSEIANIATSAPARWKQIDVVSLEQAFPKQSRTPAQFPAYVDALKQKAAELGYKPETINFAFSEIHFIDRVVKSDRNQPEKKITLDVYLPRVVTKGRIAEGAKLYQANQQTLAQISNQYGVPANYIVALWGLESGFGRVQGKEDVISALATLAFEGRREALFSRQLMAALEIIENGHLPVGQRLKGSWAGAMGQTQFMPSSFLTYAADGNGDGNIDIWNSREDAFASAANYLATEGWQRDLPWGEQVSLPANFNQQLEGIKTEQQKTVAQWKALGVQLPANSQLSDDMKVWLIIPDDDLHRSYLVTQNFRTIMHWNSSYFFALSIVTMADGVANKINTLPTQH',
  'MKKESRPAFDAAAVFDAAAVPVSDSGFAANANVRRFVDDEVGKGDFSRAEWQDFFDKAAYKADIVKIMHRPSTSRPWYVFRTGNSGKAKFRGARRFYAENRALIDDVAQKYGVPAELIVAVIGIETNYGKNTGSFRVADALATLGFDYPRRAGFFQKELVELLKLAKEEGGDVFAFKGSYAGAMGMPQFMPSSYRKWAVDYDGDGHRDIWGNIGDVAASVANYMKQHGWRTGGKILVSATLAPGADVQAIIGEKTALTRTVADLKAYGIIPGEELADDEKAVLFKLETAPGVFEYYLGLNNFYTVWQYNHSRMYVTAVRDIANSLGGSGL',
  'MASSSSSKQAKPIHRMAWRLGVSLTLLLGLGALFVLPKFDPKSLTWPTTEPGRIAPLAMSGGNPYLRALMRTISASESNDASPYTVLYGGSHIENLQEHPDRCIPIRWGPNQGLCTTAAGRYQFITTTWLETAEKYHPAPTGEWMWRRYSFAPEYQDRVVYAWLDDVNYWGTDIPQLLEDGQLQTVLKRLSGTWTSLGYGIESNKVTPHLMHIYERMLAEEIALANGLPTNYLPTVANQSVETTR',
  'MIIQHSQPKRKGTKYRLKKPYKLVFNLIIVVGLIGLVYSFKKNTQPLVNPSLVTHLPELEMSGGDPYIRALMLTISASESNHKNSYYLLYGGSHVHNLQQHPDQCIPINIGPNRGNCSTAAGRYQFLNSTWQEKARKYHPNPQKNYRQYIYSFEPKYQDIVVYRWLKDHHQWNVDLLTLLKQDQVEEVLRKLSNVWTSLGGGIEDNSMTPHLPSIYRYFLAQELNRENADQNSL',
  'MVEINNQRKAFLDMLAWSEGTDNGRQKTRNHGYDVIVGGELFTDYSDHPRKLVTLNPKLKSTAAGRYQLLSRWWDAYRKQLGLKDFSPKSQDAVALQQIKERGALPMIDRGDIRQAIDRCSNIWASLPGAGYGQFEHKADSLIVKFKEAGGTVREIEV',
  'MGYTWKGLAKQYGFTDFSPATQDKAAVALILAKKGAMEAILNGDYEQAVMKLGGIWASFPTAPNEYRQHKRSWGFVHNFFRQRGF',
  'MARISAADAGGVNVIAFLDMLAWSEGTSTIKASDYGYDVLVGGKLFSEYSKHPRVKVWLPKYSIYSSAAGRYQFLAGTWDAIVKNYGFKGRFIPEAQDLAAIKLLTECGALPLIKAGRIVEAIAKAAPIWASLPGAGYGQREHKLAALLGIYEAERAAEAKPQDQLLAMFSACGGEMAA',
  'MTRYEFALLALAAVGYVVWRDWQRSEEPGAQSPDFIDQAENLFYDATEGNFFGGTEDTDMGQAQLNRAAFLLTIRTGEGTAGNDGYRMLFGGGKFDSFADHPRQVVTALSNGKPISSSAAGAYQFLRRTWDTLAARLGLTDFSPASQDAAALELIREAGALGDVDAGRFALAVRKVRKIWASMPGAGYGQPEVALERLQAAYQAAGGVVNG',
  'MPVINTHQNIAAFLDMLAYSEGTANHPLTKNRGYDVIVTSLDGRPEIFTDYSDHPFAHGRPAKVFNRRGEKSTASGRYQQLYMFWPHYKKQLALPDFSPLSQDKLAIQLIRERGAIDDIRAGRIERAVSRCRNIWASLPGAGYGQREHSLEKLVTVWRTAGGVVA',
  'MYSQQVQQINQPQKNSDIQLINMWLQQIHPIQQNSHLYIAQMFLKFIKKPLKKVTSADVIAFANVYGVRSHNSHSNQQKRIETINSLLKFGQEAGILPRNQKKTFSPNTTNFKTSVYSQNKIKNYRTTGKQQKKPLNWSQLFNLQLASSVLIVFILLMAILQLFRQVSGSTNANQNKSVTSVVMPKIDPTKNWAYPVNVPRIRAFLDTIAVTEGTTGPKGYYRQYTGSHFLSFEDHPRELKCANSNGKKLCSDAAGRYQFLSTSWDRFAPVVKAQNFSPTYQDRVAIELIRDKNALKDIEEGRVKEAFQKLYMVWPSFGETETDVEQLMPKLVGTYEQKLALYQIKN',
  'MDDEFERAFKKILDYEGGYSDEQKDHGGKTKYGITEKLARDYGHEGEMKDLELEKAKEIYYREFWANHLYSWIEDERIATEVFEQAVNMGAKTANKHLQKAYNLLADKEIAVDGIIGQRTLEAVNNFEHNSDLFKLLNILQAKKYINIVKNDASQQKFIRGWLRRVELDIDSRKS',
  'MKRNFQTVMPYIFSEEGGYADNPADPGGATNMGITINTLSAWEGRQVSPQDVKELTQATATQIYQVEFWNKIDGNDLPSGVDYALFDFAVNSGPGRAAKTLQKILAMPEDGIIGAQTVAAAAARSPEGIINALCDARAAWLRGLSTAATFGNGWLARVERVRARALALAATPPAITQPADPAGNPSPKARQADIAFTSALKHPEALGTMGSVASGLAAIATGNGPVQYALAIVMVACAGVGLWYFVRRVRSEP',
  'MNFDQAFDRLLGHEGGYSNNSADPGGETMWGVTARVARADGYLGEMRDLPRDRAKSIYRRLYWTPVRADELPEVVRFDVFDGAVNSGPAQSIKWLQRAAGAVDDGILGPRTMAAAVAAGPVLAARYNGHRLLFLADRPTWGSFGKGWARRVGKNLLGA',
  'MDQPPWLQAAWAEFGVREIPGKEDAPEILRYFRDAGDTNVETEATPWCAAFLGAMLKRAGYAGTGSLLARSYLDWGDRLDDARFGAVAVLSRGDDPNAGHVGFLLSDTNGKLYLLGGNQGDAVTVASFDKARLLGLRWPKENVEAASKGDDAIFSRVLAHVLEMEGGFSNDPYDPGGPTNRGITLEVYAKFRKETLDDGTRARLIAELKRIPDAIVTAIYRQRYFDPASCPVFTAPLALMHFDAAVNHGVGAAIRMLQGVAGVTVDGEIGPETLAAIGAKSLADLLDDYAETRRARYRALPHFWRFGRGWLKRVDATLALARTWAAAEATNRGLIEPQQIAKGEGKMGEKSKTEISSSDDSKWWLNSKTMWGTLITAAATVIPVLGPAVGIVLPADLITSFGDQVVTAAQALAGLFGTALAIYGRLKADTPLVLRKN',
  'MSAPLTFQQVFDRVVGHEGGYVNDPHDPGGETNWGITKYTARENGYTGSMKAMTREQAYKIYEKAFWQRYHCEKLPEAVAFQFFDAAVNHGVGNASRMLQRAVNVADDGIIGKVTLSAVEKMPISDLLLRFNAERIRFYTKLKNFPRYGKGWMNRIAGNLAYAAIDNEV',
  'MNPIIDGIIALEGGYVFNPKDKGGATHWGITEATARAHGYAGDMRDLTHAEAYAILEEDYWIKPGFDVISTLSWPVSFELCDAAVNIGAYHPSAWLQRWLNVFNHEGKRYPDIHVDGNIGPRTLAALEHYLAWRGQEGEAVLVKALNCSQGTYYLNVAEKNHNNEQFIYGWIKNRVT',
  'MDSFEDAFKALIGNEGGYSFNPADPGGETMWGVTARVARSEGYNGAMKDLPLETAHQIAKRRYWDPLHLDELDPRVAFQIFDANYNGGLVVLWMQKASGAKEDGKFGPDTLDAVKNADPMKFVMRFAAYRLRYLRNLHSWPSFSRGWTERMAANLLLGAA',
  'MSQTATLSDFNKAFDRVIQHEGGYVNDPRDAGGETKFGITIHTARANGYTGSMFTMTRDDAKQIYLKAFWQRYRCNEFPPELAFQFFDACVNHGSGNASRMLQRAVGVVDDGIIGEITLAAIRKRSTVEVVTLFNAERLEFYTKLSGFQHFGKGWIRRMAGNLRHIADDVGDK'],
 'letters': 'MRKFNKPLLALLIGSTLCSAAQAAAPGKPTIAWGNTKFAIVEVDQAATAYNNLVKVKNAADVSVSWNLWNGDAGTTAKILLNGKEAWSGPSTGSSGTANFKVNKGGRYQMQVALCNADGCTASDATEIVVADTDGSHLAPLKEPLLEKNKPYKQNSGKVVGSYFVEWGVYGRNFTVDKIPAQNLTHLLYGFIPICGGNGINDSLKEIEGSFQALQRSCQGREDFKVSIHDPFAALQKAQKGVTAWDDPYKGNFGQLMALKQAHPDLKILPSIGGWTLSDPFFFMGDKVKRDRFVGSVKEFLQTWKFFDGVDIDWEFPGGKGANPNLGSPQDGETYVLLMKELRAMLDQLSAETGRKYELTSAISAGKDKIDKVAYNVAQNSMDHIFLMSYDFYGPFDLKNLGHQTALNAPAWKPDTAYTTVNGVNALLAQGVKPGKVVVGTAMYGRGWTGVNGYQNNIPFTGTATGPVKGTWKNGIVDYRQIAGQFMSGEWQYTYDATAEAPYVFKPSTGDLITFDDARSVQAKGKYVLDKQLGGLFSWEIDADNGDILNSMNASLGNSAGVQMSTRKAVIGYYFIPTNQINNYTETDTSVVPFPVSNITPAKAKQLTHINFSFLDINSNLECAWDPATNDAKARDVVNRLTALKAHNPSLRIMFSIGGWYYSNDLGVSHANYVNAVKTPAARTKFAQSCVRIMKDYGFDGVDIDWEYPQAAEVDGFIAALQEIRTLLNQQTIADGRQALPYQLTIAGAGGAFFLSRYYSKLAQIVAPLDYINLMTYDLAGPWEKITNHQAALFGDAAGPTFYNALREANLGWSWEELTRAFPSPFSLTVDAAVQQHLMMEGVPSAKIVMGVPFYGRAFKGVSGGNGGQYSSHSTPGEDPYPNADYWLVGCDECVRDKDPRIASYRQLEQMLQGNYGYQRLWNDKTKTPYLYHAQNGLFVTYDDAESFKYKAKYIKQQQLGGVMFWHLGQDNRNGDLLAALDRYFNAADYDDSQLDMGTGLRYTGVGPGNLPIMTAPAYVPGTTYAQGALVSYQGYVWQTKWGYITSAPGSDSAWLKVGRLAMLSFVKKSIALVAALQAVTALATPISSEAGVEKRGSGFANAVYFTNWGIYGRNFQPADLPASEITHVLYSFMNVRADGTIFSGDTYADYEKHYAGDSWNDVGTNAYGCVKQLYLLKKQNRNMKVMLSIGGWTWSTNFPAAASSAATRKTFAQSAVGFMKDWGFDGIDIDWEYPADATQAQNMVLLLQAVRSELDSYAAQYAKGHHFLLSIAAPAGPDNYNKLKFAELGKVLDYINLMAYDYAGSWSNYTGHDANIYANPQNPNATPYNTDDAVQAYINGGVPANKIVLGMPIYGRSFQQTEGIGKPYNGIGSGSWENGIWDYKALPKAGATVKCDDTAKGCYSYDPSTKELISFDTPAMISTKVSWLKGKGLGGTMFWEASASKKGSDSLISTSHQGLGSQDSTQNYLDYPNSKYDNIKKGMNMILNLIILLAISIVASASNIAAYWGQNAGGDQQTLGDYCSSSPASIIILSFLDGFPNLSLNFANQCSGTFSSGLAHCSQIGSDIKSCQQQGKTILLSLGGATGNYGFSSDSEAVQFAGTLWNKFGGGKDSERPFDDAIVDGFDFDIENKDQTGYAALATQLRKYFSTGTKSYYLSAAPQCPYPDESVGDLMSQVDLDFAFIQFYNNYCSLNQQFNWNSWSNYARGKSIKLYLGLPGSSSSAGSGFVGLSTVQRVVASIKGDSSFGGISIWDISSAENGGYLNQLYQALSGSGSPAAPSNSYQPNTPLTRTYGGSTATASAYISVGFTAGATHGSTTTNDLLAWIDSLFGSSQSSVQQYATPVQSVTATPQPVAATTTSAPKPTASAFNWFGWFDGTTTSTTLQTVYSTVPADQTVYVTLTTTVGSQMLQSLFDKRDVIAEAKSTNLQICWLLFIPLLALICSMAKRTQAILLLLLAISLIMSSSHVDGGGIAIYWGQNGNEGTLTQTCSTRKYSYVNIAFLNKFGNGQTPQINLAGHCNPAAGGCTIVSNGIRSCQIQGIKVMLSLGGGIGSYTLASQADAKNVADYLWNNFLGGKSSSRPLGDAVLDGIDFDIEHGSTLYWDDLARYLSAYSKQGKKVYLTAAPQCPFPDRYLGTALNTGLFDYVWVQFYNNPPCQYSSGNINNIINSWNRWTTSINAGKIFLGLPAAPEAAGSGYVPPDVLISRILPEIKKSPKYGGVMLWSKFYDDKNGYSSSILDSVLFLHSEECMTVLMTKLILLTGLVLILNLQLGSAYQLTCYFTNWAQYRPGLGRFMPDNIDPCLCTHLIYAFAGRQNNEITTIEWNDVTLYQAFNGLKNKNSQLKTLLAIGGWNFGTAPFTAMVSTPENRQTFITSVIKFLRQYEFDGLDFDWEYPGSRGSPPQDKHLFTVLVQEMREAFEQEAKQINKPRLMVTAAVAAGISNIQSGYEIPQLSQYLDYIHVMTYDLHGSWEGYTGENSPLYKYPTDTGSNAYLNVDYVMNYWKDNGAPAEKLIVGFPTYGHNFILSNPSNTGIGAPTSGAGPAGPYAKESGIWAYYEICTFLKNGATQGWDAPQEVPYAYQGNVWVGYDNIKSFDIKAQWLKHNKFGGAMVWAIDLDDFTGTFCNQGKFPLISTLKKALGLQSASCTAPAQPIEPITAAPSGSGNGSGSSSSGGSSGGSGFCAVRANGLYPVANNRNAFWHCVNGVTYQQNCQAGLVFDTSCDCCNWAMKKFINQFSASLKNNILVFLAFPFVWTSCARDNPLSSENSNISPNAAARAAVTGTTKANIKLFSFTEVNDTNPLNNLNFTLKNSGKPLVDMVVLFSANINYDAANDKVFVSNNPNVQHLLTNRAKYLKPLQDKGIKVILSILGNHDRSGIANLSTARAKAFAQELKNTCDLYNLDGVFFDDEYSAYQTPPPSGFVTPSNNAAARLAYETKQAMPNKLVTVYVYSRTSSFPTAVDGVNAGSYVDYAIHDYGGSYDLATNYPGLAKSGMVMSSQEFNQGRYATAQALRNIVTKGYGGHMIFAMDPNRSNFTSGQLPALKLIAKELYGDELVYSNTPYSKDWMKLNIFTKSMIGMGLVCSALPALAMEAWNNQQGGNKYQVIFDGKIYENAWWVSSTNCPGKAKANDATNPWRLKRTATAAEISQFGNTLSCEKSGSSSSSNSNTPASNTPANGGSATPAQGTVPSNSSVVAWNKQQGGQTWYVVFNGAVYKNAWWVASSNCPGDAKSNDASNPWRYVRAATATEISETSNPQSCTSAPQPSPDVKPAPDVKPAPDVQPAPADKSNDNYAVVAWKGQEGSSTWYVIYNGGIYKNAWWVGAANCPGDAKENDASNPWRYVRAATATEISQYGNPGSCSVKPDNNGGAVTPVDPTPETPVTPTPDNSEPSTPADSVNDYSLQAWSGQEGSEIYHVIFNGNVYKNAWWVGSKDCPRGTSAENSNNPWRLERTATAAELSQYGNPTTCEIDNGGVIVADGFQASKAYSADSIVDYNDAHYKTSVDQDAWGFVPGGDNPWKKYEPAKAWSASTVYVKGDRVVVDGQAYEALFWTQSDNPALVANQNATGSNSRPWKPLGKAQSYSNEELNNAPQFNPETLYASDTLIRFNGVNYISQSKVQKVSPSDSNPWRVFVDWTGTKERVGTPKKAWPKHVYAPYVDFTLNTIPDLAALAKNHNVNHFTLAFVVSKDANTCLPTWGTAYGMQNYAQYSKIKALREAGGDVMLSIGGANNAPLAASCKNVDDLMQHYYDIVDNLNLKVLDFDIEGTWVADQASIERRNLAVKKVQDKWKSEGKDIAIWYTLPILPTGLTPEGMNVLSDAKAKGVELAGVNVMTMDYGNAICQSANTEGQNIHGKCATSAIANLHSQLKGLHPNKSDAEIDAMMGTTPMVGVNDVQGEVFYLSDARLVMQDAQKRNLGMVGIWSIARDLPGGTNLSPEFHGLTKEQAPKYAFSEIFAPFTKQMSTPRAAASLAKKAALVALAVLAAALATAARAEQCGAQAGGARCPNCLCCSRWGWCGTTSDFCGDGCQSQCSGCGPTPTPTPPSPSDGVGSIVPRDLFERLLLHRNDGACPARGFYTYEAFLAAAAAFPAFGGTGNTETRKREVAAFLGQTSHETTGGWPTAPDGPFSWGYCFKQEQNPPSDYCQPSPEWPCAPGRKYYGRGPIQLSFNFNYGPAGRAIGVDLLSNPDLVATDATVSFKTALWFWMTPQGNKPSSHDVITGRWAPSPADAAAGRAPGYGVITNIVNGGLECGHGPDDRVANRIGFYQRYCGAFGIGTGGNLDCYNQRPFNSGSSVGLAEQMPPQKENHRTLNKMKTNLFLFLIFSLLLSLSSAEQCGRQAGGALCPNGLCCSEFGWCGNTEPYCKQPGCQSQCTPGGTPPGPTGDLSGIISSSQFDDMLKHRNDAACPARGFYTYNAFITAAKSFPGFGTTGDTATRKKEVAAFFGQTSHETTGGWATAPDGPYSWGYCFKQEQNPASDYCEPSATWPCASGKRYYGRGPMQLSWNYNYGLCGRAIGVDLLNNPDLVANDAVIAFKAAIWFWMTAQPPKPSCHAVIAGQWQPSDADRAAGRLPGYGVITNIINGGLECGRGQDGRVADRIGFYQRYCNIFGVNPGGNLDCYNQRSFVNGLLEAAIMRLCKFTALSSLLFSLLLLSASAEQCGSQAGGARCPSGLCCSKFGWCGNTNDYCGPGNCQSQCPGGPTPTPPTPPGGGDLGSIISSSMFDQMLKHRNDNACQGKGFYSYNAFINAARSFPGFGTSGDTTARKREIAAFFAQTSHETTGGWATAPDGPYAWGYCWLREQGSPGDYCTPSGQWPCAPGRKYFGRGPIQISHNYNYGPCGRAIGVDLLNNPDLVATDPVISFKSALWFWMTPQSPKPSCHDVIIGRWQPSAGDRAANRLPGFGVITNIINGGLECGRGTDSRVQDRIGFYRRYCSILGVSPGDNLDCGNQRSFGNGLLVDTMMRSLAVVVAVVATVAMAIGTARGSVSSIVSRAQFDRMLLHRNDGACQAKGFYTYDAFVAAAAAFPGFGTTGSADAQKREVAAFLAQTSHETTGGWATAPDGAFAWGYCFKQERGASSDYCTPSAQWPCAPGKRYYGRGPIQLSHNYNYGPAGRAIGVDLLANPDLVATDATVGFKTAIWFWMTAQPPKPSSHAVIAGQWSPSGADRAAGRVPGFGVITNIINGGIECGHGQDSRVADRIGFYKRYCDILGVGYGNNLDCYSQRPFAMGAFALFAVLAMAVTMAVAEQCGSQAGGATCPNCLCCSRFGWCGSTSDYCGDGCQSQCAGCGGGGTPVTPTPTPSGGGGVSSIVSRALFDRMLLHRNDGACQAKGFYTYDAFVAAAGAFPGFGTTGSTDTRKREVAAFLAQTSHETTGGWATAPDGAFAWGYCFKQERGATSNYCTPSAQWPCAPGKSYYGRGPIQLSHNYNYGPAGRAIGVDLLRNPDLVATDPTVSFKTAMWFWMTAQAPKPSSHAVITGQWSPSGTDRAAGRVPGFGVITNIVNGGIECGHGQDSRVADRIGFYKRYCDILRVGYGNNLDCYNQRPFAMRLSEFTTLFLLFSVLLLSASAEQCGSQAGGALCASGLCCSKFGWCGNTNEYCGPGNCQSQCPGGPGPSGDLGGVISNSMFDQMLNHRNDNACQGKNNFYSYNAFVTAAGSFPGFGTTGDITARKREIAAFLAQTSHETTGGWPTAPDGPYAWGYCFLREQGSPGDYCTPSSQWPCAPGRKYFGRGPIQISHNYNYGPCGRAIGVDLLNNPDLVATDPVISFKSAIWFWMTPQSPKPSCHDVITGRWQPSGADQAANRVPGFGVITNIINGGLECGHGSDSRVQDRIGFYRRYCGILGVSPGENLDCGNQRSFGNGLLVDIMQNCQCDTTIYCCSQHGYCGNSYDYCGPGCQAGPCWDPCEGDGTLTVSDIVTQEFWDGIASQAAANCPGKSFYTRSNFLEAVSAYPGFGTKCTDEDRKREIAAYFAHVTHETGHLCYIEERDGHANNYCQESQQYPCNPNKEYFGRGPMQLSWNYNYIDAGKELHFDGLNDPDIVGRDPIISFKTSLWFWIRKGVQYVILDPNQGFGATIRIINGGQECDGHNTAQMMARVGYYQEYCAQLGVSPGNNLPCMKKNRMMMMIWSVGVVWMLLLVGGSYGEQCGRQAGGALCPGGNCCSQFGWCGSTTDYCGPGCQSQCGGPSPAPTDLSALISRSTFDQMLKHRNDGACPAKGFYTYDAFIAAAKAYPSFGNTGDTATRKREIAAFLGQTSHETTGGWATAPDGPYAWGYCFVRERNPSTYCSATPQFPCAPGQQYYGRGPIQISWNYNYGQCGRAIGVDLLNKPDLVATDSVISFKSALWFWMTAQSPKPSSHDVITSRWTPSSADVAARRLPGYGTVTNIINGGLECGRGQDSRVQDRIGFFKRYCDLLGVGYGNNLDCYSQTPFGNSLLLSDLVTSQMRSLLILVLCFLPLAALGKVFGRCELAAAMKRHGLDNYRGYSLGNWVCAAKFESNFNTQATNRNTDGSTDYGILQINSRWWCNDGRTPGSRNLCNIPCSALLSSDITASVNCAKKIVSDGNGMNAWVAWRNRCKGTDVQAWIRGCRLMKALIVLGLVLLSVTVQGKVFERCELARTLKRLGMDGYRGISLANWMCLAKWESGYNTRATNYNAGDRSTDYGIFQINSRYWCNDGKTPGAVNACHLSCSALLQDNIADAVACAKRVVRDPQGIRAWVAWRNRCQNRDVRQYVQGCGVMKAFIVLVALACAAPAFGRTMDRCSLAREMSNLGVPRDQLNKWACIAEHESSYRTGVVGPENYNGSNDYGIFQINDYYWCAPPSGRFSYNECGLSCNALLTDDITHSVRCAQKVLSQQGWSAWSTWHYCSGWLPSIDDCFKIFSKCELARKLKSMGMDGFHGYSLANWVCMAEYESNFNTQAFNGRNSNGSSDYGIFQLNSKWWCKSNSHSSANACNIMCSKFLDDNIDDDIACAKRVVKDPNGMSAWVAWVKHCKGKDLSKYLASCNLMTKYVILLAVLAFALHCDAKRFTRCGLVQELRRLGFDETLMSNWVCLVENESGRFTDKIGKVNKNGSRDYGLFQINDKYWCSKGTTPGKDCNVTCNQLLTDDISVAATCAKKIYKRHKFDAWYGWKNHCQHGLPDISDCKVYDRCEFARILKKSGMDGYRGVSLANWVCLAKWESDFNTKAINRNVGSTDYGIFQINSRYWCNDGKTPKAVNACHISCKVLLDDDLSQDIECAKRVVRDPQGIKAWVAWRTHCQNKDVSQYIRGCKLMKAVIILGLVLLSVTVQGKIFERCELARTLKRLGLDGYRGISLANWVCLAKWESDYNTQATNYNPGDQSTDYGIFQINSHYWCNNGKTPGAVNACRISCNALLQDNIADAVTCAKRVVRDPQGIRAWVAWRNHCQNRDVSQYVQGCGVKIYEQCEAAREMKRLGLDGYDGYSLGDWVCTAKHESNFNTGATNYNRGDQSTDYGIFQINSRWWCNDGKTPNAKNACGIECSELLKADITAAVICAKRVVRDPNGMGAWVAWTKYCKGKDVSQWIKGCKLMSALWLLLGLLALMDLSESSNWGCYGNIQSLDTPGASCGIGRRHGLNYCGVRASERLAEIDMPYLLKYQPMMQTIGQKYCMDPAVIAGVLSRKSPGDKILVNMGDRTSMVQDPGSQAPTSWISESQVSQTTEVLTTRIKEIQRRFPTWTPDQYLRGGLCAYSGGAGYVRSSQDLSCDFCNDVLARAKYLKRHGFRTDCYGNVNRIDTTGASCKTAKPEGLSYCGVSASKKIAERDLQAMDRYKTIIKKVGEKLCVEPAVIAGIISRESHAGKVLKNGWGDRGNGFGLMQVDKRSHKPQGTWNGEVHITQGTTILINFIKTIQKKFPSWTKDQQLKGGISAYNAGAGNVRSYARMDIGTTHDDYANDVVARAQYYKQHGYMVPSVVFWGLIALVGTAKGSYTHSVHSMNPHVHPRLYHGCYGDIMTMETFGAPCDINNLMNCGIHGSEMFAEMDLKAIKPYRILIKEVGQRHCIDPALIAAIISRESHGGAVLQNGWDHKGQRFGLMQLDKNMYHPIGSWDSKEHLLQSVGILTERIKAMKRKFPTWNTAQQLKGGLTAFKSGMETIVTPADIDGDLVDDVLARAKFYKRHGFMGYGNIMNVETTGASWQTAQQDKLGYSGVRASHTMANTDSGRMERYRSKINSVGAKYGIDPALIAAIISEESRAGNVLHDGWGDYDSNRGAYNAWGLMQVDVNPNGGGHTARGAWDSEEHLSQGAEILVYFIGRIRNKFPGWNTEQQLKGGIAAYNMGDGNVHSYDNVDGRTTGGDYSNDVVARAQWYKTQKGFMPYGKIEDIKTSGASDVTAAQDGLKEGGWKSSHRMAEIDSNRMENYRTIINEAGRQCDVDPAVIAGIISRESRAGNQLINGWGDHGKAFGLMQIDVTPPPNGGGHTPVGTWDSLEHLIQATEILVEFIERIKTKFPRWNADQHLKGALAAYNKGEKNVESYASVDAKTTGKDYSNDVVARAQWYKSNMGFMKCLVALFLSLSLVACQYDDYDTERKNNNMLSSMNILDLLDSFGLNIKARIAHVRRVAGRIRLTLDIGLGNGDVERESEEAEGEGTDGRGGGEGEREGWGGEREGGEGEREGGEGEREGREGEREGKSSESNESPEDFIGPPVDMCAGESRRGSPSIGCIAAECCQHSFYINSLCPGSSVCCFSMDVCDRLPVPVIPPFPTDPGTLPPPPPIPDSQTTVSPNQPSSYMCHGDFMKLMPKGADQRTARQDNLAYAGVRASNKLVDNDLAELNKRKDCYVQAGKNHCIHPAVIAAIASRETRGGKLLYSTNGYGDGGRAYGIMQCDGGASGLGDICKKYPWDSCEHINQLTDIILLNYVNQMKTKHPSWPAHYQLKGGVSAYNAGVGNVQTIAGMDAGTTNDDYSNDVIARAQRLVNAHGWMLGKNDPMCLVLVLLGLTALLGICQGGTGCYGSVSRIDTTGASCRTAKPEGLSYCGVRASRTIAERDLGSMNKYKVLIKRVGEALCIEPAVIAGIISRESHAGKILKNGWGDRGNGFGLMQVDKRYHKIEGTWNGEAHIRQGTRILIDMVKKIQRKFPRWTRDQQLKGGISAYNAGVGNVRSYERMDIGTLHDDYSNDVVARAQYFKQHGYMHLMLVLLGLAALLGTSQSRTGCYGDVNRVDTTGASCKSAKPEKLNYCGVAASRKIAERDLQSMDRYKALIKKVGQKLCVDPAVIAGIISRESHAGKALRNGWGDNGNGFGLMQVDRRSHKPVGEWNGERHLMQGTEILISMIKAIQKKFPRWTKEQQLKGGISAYNAGPGNVRSYERMDIGTTHDDYANDVVARAQYYKQHGYMNIFEMLRIDEGLRLKIYKDTEGYYTIGIGHLLTKSPSLNAAKSELDKAIGRNCNGVITKDEAEKLFNQDVDAAVRGILRNAKLKPVYDSLDAVRRCALINMVFQMGETGVAGFTNSLRMLQQKRWDEAAVNLAKSRWYNQTPNRAKRVITTFRTGTWDAYKNLMEMISNNLNWFVGVVEDRMDPLKLGRVRVRVVGLHPPQRAQGDVMGIPTEKLPWMSVIQPITSAAMSGIGGSVTGPVEGTRVYGHFLDKWKTNGIVLGTYGGIVREKPNRLEGFSDPTGQYPRRLGNDTNVLNQGGEVGYDSSSNVIQDSNLDTAINPDDRPLSEIPTDDNPNMSMAEMLRRDEGLRLKVYWDTEGYPTIGIGHLIMKQPVRDMAQINKVLSKQVGREITGNPGSITMEEATTLFERDLADMQRDIKSHSKVGPVWQAVNRSRQMALENMAFQMGVGGVAKFNTMLTAMLAGDWEKAYKAGRDSLWYQQTKGRASRVTMIILTGNLESYGVEVKTPARSLSAMAATVAKSSDPADPPIPNDSRILFKEPVSSYKGEYPYVHTMETESGHIQEFDDTPGQERYRLVHPTGTYEEVSPSGRRTRKTVDNLYDITNADGNFLVAGDKKTNVGGSEIYYNMDNRLHQIDGSNTIFVRGDETKTVEGNGTILVKGNVTIIVEGNADITVKGDATTLVEGNQTNTVNGNLSWKVAGTVDWDVGGDWTEKMASMSSISSGQYTIDGSRIDIGMPPSLRKAVAAAIGGGAIAIASVLITGPSGNDGLEGVSYIPYKDIVGVWTVCHGHTGKDIMLGKTYTKAECKALLNKDLATVARQINPYIKVDIPETTRGALYSFVYNVGAGNFRTSTLLRKINQGDIKGACDQLRRWTYAGGKQWKGLMTRREIEREVCLWGQQMVEINNQRKAFLDMLAWSEGTDNGRQKTRNHGYDVIVGGELFTDYSDHPRKLVTLNPKLKSTGAGRYQLLSRWWDAYRKQLGLKDFSPKSQDAVALQQIKERGALPMIDRGDIRQAIDRCSNIWASLPGAGYGQFEHKADSLIAKFKEAGGTVREIDVMKGKTAAGGGAICAIAVMITIVMGNGNVRTNQAGLELIGNAEGCRRDPYMCPAGVWTDGIGNTHGVTPGVRKTDQQIAADWEKNILIAERCINQHFRGKDMPDNAFSAMTSAAFNMGCNSLRTYYSKARGMRVETSIHKWAQKGEWVNMCNHLPDFVNSNGVPLRGLKIRREKERQLCLTGLVNEMMQISSNGITRLKREEGERLKAYSDSRGIPTIGVGHTGKVDGNSVASGMTITAEKSSELLKEDLQWVEDAISSLVRVPLNQNQYDALCSLIFNIGKSAFAGSTVLRQLNLKNYQAAADAFLLWKKAGKDPDILLPRRRRERALFLSMQISQAGINLIKSFEGLQLKAYKAVPTEKHYTIGYGHYGSDVSPRQVITAKQAEDMLRDDVQAFVDGVNKALKVSVTQNQFDALVSFAYNVGLGAFRSSSLLEYLNEGRTALAAAEFPKWNKSGGKVYQGLINRRAQEQALFNSGTPKNVSRGTSSTKTTPKYKVKSGDNLTKIAKKHNTTVATLLKLNPSIKDPNMIRVGQTINVTGSGGKTHKVKSGDTLSKIAVDNKTTVSRLMSLNPEITNPNHIKVGQTIRLSMKVSQNGLNLIKEFEGCRLTAYKPVPWEQMYTIGWGHYGVTAGTTWTQAQADSQLEIDINNKYAPMVDAYVKGKANQNEFDALVSLAYNCGNVFVADGWAPFSHAYCASMIPKYRNAGGQVLQGLVRRRQAELNLFNKPVSSNSNQNNQTGGMIKMYLIIGLDNSGKAKHWYVSDGVSVRHVRTIRMLENYQNKWAKLNLPVDTMFIAEIEAEFGRKIDMASGEVKMVKKNDLFVDVSSHNGYDITGILEQMGTTNTIIKISESTTYLNPCLSAQVEQSNPIGFYHFARFGGDVAEAEREAQFFLDNVPMQVKYLVLDYEDDPSGDAQANTNACLRFMQMIADAGYKPIYYSYKPFTHDNVDYQQILAQFPNSLWIAGYGLNDGTANFEYFPSMDGIRWWQYSSNPFDKNIVLLDDEEDDKPKTAGTWKQDSKGWWFRRNNGSFPYNKWEKIGGVWYYFDSKGYCLTSEWLKDNEKWYYLKDNGAMATGWVLVGSEWYYMDDSGAMVTGWVKYKNNWYYMTNERGNMVSNEFIKSGKGWYFMNTNGELADNPSFTKEPDGLITVATVQGFDISSYQPSVNFAGAYSAGARFVIIKATEGTSYTNPSFSSQYNGATTATGNYFIRGGYHFAHPGETTGAAQADYFIAHGGGWSGDGITLPGMLDLESEGSNPACWGLSAASMVAWIKAFSDRYHAVTGRYPMLYTNPSWWSSCTGNSNAFVNTNPLVLANRYASAPGTIPGGWPYQTIWQNSDAYAYGGSNNFINGSIDNLKKLATGMKGIDIYSGQGSVDFNAVKESGVEVVYIKATEGLTYTDSTYKDFYDGAKNAGLKIGFYHYLRANDPTSEAEHFFNTISGLSLDCKCAIDVEVTLGQSIDQISSNVRKFADYLINKGLDVCVYTYTNFYKDNLNSTVKDLPLWIAEYGVSKPNIDASYVGFQYSDSGSVNGISGSADLDEFSEGILVGGTVVIDPGQGGDDNIKAIQQDLNILLKRGLEVDGIEGPETEAAIKDFQSIMGLTVDGIWGTNTSGAAQQIFSRPLDGVAYPHYEYATRYIQYRVGASVDGTFGSGTKAKVAAWQSNQGLMADGVVGSATWSKLLDENKLGIDVSQPTSTSSFTCLRNKGFTTMVIVRAWKSTGSFDTNAPQTLKNANAAGFSIENSDVYYYPCISCGNMAGQVRTFWQKVGQYSLKVKRVWFDIEGTWTSSVSTNQNYLMQMMNEARAIGIVHGIYGSKYYWGNLFGSSYKYRYRSSTPLWYPHYDNSPSFSDFSSFGGWTSPSMKQYRGDVSVCSAGVDYNYKPMPAYSSLARRGRRPAVVLLGGLVSASLALTLAPTAAAAPLAPPPGKDVGPGEAYMGVGTRIEQGLGAGPDERTIGPADTSGVQGIDVSHWQGSINWSSVKSAGMSFAYIKATEGTNYKDDRFSANYTNAYNAGIIRGAYHFARPNASSGTAQADYFASNGGGWSRDNRTLPGVLDIEHNPSGAMCYGLSTTQMRTWINDFHARYKARTTRDVVIYTTASWWNTCTGSWNGMAAKSPFWVAHWGVSAPTVPSGFPTWTFWQYSATGRVGGVSGDVDRNKFNGSAARLLALANNTAMTKTYGVDVAVYQPIDLAAYHKAGASFAIVKLTEGVDYVNRRGPSRWTAPGLTTSTLMPTISRSFGSSVSRAKKEAAYFLKEAKKQDISKKRMLWLDWEAGSGNVVTGSKSSNTAAILDFMDAIKAAGWRPGLYSGASLMRTAIDTKQVVKKYGTCLWVASYPTMAAVSTADFGYFRQWTGSPSGSLPVTAWPGRRRERCSGMQLRITSRKKLTSLLCALGLISIVAIYPRQTVNFFYSTAVQITDYIHFYGYRPVKSFAIRIPASYTIHGIDVSRWQERIDWQRVAKMRDNGIRLQFAFIKATEGEKLVDPYFSRNWQLSRENGLLRGAYHYFSPSVSASVQARLFLQTVDFSQGDFPAVLDVEERGKLSAKELRKRVSQWLKMVEKSTGKKPIIYSGAVFYHTNLAGYFNEYPWWVAHYYQRRPDNDGMAWRFWQHSDRGQVDGINGPVDFNVFNGTVEELQAFVDGIKETPMRFIALLISFFALLKVISAISGVDISSASTIESFTCLKSAGYDFAIIRAYESLGQVDPNGPHSVYNARDAGIEYVDVYMFPCPTCGNGAGQAETMVNYLKGYNANYGMVWLDIEGPQYWMSQSENVAFFESLVAGLKAEGAHIGVYTSASQWEPIMGGYTGGSEFPLWYAHYDGNPSFSDFSPFNGWSTPSVKQYDDTGDSCGLGFDLNWYPMHCAPSWKSSDERRTMLDQINTLDPNSLTALKRMSKDNSPAAIKGAAQQFEALFLQNMLKSMRDATVTSDAMGSETTRFYQGLYDQQLAAMMAQRGGIGLADVMEKQMGAQAASAQNAAAAGASSAGNVPLSLDAARAAAAHTASGDKVPTTPQAFVDATWPQAAKAAQSLGVPAHFLVAQAALETGWGKSQIRNKDGTPSYNLFNIKAGSNWTGKVVEARTVEYENGQRKVRVERFRAYDSYEQAFQDYADLVGNSPRYAKVAGKTDGHAFARALQEGGYATDPSYADKLARVINGNALRQRLMASAASARGMINKKWMKIVMIPMLVVPMYGLTSVSGQIQDSLTGENSFVKDAEAATTASQQAFIDKIAPAAQASQEQYHLLSSITLAQAILESGWGKSGLATKGYNLFGIKGKYNGQSVIMSTSEYVNGQWIKIDAEFRKYPSWNESVTDHTLLLVNGTSWNKNLYKKVVDATDYKVAAMELQKAGYASPTYGASLIQVIENYDLAKYDVLYDKILTQKSTSGKATVTSPTGNGVWTLPYKVKGVQSVSPASTYANKDIDLVSVATTKRGTYYQFKYNGKVVGWVDAKALTIYDSVNYDKVNVGRAKITSPVSNGIWSKPYNVYGREFVTNATTYAQQEIKLLREAQTAKGTYYQFSINNKTIGWIDKRALTIYPYDSIVSSKNVSLDGQITNPTGNGIWTKAYKLEGTTSVAQATKYANKDVKISQQVETQHGTYYNISIDGKAIGWLDKNAITLYDQAEYNKTVAFDAAIRNVQGNAVWTEPYRTVGTKLIGPAETYLNKEVEVVREAKTPKGTYYQFKSGGKVIGWLDKKAFEVYDNINYNKAVNLDAVVENVTGNAVWTAPYKSKGVKLVTSAATYKGKATKITREAQTSRGTYYEFSVNGKVIGWLDKKAFDVYDSIEYNKAINMTGLLSNAPGNGIWTEPYRVLDTKNIGQATAYANKTVQLVREAKTSHSTYYQMSLNGKVIGWIDKRAFTNVKMVNTQVKRVKKQKFIAGTALLLGMATFGMVGKADDLSSSNTNGGVDNSKVDNDNQESVKTSTEGVSSTTENANTVPESKVTSTVDSESAPSKTISAGTQSNISGTSDGSDSLPKTETSDSSSKPSTSNSSSKPSTSNSSSKPSTSNSSSNNNSATKPSTTTQAPPVAPSTTAPSATPSTTAPSNYYQNSSYNQTSTAAQIPNSSSDSAASVYSGPVLKKIEAAKPIEKIDSSSTEAFIKSIADRVRILAGKNNLYASIILAQAILESGSGQSNMTQQYFNIFNITGAYLGKSISFKTEEFSGNNPYYIEQSFRVYSNYDQALDDYINLMIKGTTWNSEIYAGAWKSHAKTYQEAAQALQGIFATDPEYAQKLIEIIEEYNLNFYDNVDSTTQVLDSNIPESPLVASKLDSSTYPDYNGVEYPGADSYAFGNCTQYVYNRIIQLGGQIGTHMGNGGEWGINAQAQGYFTTTVPTEGYAVSFPPGVAGSSPEYGHVAFVEKVYPDNSILVSEMNVKGNNIVSERHISAGVAALATYIQPKMNRNRLSCLIVGAVIGAGAIVCTTNTKVHAKPVNEVKNINTSKGNSFGEIISSEDIGLRKGADSSHEIITSIPSGARVNIIDKMSKDWYKVSYKDFTGYLQAKDIRVLGDELNQDNVGLISANQLNVRTSPNENGQVIGTLHKNDKVNVLDKSIDGWYKIDFNGRRAYVSSKYVNLISYKNNEVKTEVKKEPIEGTGKVNINTALNVRQASTTNSRIIGSLKGGEKVNIISESNGFYKIEFNNSYGYVYSKYISKDGDSEKVQVVKQEEVKKEKVDESKKEAKATPKAEPVVLAVRSLNKTGIVNVSSSLNVREGAGTSSKVIGSLSGNTKVTIVGEEGAFYKIEYKGSHGYVAKEYVKDVTESSNSNQGTQTPEKPSTPESTEKTGIVNVSSSLNVREGASTSSKVIGSLSGNTKVIIVGEEGAFYKIEYKGSHGYVAKEYIKDVTESNNSNQGTQTPEKPSTPESTEKTGIVNVSSSLNVREGASTSSKVIGSLSGNTKVTIVGEEGAFYKIEYKGSHGYVAKEYIKDIKDEVVTEPEKPSAPENTEKTGVVNVSSSLNVREGASTSSKVIGSLSGNTKVIIVGEEGAFYKIEYKGSHGYVAKEYIKDVTESNNSNQGTQTPEKPSTPESTEKTGIVNVSSSLNVREGASTSSKVIGSLSGNTKVTIVGEEGAFYKIEYKGSHGYVAKEYVKDVTESNNSNQGTQTPEKPSTPESAEKTGVVNVSSSLNVREGASTSSKVIGSLSGNTKITIVGEEGAFYKIEYKGSHGYVAKEYIKDIKDEVVTEPEKPSTHENSKKTGVVTASKGLNVRKEANTSSQIIGILNSGESVEIIGEENGFYKITYKGQEAYASKNYINIFDGNSNVNPGLDIGNASKTNYGVSLNEYIKLQQRNNPSNYSYSEFEKYINPAKATNKLQFLRIDKFRSVNVSGLSSRLSNKGVLTGQGQAFVNAAKAFNIDPIYLVAQCLHETGNGTSKLAKGVTITEIADESKPIYNGNGQLVGYHMIKLSKPVTVYNLFGIGAKDNSSVFPNRALILGTTYAYNRGWTSIENAIKGAAEFVSLNYVHSSRYSQNTLYKMRYNQNVSNIWHQYATTPWYASSIADIMRSYQDLYLENNFTFDVPVFAGMKKESMSRIERRKAQQRKKTPVQWKKSTTLFSSALIVSSVGTPVALLPVTAEATEEQPTNAEVAQAPTTETGLVETPTTETTPGTTEQPTTDSSTTTESTTESSKETPTTPSTEQPTADSTTPVESGTTDSSVAEITPVAPSATESEAAPAVTPDDEVKVPEARVASAQTFSALSPTQSPSEFIAELARCAQPIAQANDLYASVMMAQAIVESGWGASTLSKAPNYNLFGIKGSYNGQSVYMDTWEYLNGKWLVKKEPFRKYPSYMESFQDNAHVLKTTSFQAGVYYYAGAWKSNTSSYRDATAWLTGRYATDPSYNAKLNNVITAYNLTQYDTPSSGGNTGGGTVNPGTGGSNNQSGTNTYYTVKSGDTLNKIAAQYGVSVANLRSWNGISGDLIFVGQKLIVKKGASGNTGGSGSGGSNNNQSGTNTYYTVKSGDTLNKIAAQYGVSVANLRSWNGISGDLIFVGQKLIVKKGASGNTGGSNNGGSNNNQSGTNTYYTIKSGDTLNKIAAQYGVSVANLRSWNGISGDLIFAGQKIIVKKGTSGNTGGSSNGGSNNNQSGTNTYYTIKSGDTLNKISAQFGVSVANLQAWNNISGSLIFAGQKIIVKKGANSGSTNTNKPTNNGGGATTSYTIKSGDTLNKISAQFGVSVANLRSWNGIKGDLIFAGQTIIVKKGASAGGNASSTNSASGKRHTVKSGDSLWGLSMQYGISIQKIKQLNGLSGDTIYIGQTLKVGMKKRLIAPMLLSAASLAFFAMSGSAQAAAYTDYSLYKVEPSNTFSTESQASQAVAKLEKDTGWDASYQASGTTTTYQISASGIHSESEAKAILSGLAKQTSITGTSSPVGSKQPYVTISSGAISGEKQANTILAKLKQETGVAGAVKAYGAAQPYMNVMTSDIADETKVKALIQSLAKQTGIKSSYQPITHTVSVTTIQSGTIVGDSRAAQIKNAFQKESGLQASLKETVKGQAYYTFTTAAISGEANAKTLLQQLKQSTGITGSYKSINQKTTVESYNVQSAYFKGLSTVKDAISQIKKNTGVSGSYQQVGKSTSYTVNMKGITKQQLQKIDTFFKKKKWHYTSSSVKKTTTSAAYQITTAKILGEQQANKAAAFFAQKKVKAAKTAAGSTAENQYQLISEETSDQAKVTKGLNILKKNQLSASAKSVKKQIADTFKITTESLLDQTKVNQALTFFKSNHISVASQKTGQTAASSYQITTEAIISQEEIDRVLTFFKQNHIAVTTSKTGQTAYTQYKIVTTQLSSKTALNNGLTYLKSKSVTPSYTTKSNTLYKISVNEQFTGNDTAAAASTKLKQLYGWTSSIVKIKNGPQIMKTNYNLSLRDMVQKQMTVSPQTDGAAYVSLTYINTATSTVTADVLNIRSTPEVSPTNVIGQFKKGDKVKVIGQINGWAKINLGWRNASSDEVVQYVDPNNFSRDSKYYFQFLKLSQTAGLSVTEVNQKVLAGKGILTGRAKAFIDAANQYSINELYLISHALLETGNGTSALANGLTYNGKTVYNMYGIGAYDSNPNYYGAKYAYEQGWFTPEAAIIGGAKFIGSSYIHNTAYNQDTLYKMRWSATATHQYATDIGWAYKQVNRMYSLYSLLDGYTLYFDVPEYRMARKKLKKRKLLISLFFLVSIPLALFVLATTLSKPIEISKETEEIDEQQVFIDSLSGHAQILYEKYHVLPSITIAQAILESDWGNSELAAKANNLFGVKGNYKGHHVTMETDEVEKGKRKTIRAKFRKYSTFFESMDDHAQLFVRGTSWNKKKYKPVLEAGNYKEAATALQTSGYATDPDYADKISAIVEKYDLDEYDEVNPSLKSVDLNASIKDSAVQDVWSKPSTDDRSIRLTSAQSYVGKDIKVVSKKQKGQSVWYQFQINDKLIGWIDDSAVEIKEATMARKLIKNLGKSKSVKRVKLLFKKIFITVFIVASIVAIFNITKYFEELYKVRDLKSTKIEYYMDVADEAGDGKVQLSWKALLAIDMVIHDEDLSNIKKKDTLDIGEKFIVEDKNDKGEKVYKVKKFNKVLSELKFDSSQKSRARKYMKDLEYTYLGNKQLDSSDEKIKFIKKLEDSAIREYIDYGILPSITIGQAILESGWGNSKLTKQSNNLFGIKADKAWKGKSVEISTSEHYNEKIVASFRSYNSLQDSVKDHSLFLINNKRYRKHGLFEAKDYISQAQALENAGYSTAEDKKGNRIYAELLIDVIRSYNLQLIDNKVETKMFFLTLPLLLGCTAATTPLTAATPPVDPLPLKVVSTDQLPKGLAKDQQLWNKVNGQKGDYKALLTAIDHSLEYLGTDKAQKDYQDYKVPGITRDRVSRSLRRFRQLVVQAKSPQALETAVKKEFQFYQSIGNDQKGNVDFTGYYEATYPASRQPTTEFRYPLYQAPADLKAWPKPHPTRAELEGADGLQASQGPLKGLELVWLRDRIQAFLVQVQGSARLGLTDGTEMTVGYAGKTAHPYTSIGKALIADGKFTLEELSLPVVLQYFEENPQDLDLYIPKNKSFVFFQETFGSPPMGNLNVPVTDERSIATDKSLMPPGALALIQTNLPYYNASQTLEFKDVSRFVLDHDTGSAIKGPGRVDIFMGTGAKAKERAGVMTGSGQLYYLLLKDNMNTPFSIDEVSFRDLPGWGQDDPRKLFPAMATILSHLRNAKPYRTGALGITAAELVSLLELAERGQVNSPEQARQFFETNSVPFRISPAQGKSGFVTAFYEPELEVSATPDDVWRYPIYRRPPELVDIDNDNRPDGFDPSYAFGKADEEGISYFPDRRAIDEGCLRGRGLEIAWARSKVDLFFVHVQGAARLVFPDGAIKRITYAAKAGHVFSPIGRLLLDRGELDPKTISMQTIRQWLADHPDEVDGVLWHNRSYIFFREADVAGLDMGPIAAAKVPLVAGRALAVDRLIHTFGLPFFIHAPTLTHLDDGKPFARLMLALDTGSAIVGPARGDIFTGSGFEAGELAGTVRNEADFYILLPRIAAERYRRMRKIQVAVFLFVGLLAACSTVPPSSAPTTCAQCQPCPACPAVTPAITPAPAPAFSRSLLPASWGDLPGWAEDDVTAAWPAFMQSCRGIASRGNAAGWRRVCELARAADGKPENDVRRFFERHLKPYAIVNGDGLVSGLVTGYYEPMLRGSRTKAKGYEQPVRGVPDDLLTIDLSAVFPELKDKRVRGRLEGNKVVPYWSRAEIAARGDKLPGKTLLYVDDAVELFFLQVQGSGRVKLADGGMVRLNYADQNGYQYQSIGKALVERGELKLEEASMQGIQAWARANPARLESLLNTNPSYVFFREVANSADGPVGALGVPLTAERSIAIDPRSVPLGSPVFLATTRPNSAVPLNRLVMAQDTGGAIKGGVRADFFWGFGKEAGDQAGRMKQSGRMWILLPTELAPKMKGRWVKYLLMGTVVAMLAACSSKPTDRGQQYKDGKFTQPFSLVNQPDAVGAPINAGDFAEQINHIRNSSPRLYGNQSNVYNAVQEWLRAGGDTRNMRQFGIDAWQMEGADNYGNVQFTGYYTPVIQARHTRQGEFQYPIYRMPPKRGRLPSRAEIYAGALSDKYILAYSNSLMDNFIMDVQGSGYIDFGDGSPLNFFSYAGKNGHAYRSIGKVLIDRGEVKKEDMSMQAIRHWGETHSEAEVRELLEQNPSFVFFKPQSFAPVKGASAVPLVGRASVASDRSIIPPGTTLLAEVPLLDNNGKFNGQYELRLMVALDVGGAIKGQHFDIYQGIGPEAGHRAGWYNHYGRVWVLKTAPGAGNVFSGMKKYLFRAALCGIAAAILAACQSKSIQTFPQPDTSVINGPDRPVGIPDPAGTTVGGGGAVYTVVPHLSLPHWAAQDFAKSLQSFRLGCANLKNRQGWQDVCAQAFQTPVHSVQAKQFFERYFTPWQVAGNGSLAGTVTGYYEPVLKGDDRRTAQARFPIYGIPDDFISVPLPAGLRSGKALVRIRQTGKNSGTIDNTGGTHTADLSQFPITARTTAIKGRFEGSRFLPYHTRNQINGGALDGKAPILGYAEDPVELFFMHIQGSGRLKTPSGKYIRIGYADKNEHPYVSIGRYMADKGYLKLGQTSMQGIKAYMQQNPQRLAEVLGQNPSYIFFRELTGSSNDGPVGALGTPLMGEYAGAVDRHYITLGAPLFVATAHPVTRKALNRLIMAQDTGSAIKGAVRVDYFWGYGDEAGELAGKQKTTGYVWQLLPNGMKPEYRPMKFPFHPWRRLLLCALPFAALLTACDDGKKEPPPTPAEVTTYNSVPWDALPATSDADLLAGFNAWRSACARLAKDPVWGEPCASATTVAADPTAVRAFLQERMQVYSLRSSSNGDQGLITGYYEPVYHGSLSQGEKTPVPVYGVPDDLVVVALESVYPELKGKRLRGRLEGRVLKPYDDAATIRDNGSSAPVLAWLGDPMDLQFLQIQGSGRIQLEDGRQLRIGYGDQNGHPYKPVGRWLVEQGLVPKEEISMKRIRDWAEANPQRVSELLASNPSFVFFSLRPDSDEGPRGSLNVPLTDGYSVAIDRKVIPLGSLMWLSTTRPDDGSAVVRPVAAQDTGGAIVGEVRADLFWGTGDAAGELAGHMKQPGRLWLLWPKGAPLPASMGAMNGTSGRRLSTATRVAAMAGVLLLAACGGPSSRPGLVSRPAGVAGPVSYQRVAIEGLPGWSTDRVADALPVFRRSCERLRAVSPNSMVGPSVWGSRASDWQAACAVAARLPAFDDDAARRFFAERFQAWQVTGAGDPTGLFTGYYEAALDGSLSPSAVYSTPIYGVPLDLRMEGGKGMRVSGGRSLPYPDRAAIEEGAISGVAPVIMWARDPVDVFMLHIQGSGQVRLPDGRIQRIGYAANNGHPFVGIGAIMRDRGLGDGSSMIAIRAWLRANPAEGRALMRENPRFIFFRPIEGEGPIGAQGLPLTGGRSLAVDPSSVPLGAPVWLATSDAHGETVNRLMVAQDTGSAIKGAVRGDFFWGSGEEALYHAGGMKSAGRYWVLVPRGGRNAVAQNMKGRWAKYVATGVMLAMLAACSSKPTDRGQQYKDGKFTQPFSLVNQPDAVGAPINAGDFAEQVNQIRSASPRLYTNQSNVYNAVQNWLRSGGDTRTMRQFGIDAWQMEGTDNYGNVQFTGYYTPVVQARHTRQGAFQYPIYSMPPKRGRLPSRAQIYAGALSDKYILAWSNSLMDNFIMDVQGSGYIDFGDGSPLNFFSYAGKNGWPYRSIGKVLIDRGEVKKEDMSMQAIREWGEKHSEAEVRELLEQNPSFVFFKPQSFAPVKGASAVPLIGRASVASDRSIIPPGTTLLAEVPLLDNNGKFSGQYELRLMVALDVGGAIKGQHFDIYQGIGPDAGHRAGWYNHYGRVWVLKSAPGAGNVFSGMFKRRYVTLLPLFVLLAACSSKPKPTETDTTTGTPSGGFLLEPQHNVMQMGGDFANNPNAQQFIDKMVNKHGFDRQQLQEILSQAKRLDSVLRLMDNQAPTTSVKPPSGPNGAWLRYRKKFITPDNVQNGVVFWNQYEDALNRAWQVYGVPPEIIVGIIGVETRWGRVMGKTRILDALATLSFNYPRRAEYFSGELETFLLMARDEQDDPLNLKGSFAGAMGYGQFMPSSYKQYAVDFSGDGHINLWDPVDAIGSVANYFKAHGWVKGDQVAVMANGQAPGLPNGFKTKYSISQLAAAGLTPQQPLGNHQQASLLRLDVGTGYQYWYGLPNFYTITRYNHSTHYAMAVWQLGQAVALARVQMFALTAYRLRCAAWLLATGIFLLLAGCSEAKAPTALERVQKEGVLRVITRNSPATYFQDRNGETGFEYELAKRFAERLGVELKIETADNLDDLYAQLSREGGPALAAAGLTPGREDDASVRYSHTYLDVTPQIIYRNGQQRPTRPEDLVGKRIMVLKGSSHAEQLAELKKQYPELKYEESDAVEVVDLLRMVDVGDIDLTLVDSNELAMNQVYFPNVRVAFDFGEARGLAWALPGGDDDSLMNEVNAFLDQAKKEGLLQRLKDRYYGHVDVLGYVGAYTFAQHLQQRLPRYESHFKQSGKQLDTDWRLLAAIGYQESLWQPGATSKTGVRGLMMLTNRTAQAMGVSNRLDPKQSIQGGSKYFVQIRSELPESIKEPDRSWFALAAYNIGGAHLEDARKMAEKEGLNPNKWLDVKKMLPRLAQKQWYAKTRYGYARGGETVHFVQNVRRYYDILTWVTQPQMEGSQIAESGLHLPGVNKTRPEEDSGDEKLMIGADTAKECDAMTFKLLPLAVLCAALVGCQSAQSRDARAESPATAESAAPTAEAPVSEAQEADFETWLANFRRQARGEGIDEATLARALDGLRYRPRVIELDGSQPEFVRPIWEYLDSAVSASRVKKGRERLAEYRDTVRQMTERYGVPGEVLVAIWGIESSYGDYLGDFSTLEALATLAYDGRRRDFARGELLAALRIIEAGDISPERMKGSWAGAMGHTQFIPSSFLAHAVDGDGDGRRDIWNSIADVLASTANYLDEAGWREGEPWGTEVSLPQGFDYTLTEPDIRRSSAEWAAAGVRSRDGHALPDFASASVIAPAGAQGPVFLVGHNFRVILRYNNATSYALAVATLSDAIAGRAGIQGEWPREQPALKRSEVREMQQLLDARGFDVGTPDGILGPNTRRGLRAFQREIGVTPDGFATKALLERLRRMPGLPRARMAQWHPLYSVRLAKDTMTDTQRSLRRPLLGAALSAAALGLCGLSPSLLAAGKRRVSLREEEIEPGRYRDNPQARAFIDEMVARHGFDRGMLQDWFGQAVYSATVVRLIMPPATTGRKSWRTYRSRFIEPIRINAGVRFWQDNRDTLRRAEAEFGVPASVIVGIIGVETIYGRDMGSFRVLDSLSTLAFDYPATPNREARSTLFRNQLADYLLWCRDTRTDVYSVLGSYAGAIGIPQFMPTSLREYALDYDNNGHIDLRNSPTDAIGSVARFLQLHGWEPGRPVVWRIAPDDGSLGVATAAADGEPWPTRTLNQLTRAGLRVDEPINLAREGETGVLVVDLPTPDQPTEYLLGLRNFYVLTRYNRSFFYALAVYQLGEAVKAAMGMFGILNRREMLRGTAATLLLPGILTSAHAGQVAEDPLLRYPWLAQWAGADGLDAPWLRGVFQNLKKYPRVIRAMNHQAEAKPFYLYREHVTSPWLYKKGREAWQQHRAMLEAAGARYGVDAPFVLALWGMESRFGRNQGEHPVLRTLFTLAVDYPRRQTFFRQELRHFLILCRQQGWDPMLLKGSYAGAMGHVQMIPSSLRYYAVDGDGDGRLDVFNNPMDATASIAHYLGKHGWELGGPYLIPVYGITDLSAIKSAKVKEMQPWSSWYALGVRTRGEPPPAERAMALIALEEQDGLRYYGVFNNFRVILDWNRSTRFAKVVGELAEGFVLMPTPATRASLIGLALASGLLAGPARADFQSCLAGIQAQAAGAGVSAQTFRAATANIAYDDKVIELSQAQPEFKTPIWDYMSALVDEERVEDGRAAMRQHAQALANAEARYGVDRHTIAAVWGVESNFGKNLGKMPLVQSLATLACSSNRRRDFFRSELIATLKIIERGDIEASRLTGSWAGAFGQTQFMPTTYQRLAVDGDGDGRRDVVDSVADAVASTANFLRVAKWSNGQPWGYEVRLPRGFNVAAAGRKNKHAVGHWASLGVTRVDGKALTGDGPAGIIAPAGINGPAFLVTKNFDAIYSYNAAESYGLAIAVLSDRLRGRPGVQADWPTDDPPLSRAERRDLQTRLTARGYDVGEPDGKVGSKTREAIKEIERQLGMPATGRPGGKVLEALRRGMFKYSFIAVIVSTVLLSACADSHQKSAEKKPVTSEIANIATSAPARWKQIDVVSLEQAFPKQSRTPAQFPAYVDALKQKAAELGYKPETINFAFSEIHFIDRVVKSDRNQPEKKITLDVYLPRVVTKGRIAEGAKLYQANQQTLAQISNQYGVPANYIVALWGLESGFGRVQGKEDVISALATLAFEGRREALFSRQLMAALEIIENGHLPVGQRLKGSWAGAMGQTQFMPSSFLTYAADGNGDGNIDIWNSREDAFASAANYLATEGWQRDLPWGEQVSLPANFNQQLEGIKTEQQKTVAQWKALGVQLPANSQLSDDMKVWLIIPDDDLHRSYLVTQNFRTIMHWNSSYFFALSIVTMADGVANKINTLPTQHMKKESRPAFDAAAVFDAAAVPVSDSGFAANANVRRFVDDEVGKGDFSRAEWQDFFDKAAYKADIVKIMHRPSTSRPWYVFRTGNSGKAKFRGARRFYAENRALIDDVAQKYGVPAELIVAVIGIETNYGKNTGSFRVADALATLGFDYPRRAGFFQKELVELLKLAKEEGGDVFAFKGSYAGAMGMPQFMPSSYRKWAVDYDGDGHRDIWGNIGDVAASVANYMKQHGWRTGGKILVSATLAPGADVQAIIGEKTALTRTVADLKAYGIIPGEELADDEKAVLFKLETAPGVFEYYLGLNNFYTVWQYNHSRMYVTAVRDIANSLGGSGLMASSSSSKQAKPIHRMAWRLGVSLTLLLGLGALFVLPKFDPKSLTWPTTEPGRIAPLAMSGGNPYLRALMRTISASESNDASPYTVLYGGSHIENLQEHPDRCIPIRWGPNQGLCTTAAGRYQFITTTWLETAEKYHPAPTGEWMWRRYSFAPEYQDRVVYAWLDDVNYWGTDIPQLLEDGQLQTVLKRLSGTWTSLGYGIESNKVTPHLMHIYERMLAEEIALANGLPTNYLPTVANQSVETTRMIIQHSQPKRKGTKYRLKKPYKLVFNLIIVVGLIGLVYSFKKNTQPLVNPSLVTHLPELEMSGGDPYIRALMLTISASESNHKNSYYLLYGGSHVHNLQQHPDQCIPINIGPNRGNCSTAAGRYQFLNSTWQEKARKYHPNPQKNYRQYIYSFEPKYQDIVVYRWLKDHHQWNVDLLTLLKQDQVEEVLRKLSNVWTSLGGGIEDNSMTPHLPSIYRYFLAQELNRENADQNSLMVEINNQRKAFLDMLAWSEGTDNGRQKTRNHGYDVIVGGELFTDYSDHPRKLVTLNPKLKSTAAGRYQLLSRWWDAYRKQLGLKDFSPKSQDAVALQQIKERGALPMIDRGDIRQAIDRCSNIWASLPGAGYGQFEHKADSLIVKFKEAGGTVREIEVMGYTWKGLAKQYGFTDFSPATQDKAAVALILAKKGAMEAILNGDYEQAVMKLGGIWASFPTAPNEYRQHKRSWGFVHNFFRQRGFMARISAADAGGVNVIAFLDMLAWSEGTSTIKASDYGYDVLVGGKLFSEYSKHPRVKVWLPKYSIYSSAAGRYQFLAGTWDAIVKNYGFKGRFIPEAQDLAAIKLLTECGALPLIKAGRIVEAIAKAAPIWASLPGAGYGQREHKLAALLGIYEAERAAEAKPQDQLLAMFSACGGEMAAMTRYEFALLALAAVGYVVWRDWQRSEEPGAQSPDFIDQAENLFYDATEGNFFGGTEDTDMGQAQLNRAAFLLTIRTGEGTAGNDGYRMLFGGGKFDSFADHPRQVVTALSNGKPISSSAAGAYQFLRRTWDTLAARLGLTDFSPASQDAAALELIREAGALGDVDAGRFALAVRKVRKIWASMPGAGYGQPEVALERLQAAYQAAGGVVNGMPVINTHQNIAAFLDMLAYSEGTANHPLTKNRGYDVIVTSLDGRPEIFTDYSDHPFAHGRPAKVFNRRGEKSTASGRYQQLYMFWPHYKKQLALPDFSPLSQDKLAIQLIRERGAIDDIRAGRIERAVSRCRNIWASLPGAGYGQREHSLEKLVTVWRTAGGVVAMYSQQVQQINQPQKNSDIQLINMWLQQIHPIQQNSHLYIAQMFLKFIKKPLKKVTSADVIAFANVYGVRSHNSHSNQQKRIETINSLLKFGQEAGILPRNQKKTFSPNTTNFKTSVYSQNKIKNYRTTGKQQKKPLNWSQLFNLQLASSVLIVFILLMAILQLFRQVSGSTNANQNKSVTSVVMPKIDPTKNWAYPVNVPRIRAFLDTIAVTEGTTGPKGYYRQYTGSHFLSFEDHPRELKCANSNGKKLCSDAAGRYQFLSTSWDRFAPVVKAQNFSPTYQDRVAIELIRDKNALKDIEEGRVKEAFQKLYMVWPSFGETETDVEQLMPKLVGTYEQKLALYQIKNMDDEFERAFKKILDYEGGYSDEQKDHGGKTKYGITEKLARDYGHEGEMKDLELEKAKEIYYREFWANHLYSWIEDERIATEVFEQAVNMGAKTANKHLQKAYNLLADKEIAVDGIIGQRTLEAVNNFEHNSDLFKLLNILQAKKYINIVKNDASQQKFIRGWLRRVELDIDSRKSMKRNFQTVMPYIFSEEGGYADNPADPGGATNMGITINTLSAWEGRQVSPQDVKELTQATATQIYQVEFWNKIDGNDLPSGVDYALFDFAVNSGPGRAAKTLQKILAMPEDGIIGAQTVAAAAARSPEGIINALCDARAAWLRGLSTAATFGNGWLARVERVRARALALAATPPAITQPADPAGNPSPKARQADIAFTSALKHPEALGTMGSVASGLAAIATGNGPVQYALAIVMVACAGVGLWYFVRRVRSEPMNFDQAFDRLLGHEGGYSNNSADPGGETMWGVTARVARADGYLGEMRDLPRDRAKSIYRRLYWTPVRADELPEVVRFDVFDGAVNSGPAQSIKWLQRAAGAVDDGILGPRTMAAAVAAGPVLAARYNGHRLLFLADRPTWGSFGKGWARRVGKNLLGAMDQPPWLQAAWAEFGVREIPGKEDAPEILRYFRDAGDTNVETEATPWCAAFLGAMLKRAGYAGTGSLLARSYLDWGDRLDDARFGAVAVLSRGDDPNAGHVGFLLSDTNGKLYLLGGNQGDAVTVASFDKARLLGLRWPKENVEAASKGDDAIFSRVLAHVLEMEGGFSNDPYDPGGPTNRGITLEVYAKFRKETLDDGTRARLIAELKRIPDAIVTAIYRQRYFDPASCPVFTAPLALMHFDAAVNHGVGAAIRMLQGVAGVTVDGEIGPETLAAIGAKSLADLLDDYAETRRARYRALPHFWRFGRGWLKRVDATLALARTWAAAEATNRGLIEPQQIAKGEGKMGEKSKTEISSSDDSKWWLNSKTMWGTLITAAATVIPVLGPAVGIVLPADLITSFGDQVVTAAQALAGLFGTALAIYGRLKADTPLVLRKNMSAPLTFQQVFDRVVGHEGGYVNDPHDPGGETNWGITKYTARENGYTGSMKAMTREQAYKIYEKAFWQRYHCEKLPEAVAFQFFDAAVNHGVGNASRMLQRAVNVADDGIIGKVTLSAVEKMPISDLLLRFNAERIRFYTKLKNFPRYGKGWMNRIAGNLAYAAIDNEVMNPIIDGIIALEGGYVFNPKDKGGATHWGITEATARAHGYAGDMRDLTHAEAYAILEEDYWIKPGFDVISTLSWPVSFELCDAAVNIGAYHPSAWLQRWLNVFNHEGKRYPDIHVDGNIGPRTLAALEHYLAWRGQEGEAVLVKALNCSQGTYYLNVAEKNHNNEQFIYGWIKNRVTMDSFEDAFKALIGNEGGYSFNPADPGGETMWGVTARVARSEGYNGAMKDLPLETAHQIAKRRYWDPLHLDELDPRVAFQIFDANYNGGLVVLWMQKASGAKEDGKFGPDTLDAVKNADPMKFVMRFAAYRLRYLRNLHSWPSFSRGWTERMAANLLLGAAMSQTATLSDFNKAFDRVIQHEGGYVNDPRDAGGETKFGITIHTARANGYTGSMFTMTRDDAKQIYLKAFWQRYRCNEFPPELAFQFFDACVNHGSGNASRMLQRAVGVVDDGIIGEITLAAIRKRSTVEVVTLFNAERLEFYTKLSGFQHFGKGWIRRMAGNLRHIADDVGDK',
 'target_names': [18, 19, 22, 23, 24, 25, 73, 102, 103, 104, 108],
 'targets': array([ 0,  0,  0,  0,  0,  0,  0,  0,  1,  1,  1,  1,  1,  1,  1,  1,  2,
         2,  2,  2,  2,  2,  2,  2,  3,  3,  3,  3,  3,  3,  3,  3,  4,  4,
         4,  4,  4,  4,  4,  4,  5,  5,  5,  5,  5,  5,  5,  5,  6,  6,  6,
         6,  6,  6,  6,  6,  7,  7,  7,  7,  7,  7,  7,  7,  8,  8,  8,  8,
         8,  8,  8,  8,  9,  9,  9,  9,  9,  9,  9,  9, 10, 10, 10, 10, 10,
        10, 10, 10])}

In [ ]:
data=bio.sequences_to_vectors(sequence_data,chunksize=5)

In [ ]:
summary(data)

here'a a little sanity check...


In [ ]:
print("original sequence:")
print("\t",sequence_data.data[0])

print("the first few chunks:")
for vector in data.vectors[:10]:
    print("\t",bio.vector_to_sequence(vector,data.letters))

you only need to save to csv if you feel like looking at the vectors in Excel - usually you don't need to do this


In [ ]:
save_csv('small sequence dataset.csv',data)

Separate files for train and test, rather than split one file


In [ ]:
sequence_data_train=bio.load_sequences('data/small sequence dataset.xlsx')
sequence_data_test=bio.load_sequences('data/another small sequence dataset.xlsx')

In [ ]:
data_train,data_test=bio.sequences_to_vectors(sequence_data_train,sequence_data_test,chunksize=5)

All of the typical classifying stuff below here....