diff --git a/motif1.txt b/motif1.txt new file mode 100644 index 0000000..fc9936a --- /dev/null +++ b/motif1.txt @@ -0,0 +1,11 @@ +MSLKPFTYPFPETRFLHSGSSVYKFKIRYGDSIRGEDIENKEVIVQELEDSIRVVLGNLDSLQPFATEHFVVFPYKSKWERVSHLKFKHGEIVLIPYPFVLTLYVAKKPRVZEDELKWFNENLSTGKPIDDSPLGLVPAERKAARAMKKKRKRMELSVSPSRPGLDRAKMRTSSQGPSKKKFLMETSRNMERNTQQKCQETPAFDGTDVQEQGSRWEDNLAGEITPPVQQSNPPPPAGPTDLGTSGFFGF +MSLKPFTYPFPETRFLHAGPNVYKFKIRYGNNIRGEEIEDKEVIVQELEDSIRVVLGNLDSLQPFATEHFIIFPYKSKWESISHLKFKHGEIVLVPYPFVFTLYVAKKPRVZEDEMKWFHESLSAGKPIKDSPLGLVLTERKAAGAMMRKRKQVEVLSSPSRPGLDRAKIGISSQSPSKKKPLMETRRNREGKTHQEWQETPAFNITDVQEQDSKSEDSPAGQIIPPLQQNNPLPPKGPTELATGGFFGF +MSLKPFTYPFPETRFLHAGPNVYKFKIRYGNSIRGEEIQDKEVIVQELEDSIRVVLGNLDNLQPFATEHFVVFPYKSRWERVAHLKFKHGEIVLVPYPFVFTLYVAKKPRVZEDEMKWIHEDLSPGKPVNDCPLGLVLPERTAAGAMLRKRKRGQVPSSPGRPGLDRTGKEKPSRNGRRLQRLISPMSRTRVGSGNREGCQGRLSHQCRRTIHLHLKDPQSWEPVASLGF +MSLKPFTYPFPETRFLHAGPSVYKFKIRYGHSVRAEEITDKEVIIQELEDSIRAVLGNLDNLQPFITEHFIVFPYKSKWERVSHLKFKHEEVVLIPYPFVFTLYVAKKPRVZEDEMKWFHENLPPGKPINDSPLGSAVAEKKAAGDAGKKRKLVEEHGSPRGTALPRSVAEGKAESQSTEATLKKDQNRKKTQQETWKTVTSDTTDVQTQDSKRGHNLPGAMVPALQQSSSPPPQEPGTRSFFGF +MSLKPFTYPFPETRFLHAGPNVYKFKIRYGNNIRGEEIEDKEVIVQELEDSIRVVLGNLDSLQPFATEHFIIFPYKSKWESISHLKFKHGEIVLVPYPFVFTLYVAKKPRVZEDEMKWFHESLSAGKPIKDSPLGLVLTERKAAGAMMRKRKQVEVLSSPSRPGLDRTGKEKPIRNGKRPQHLISLMSRNRILSQRTAQQGRSFPHCSKTIHFHLKDPQSWQLVASLGF +MSLKPFTYPFPETRFLHAGPNVYKFKIRYGNSIRGEEIENKEVIIQELEDSIRVVLGNLDNLQPFATEHFIVFPYKSKWERVSHLKFKHGEIILIPYPFVFTLYVAKKPRVZEDEMKWFHENLSPGKPISDSPLGLVPAEKKAVGAVMRKRKHMDEPSSPSRPGLDRTGKEKPNKDCRRLWPLISLVSRNKILSGGTACQGQLSHPCSTTHLHLRSEQPAASLGF +MSLKPFTYPFPETRFLHAGPSVYKFKIRYGHSIRTVATLLKSFQIYLFQDSIRAVLENLDNLQPFVTEHFIVFPYKSKWERVSHLKFKHEDVVLIPYPFVFTLYVAKKPRVZEDEMKWFHENLSPGRPINDSPLGLVVVEKKAAGASKKQKRKLVEQHSSPGGARQPRDKMRSSSQRPSTKKPPMGTRRNRERKPQQERQKTVASDTTDVQEQHSKWGHNLPGAIVPPLQQNNSPPPKELGIRSFFGF +MSLKPFTYPFPETRFLHAGPNVYKFKIRYGNSIRGEEIEDKEVIVQELEDSIRAVLANMDSLQPFVTEHFIVFPYKSKWERVSHLKFKHGESILTPYPFVFTLYIAKKPRVZEDEMKWFAEDLPSGKPADDIPLELVLAETEAEEATMRKWKRKLMEEPSSPSRQGPHRAKMETSSEASSNKKPLKESKRSTDEEAQQEYQDTPASNAIAVKEQDAALGHGLQGLVVPPLQHSSPPPPKEPGARGFLGF +MSLKAFTYPLPETRFLHAGSSVYKFKIRYGSSVRGEEIEDKKIVSQELEDSIRAVLGNLDNLQPFTTDHFVIFPYKSKWERVSHLRFKHGAALLEPYPFVCTLYVAKKPRVZEDEMKWAPAGGNGGPTNSAPLHLHKTQKEQDRPGTETSRKKEPPAPPSRGGERRTSLEQSWKELADSPELLLQLTRNWTGESASEKGEAEDSDISFLKDHGSGSSLRHQQKSPPKPSSPPSEGPPKQKHAGFLGF +MSLKPFTYPFPETRFLHAGPNVYKFKIRYGNSIRGEEVENKEVIVRELEDSIRVVLGNLDNLQPFTTEHFIIFPYKSKWERVSHLKFKHGEVVLVPYPFVFTLYVAKKPRVZEDEMKWFHENLSPGKLINDSPLGLVSAEKKSAEAMMRKRRHTEVPSSPRKSGRFFPHLRAKVETSSEAPSKKKPPMETRRTWNDNEQQETPAFDATDVQEQGPKWGDSLAGQMAPSLQWNNPPPPKGPKELGTTGFFGF +MSLKPFTYPFPETRFLHAGPNVYKFKIRYGNSIRGEEVENKEVIVQELEDSIRAVLGNLDNLQPFATEHFIVFPYKSKWERVSHLKFKHGEAVLVPYPFVFTLYVAKKPRVZEDEMKCFHENLSPGKSMNSSPLGLVLAERKTAEAVLKKRKRGEVPSSPARPGLDRAEMGTSSQGLSKKKPPMETRRNRERKTQQECQKTPAFDVTDVQDQDSKWEDSLVGKTIPPSQQNNPPPAEGPTELGTSGFFGF diff --git a/motif2.txt b/motif2.txt new file mode 100644 index 0000000..7a60f45 --- /dev/null +++ b/motif2.txt @@ -0,0 +1,13 @@ +DEFIALMHGSDPVRVELTRLENELRDKERELGEAQTEIRALRLSERAREKAVEELTDELEKMFEKLKLTESLLDSKNLEVKKINDEKKAAMAAQFAAEATLRRVHAAQKDDDMPPIEAILAPLEAELKLARQEIAKLQDDNRALDRLTKQKEAALLDAERTVEIAMAKAAMVDDLQNKNQELMKQIEICHEENKILDKLQRQKVAEVKKLSLTVKELEEAVLRGGATANVVRDYQRQVQEVNDQKKTLECELAAQWWRNYGGARAKVTANRVAVVVANEWKDSNDKVMPVKQWLEERRFLQGEMQQLRDKLAVAERTARSEAQLKEKYQLRLKVLEDGLRGPPSGSSRLPTEGKSFSNGPSRRLSLGGADNMSKLSPNGLLARRSPSFHSRSSLSSSSSLVLKHAKGTSKSFDGGTRSLDRSKINGNGAHLLNRSTDAVRDCETNDSWKGNADEGTIENTNSNTDESNKETANNKSAEMVSGFLYDMLQKEVISLRKACHEKDQSLKDKDDAIEMLAKKVDTLTKAMEVEAKKMRREVAAMEKEVAAMRVDKEQEVKARRLGSSKGTGSSQV +LAHSDPIVLEFNRLQNQLKEKDRELGVASSEIKALRATIVLKDKALEQFRNEVNKLDERLGVIENLLKQKDLEIKKLTSEKKDALAAQFAAEAALRRVHANQKDDDTVPIEDVIAPLEADIKMYKIEIGRLQEDNKALERHIKSKESALLEAERILRSALERALIVEEVQNQNFELKRQIEICQEENKILDKTNRQKVLEVEKLSQTIQELEEAILAGGVAANAIRDYRRQISELNEEKRTLERELAAQWWRNYGGARVKVSANRVATVVANEWKDENDKVMPIKQWLEERRLLQAETQRLRDKLAISERTAKAEAQLKDKLKLRLKTLEEGLKQVSSFSENPYLSCRSPKPEKSNHILGFLSGNGGLKRRSTSQPRGSCIGKTSPLMPPNVENGAADAAGELKGVNSLKKKYASGENMLRKSLWASRSKVADIGGKENTEMKSNTDMHIDKFNNDTAVSADAKIKGGAKEETQNVGSAGFDSEDMVSAFLYDRLQREVINLRKSCEVKNNTLTAKDDEIKMLMRKVDALSKAIEVESKKIKREAAAREKEAISTKADENKKIRNTDSSKRRVA +SSDPIVLELNRLENHLKDNDRELGIAHAEIKALKVTERLKEKAVEELNDDLKKLDEKLRFTENLLEDKNLEIKKLVSERRDALAAQFAAEATLRRVHANQKDEDYIPLDAVLAPMESEIRMCRNEISVLQEDKKALERLTKSKELALLETERMLKIAIERALLVEDLQNQNLELKRQIDICQEENRILDKANRQKVAEVEKLSQTIHELEESILAGGAAANAVRDYQRQILEMNEERRTLERELAAQWWRNYGGARVKILANRVATVVANEWKDDNDKVMPVKQWLEERKVLQGEIQRLRDKLNVSERTAKAESQLKDKFKLRLKTLEEGLKQVTTSSPNTEGSHLKQTVKPEPVLGYLSSNMGPRKRSQSQPRASFNAEQSTVQQRPNVTSENSNSNRTLEHVNSLKYKYISGKNLVKKNLWAPRNKLVDDVGKENSERKEDVGLEEFASVGPEVSKDFSAEAHSMQSTPEKDDLNVDCEDIVSGFLYDKLQKEVLNLRKSSQEKDGLLTAKDEEIKMLVKKIDTLTKAMETELKKMRRESASKERELTPRRVQKDPLHKSSTMIISKRAVKSV +EDIIHLLHGSDPIKVELNRLENEVRDKDRELCEAHAEIKALRQTERLKEKAVEELFDEREKLQEKLKAMEIALENKNLDLKRTNDERKSALAAQAAAEATLRRLHASQKDEDLLPLEAILAPVEAELKSTRNDFLKLQDDNKALDRLTKSKEAALLEAERAVQIAEAKASLVDDLQNRNQELLKQIEICQEENKILDKMHRQKVAEVEKLSTTVAELEEALLAGGAAANAARDFERQVHHLMEEKRTLERELAAQWWRNYGGARAKVTANRVAVVVANEWKDANDKVMPVKQWLEERRFMQGEMQQLRDKLATTERTARSEAQLKEKLQVRLKVLEEGLRTSTNGSTRKHDDFLRSGTNGASVRRQSTGGSDIGNGVARRRPSMSSASQMRGSVSGSTILKNGKFGSKAFDGSKSLDAGRFKAYANGCEEPRKVSSAASGAGGGGGGGGGGGDVKPEAGKVEGATVAAADDNVSVLFYDMLQKEVVTLRKLGHEKDQSLKDKDDAIEMLSKKVDTLTKAMEVEAKKMRREVAAMEKEVAAMRVDKEQENRARRLSIAKGSVNSSHA +EDLLNLLHGSDPVKVELNRLENEVRDKDRKLAEATAECKVLKQRERLREKAVEELAEELDKVDEKLKAAEDLLESKNLELKKLNDEKKAALAAQFAAEATLRRVHAAQKDEQLPSIEEILSPLEAELKIARQEIAKLQDTNRALDRLTKSKEAALLEIERAIDAAEAKASQVDDLLNRNQELMKQIEICQEENKIMDKMHRQKTAEIEKLSSTVAELEEAVLAGGAAVNAARDYQRQAHELLEGKKTLERELAAQWWRNYGGARAKITANRVAVVVANEWKDANDKVMPVKQWLDERRFMQGEMQQLRDKLASAERTAKNESQLKDKFQMRLKVLEESLKPVTNGAPRRTEEVRSSSTTRRSTSGSEEASKLLANGSRRQRSAVTQVRASMASQTLMRATNGRMTSKSFDGGRSLDAGTTRLRAFSNGFEEVPVKPDSVEAKSEVEAVKSENGTTNQVSGSSSSVEDPVSGVLYDLLQKEVVNLRKASYEKDQSLKDKDDAIEMLSKKVDTLSKALEVEGKKMRREVQAMEKEVATLRAEKDQTRNPRRLSSGTGTVNSSSK +NEFITLLHGSDPVKVELNRLENEVRDKDRELGEAQAEIKALRLSERLREKAVEELTDELSKVEEKLKLTESLLESKNLEIKKINDEKKASMAAQFAAEATLRRVHAAQKDDDMPPIEAILAPLEAELKLARQEIAKLQDDNKALDRLTKSKEAALLEAERTVQVALAKASMVDDLQNKNQELMKQIEICQEENKILDKMHRQKVAEVEKLTQTVRELEEAVLAGGAAANAVRDYQRKVQEMNEERKTLDRELAAQWWRNYGGARAKVTANRVATVVANEWKDANDKVMPVKQWLEERRFLQGEMQQLRDKLAITERAAKSEAQLKEKYHLRLKVLEESLRGSSSNTRSMPEGRSTSNGPSRRQSLGGADNFSKFTSNGFLSKRTPTSQLRSSLSSNSVLKHAKGTSKSFDGGTRSLDRGSRALLNGSSPNCSFNQPCDETKDTEAANMWKGNSDEKPVEFPVTETEDTVPGVLYDLLQKEVVALRKAGHEKDQSLKDKDDAIEMLAKKVETLTKAMEVEAKKMRREVAAMEKEVAAMRVEKEHENRAKRFGSSKGPVGAAQL +DLMNHFNGSDPVRLELTRLENEVRDKSRVLAEAQAEIKSLRLSDRQKQKAVDELSDKLEKVDEKLKGTLILLDNKNLEMKKLNDERKAALAAQTAAEATLRRVHASQKDNDMPSLEVILAPLEAELKIARDSAVVVVTLQISKLQETNRALDRLTKSKEAALIESERVIKAAEAKASMVDDLQNRNQELLKQIEICQEENKILDKMHRSKVNEVEKLSATVRDLEEAVLAGGAAVNAARDYQRQVHELMEIKRTLERELAAQWWRNYGGARAKISANRVATVVANDWKDESEKVMPVKQWLEERRFLQGEMQQLREKLASAERTCKSEAQLKEKVQLRLKVLEEGLKSGNGTVRRGAGAGGTVEAKRSSSVTSNGSVRKGSGSEEGAKVLANGSRARRSAVSQLRAMGGPLVKNGRLTSKSFDGGGGGRSSSGGSYDAGGMAALKPFTNGFEELRAGIKTESRSCSGEAAGDAGEGAGDTVSGVLYDMLQKEVISLRRASQEKDQSLKDKDNAIEMLSKKVDTLGKAMEVEAKKMRREVTVMEKEVASMRVDKDQERRMRRLSMMKEPVNSSQR +EDVINLLHGSDPVRVELNRLENEVRDKDRELGDAHAEIKALKYSERLKEKAVEELTDELQKVDGKLKATEALLESKNLEIKKINDERKAALAAQFAAEATLRRVHAAQKDDEMPPIEAIIAPLEAELKLARLEAAKLQDDNRALDRLTKSKETALLEAERTVEIALAKASLVDDLQNKNQELMKQIEICQEENKILDKMHRQKVAEVKKLTQTVCELEEAVLAGGAAANAVRDYRRKVQEMNDERKILDRELAAQWWRNYGGSRAKVTANRVAVVVANEWKDANDKVMPVKQWLEERKFFQGEMQLLRDKLAVAERTAKAEAQLKEKYQLRFKVLEERLRASPSGNLRTTSEGRSISNGPSRRQSLGGAENLSRSASNGFALRRTANSQSGSIRSNSASVLLRNAKISSRSFDGGSRSLDRDKVIPNAARKHEVLTDTNDQIQNAKTIGTHEASTNGNRSEKTKSELDDSVSGVLYDMLQKEVITLRRACHEKDQSLKDKDDAIEMLAKKVDTLNKAMGVEAKKMRREVAAMEKEVAAMRVSKEHDPRARRPSAPRGSQ +DDFISLFHGSDPVRVELTRLQNELREKDRELGDALAEIKSLRNSERLKEKGVEELTDELIKVDEKLKAAEALLESKNLEIKKINEEKRAALAAQFAAEATLRRVHAAQKDDEMPPIEAIIAPLEAELKLARMEVAKLQDDNRALGRLTKSKEAALLEAERTVQIALAKASLVDDLQNKNQELMKQIEICQEENKILDKMLRQKVAEVEKLTQTVRELEEAVLAGGAAANAVRDYQRKVQEMNDERKILEREVAAQWWRNYGGARAKVTANRVATVVANEWKDANDKVMPVKQWLEERKFFQGEMQQLRDKLAIAERTAKAEAQMKEKYQLRFKVLEERVKTSNGNSKFTVSDGRNIATGPSRRQSFGGAESLSASSSNGYQSRKTSISRPGSLRSNSANVLLKHAKLSSRSFDGGSRNLERERPTSDANGLDNMPRNSNIQTITSETITTHEESANGTPVKKSKSENEDYVSGMLYDMLQKEVISLRKACHEKDLTLKDKDDAIEMLAKKVDTLSKAMEVEARKMRREVASMEKEVAAMRISKEHDHRARRASAPRGAVNSQSI +EEFINMLHGSDPVRVELCRLENEVRDRDRELSEAQAEIKALRLSERAREKAVEELTEEVNKMDEKLKLTESLLENRNLEIKKINDEKKAALAAQFAAEATLRRVHAAQKDDDMPPIEAILAPLEAELKLARQEIAKLQDDNRALDRLTKSKEAALLEAERTVQIALAKASMVDDLQNKNQELMKQIEICQEENKILDKMHRQKVAEVEKLSQTVRELEEAVLAGGAAANAVRDYQRKVQEMNDEMKTLDRELAAQWWRNYGGSRAKVSANRVAVVVANEWKDSNDKVMPVKQWLEERRFMQGEMQQLRDKLVIAERTARSEAQLKEKFQLRLKVLEDGSRMSASGTYRTTIEGKSVSNGPSRRQSLGGADNVPKSVNGFLSKRPSFQMRSSVSSSTVLKHAKGASKSFDGGTRSLDRSKVLLTGAGLSLNRSSDATGDGVTHESWKKIPDEKTNDFPNVDSDDCVSGLLYDMLQKEVITLRKACHEKDQSLKDKDDAIEMLAKKVDMLTKAMEVEAKKMRREVAAMEKEVAAMRVEKEQDNKSKRLGGSKGLANSSQL +DDFINLLHGSDPVKVELNRLENEVKDKDRELGEAQAEIKALKLSERLREKAVEELTDELQKVDEKLKAAGALIESKNLEIKKINDEKKASLAAQYAAEATLRRVHAAQKDDEMPPIEAIIAPLEAELRLARLEGAGSPYQVKGAALLEAERTVQVALAKAALVDDLQNKNQELMKQIEICQEENKILDKLHRQKVAEVEKLSQTVRELEEAVLAGGAAANAVRDYQRKFMEMNEEKKILDRELAAQWWRNYGGARTKVTANRVAVVVANEWKDANDKVMPVRQWLEERRFLQGEMQQLRDKLAIAERTAKSEAQLKERYHLRLKVLEDGLKASPSGHIRPSEVRSVSNGRSRRQSLGGAENFSRLSSNGLSRRTPASSPSNNISTVLKHAKGSSRSFDGGNRLSEKNKVCLNNGVVPNSSLNTAVEEHRRTENSNTCKENQDVKQSDTSKADADDYVSGLLYDMLQKEVIALRKASHEKDQSLKDKDDAIEMLAKKVDTLTKAMEVEAKKMRREVATMEKEVAAMRVGKGHDLRTKRLSNSKVTSQL +NEFITLLHGSDPVKVELNRLENDVRDKDRELSESQAEIKALRLSERQREKAVEELTEELGKMSEKLKLTENLLDSKNLEIKKINEEKRASMAAQFAAEATLRRVHAAQKDDDMPPIEAILAPLEAELKLARHEIVKLQDDNRALDRLTKSKEAALLDAERTVQSALAKASMVDDLQNKNQELMKQIEICQEENRILDKLHRQKVAEVEKFTQTVRELEEAVLAGGTAANAVRDYQRKFQEMNEERRILDRELAAQWWRNYGGARAKVSASRVATVVANEWKDGSDKVMPVKQWLEERRFLQGEMQQLRDKLAIADRAAKSEAQLKEKFQLRLRVLEESLRGPSSSGNRSTPEGRSMSNGPSRRQSLGGADIIPKLTSNGFFSKRSPSSQFRSLNASTSTILKHAKGTSRSFDGGSRSLDRSKVLTNEPRSKFPLNQSSEGTSGGGSPNSTKQGDSEKAAGTNNDSVPGVLHDLLQKEVITLRKAANDKDQSLRDKDEAIEMLAKKVETLTKAMEVEAKKMRREVAAMEKEVSAMRVDNKGSDSRTRRHSTNSKGASTTAQL +DDFVNFLHGSDPVKIELNRLQNEVIDKNRELVDAQAEIKALKLTDRIKEKALEELTEELRKMVEKFQASEAALENKNLEIKRVVDEKKAALAAQFAAEATLRRVHAAQKDEELPPLEAILSPLEAEIKQLRQEVSKLQDDNRALERLTKSKEAALLEAERDVQSAYFKASLVDELQNRNQELMKQIEISLEENKILDKINRQKIAEVEKLGQTVRDLEEALLSGAAAANAVRDYQRQVSELKGEKRTLERTLAAQWWRNYGGSRAKVVENRVAVVVANEWKDSDGKVMPVKQWLEERRFLMGEMQQLRDKLSIAERTAKTEAQLKEKFQLRLKVVEDGLRSSFNGGVRSSELQNCSNGVSRRLSLGGFENSTKLSSNSFGTKKVPSLTRSSTMSSTSSSALLKHAKGASKSFDGSKSSSEGQSIDGNKSFSNGLDDPCFGNNTDESSMNTINNSGREICCNKQSEFAEPTSTDLVSGILYDMLQKEVIVLRKASHEKDQSLKDKDDAIEMLAKKVDTLTKAMEVEAKKMRREVAAMEKEVASMRADNEHGQRGRRLSGSSKGLLNNAHM diff --git a/noMotif.txt b/noMotif.txt new file mode 100644 index 0000000..3b73db7 --- /dev/null +++ b/noMotif.txt @@ -0,0 +1,66 @@ +GAFNAMFDYHGCWHKDAAATGSLCFDGRFIELYAVEAPRAHLALLDRVKRDVPPFWDPAALAEFIDKYGTHVIAGVKMGGKDVVCIKQLKGSNLTQSDVQSRLKKLSDDKLAQDSPESLTARDDKFLLGLNGSLLLGPGSAAWRSFRPSVVSHKDDILSIHIRRGGVDNGQGHSNWLSTISGSPDVISMAFVPITSLLTGVRGCGFLNHAVNLY +GLFNSCFDFGSDSWASDAGDTRCLAFDGYFISLLDLRLDCRPLALAGHVVADVPAAWDPSAIASFIEKYGTHIIVGLSMGGQDVVYVKQDKSSPLSPSVIKEHLDKLGDQLFTGTCTLPPSHCKSRDHKFKVPEAFNVFDAQMTRQRIEGMTAPMSCKEGVTVIYSKRGGDTAASNHSEWLPTVPLMPDAINFKLVPITSLLKGVAGVGFLSHAINLY +KAITNDIYIPAEFAACEFSLKSGKSSLYSSHINPGQLIFGQGSDTLHHTSNTHQLPLPPNALGEANIGKLYVSIVEYLRGCQDGAGQPNEPLVVFTSTELVPVVRGCFRYLESDSDELQENIEVYDIQYLFYVLKKEVMDIADLPNEHINKSITDNLFVNDFFEYHSGISCQFHEDNDRGKYCTQSKVARWCYMFSDYMCGDLAIKPLPGKHMPPKQEP +KLAEYSMEKTKNDKFSFASQSTSCVFYRSYRLSSSPTLSQEFRKAVRGLPKTYSPENKLKFYRLIDTFGTHYITKVKLGGEVQSVTSIRQCQASLQGLSTEEVQMCLEAEASATIKATVKTELKHCKKDTEKMESKSSFSSLFNDRFTEIKGGQTTEPDLLFSSDKDPSAYKEWLNTLPLIPDIISYSLNSLHELLPTSCPVRKDLRSAIRHY +NPFSASIPYKGYFTDLEIKKRKYIVAENTCLHSYATYSLRESIKNINSDFLLDTENLPILSKSITEKTCSKLIYMYNSKNDQCIKFIKPWIDFFRKYGTHVIVSAHFGGKTINTLEVPIHKFEELKIYNYKYPIENNRYLNVFKDRLLLQKILKIEKGEYAYRGGSQDNYMEDEQAEKNNDNLEKKANDVLNKYENSTSNKINLDIKGGTKLNEDWKQLTYEKWRNSIYTNIAPIYLDLFSLSSFMHIEKKESYNNALLYY +YSFSASAGYKNALKKLKIQNSIIFMMKIYCLRYYTGISTTTNTWEFTNNFRNALNKLPNTFDGLKEDNECTYEYYITKSHSPQCEKNVNKWMTFFKLHGTHVAHEMYLGGKIIIKVNIEKEEYNKMKETNLDMKTVFDFYFHKMGLSARKNRRIQKFINKMHGSKTVSILGGHPGLNIDDPSFFEKWINSIDKNSMPIRTKLLPFSFFMDDPNMIKAYNDALMFY +QFSEKIFPIEIGISSYSLKENKEIASYHKLLYPGKFKNVFARTQMIHGIDARDPRLEQNYSLVCIELIKYIEQFPGLAFFVSKEESLAGDKKCIDEIFLRGNVPIPKQIRFITHIQLFDYWCSIQHIELHEKSSFILNHIFKQLECAERCEYHKKINQKYHCALSDARHTSLMELICMKSYGATIIGSDTLPSVKFV +AKYSKSVKKLRRVSGKSYSFVRAKAQLELAQYMLKSNDLMLHPEFLHRLRALPLSYVYGEYRQIFQDYGTHYITEAALGGEFEYTIILNKERLEQSDYTLEDYKKCAQAGLKVGANIYGVYVSAGVHGGSCNGLLNEMGENTARGSMVEDFVSVVRGGTSESITALLSKKLPTPELMRLWGEGVQFNPDFIRRTTQPLYELVTSRDFSQASTLKRNLKRALSEY +VLGGSRSDLAKFARSQHSVDKATFAIHEISCTYYSYRLADHPQLSAEFTKYLRRLPQRVQTKQDRGPYRRLIDTYGTHYIHQVQLGGKVRRITAFRTCLATLKGFAETDVKTCLNAELRMSLGFLPANVTLSNKCDNLLKGNMSMGFYQGFMTHKIEVIGGERYFPDILYQQDPSEAYDSWMNSLHDNPDVISYAIFPLHQLVPDSQIAANLRDAITEY +YSKNKSVQRLRQYSETKDKTYMRVSGTVQLASFQMRTRGAMLSPTFIEDIKSLPRDYDKAEYFSILEMYGTHYTVSGTVGGKYDLVYVLDSIVMKSLDITTEDVTDCLKLNAGANIGGTENGAKVDVNPNVKTDICNKGGGETETEPRRTQKPVIESIISFVDGGSVEYVTALEEKLNKKEPVADVDDYIQWASSLKDSPTVINSKSNPIISLIPTDIKDAYIKTRNLERAIEEY +GSQESEFFHNVTHYKSTDLGFVRLWSKVETAHFKMRSDKLMLHEDFYISLMDLPEQYDFGMYSRFFNTYGTHYVTQGTMGGTLEYALVLNKTKMAESKLQGEQAGRCFSASIGLSYPIGQGASVDLKLGVNPCSKDGTFNQGSDASSVMVEDIITLVKGGILDSTSGVMVVRNPETYRTWGASLKYNPTLIEHEIMPIYELVRFSTAADHVGARLANLRRAWDEY +TDICTVPVEICIKPTLLNGTINIECFQTIINQPIPIQHFLNSKHYTDFEHGISQENNPVPQTDFDFLWKKINTFIKSNMSKYSDSSMLPIIICTPFISSVQCVEFLASQAKVSDVRRSIFNTMFSVDDFVECVNRFKEIIPNTNAIYNFYKPLVCWTCNNDFKCDFHKSNGTRTFCCSKTNSEYLASTLCDLYKTIKSKIFVASMPSQV +DRRKFHKTVTESRAHRLIILKNKVELAQFQNTAPEYLTLAEGFWRALSSLPTTYDYAAYRQLFQTYGTHYFSEGSLGGEYQALLELTQHALATTSTTSREYERCWRKVKRRFLRKKVKTVCEKLTSSTAASYVTPWSPGTSMRNVPIKVDVVGGNPGLKRFLSILDLENPEENGRKYDDWASSVKDFPQIIEQKVRPLYELVKEVECAGLKKLHMKQALEEY +VNYEHKLENKSLNKLLTKNNLSIKKINCSIHTSGMIISYQWKLKKSISILLNDIQNKLVKDSGHTSNSNPQKNQKNIEKDWYNIFNTYGTHVLTKITLGGKIIEINAVEGGQNITENTSIFGSKLDINFFKMSLNSNSKDKLHDLDKNKSEKIIILGGNAMTTDRKTTNNNGEINYDKKLDKQKWVETIKYNPVPIKFELTPLSYFIYQNFSDENLVNSFHYF +HGDMPSLCEQRYVPCEIACVRYSLREGILGSFHDFIDPGELPRGFRYHCQSGSASTHQIPISGFELANSDYHNMFRKLCSFVCPTPCPVVPVYTKANDIYRVDWCLQWLANKAGMENHFRVQEVETLIIKFYQDKLQEEPSRPTVSRLLDVVQWDYSSNTRCKWHEDNDMWCCALASCKKIAYCISKALASVYGVTLTPAHLPNPERS +VSLSGEYVPAELAIIKYSLNDGVMDSLNVLINPTDLPLGMALDAKTHSSSTHQLPVPPDALGEANYEKILRQILKFFKNTSGSKVVPPIFTWNKDIPMVDSILRGILEATDLDYVKFSILPLIDFFYNLKLATEDYGLDIKTFPSIHLAKALLEKDVYAYTAGIACDVHEQLNNQVACALSRVVRWAYVISDSCCLDVGIEMEKGRHLPHNMTT +FSFSASTGYKNFVKSTATNKVRTYITKTYCLRYVGGIVDYHSLDTTDEFKKAVEALPDKFDSHSCTIETFKSNEDDSICAETVLPWMQFIKMFGTHFTTIVHLGGKITHQVQIDKSDVLHMQQNGINVDAAVKASISPVMVDSLQGGFASTSEKASLSQSNNLKYDKQVLVIGGDGLVDSKNANSLNNWAKELYKRPMPIKIKLESIKSLLGKKRELFDEALKFY +SHSRSSQFASSHSRKDKFSFTTHNLKCSYYTFRIHSRPPLSKEFEESLKNLPSTYDHKNTSAFTQFLSVYGTHFIRRVRLGGHVNSITAIRTCQASMSQMSVQTVSNCLSVEAQANIKGVTVSAATQFCKTKSSKLKTGATFRQAFSDRSIEVLGGDGDVGDVLFNSNGVAGFKKWLASIKRVPGLVWYQISPLHLLVPDNPVLQETLSKAISHY +KAIGNDIYMPAEFAACKFSLRSGRGPVYSSHINPGQLIFGQASDAQHHTSTTHQLPLPPKAMGESNMGSLYVNIVKYLRDCQGAGNPLVVFTTAELMPVVSGCFRYLQSDSDEVGEQIHVYDILYLFYVLKKEVMDIADLPHANINKCITDNFFFNDFFEYYSNIACQFHEDNDRGKYCTHSMVSRWCYTFCDYMCGDLAIKPLAGKHMPPVQEQ +ASFSASADFKQMKDTLSQKDTQCIQSHATCTAFDLSFYNDINSLPLLSLQLVDKIQQLYSYSNYTNEKEYYYDFFDSWGTHVATSVRLGSLFGYQFKMSSSSVQQQSSLGFDASVGASLYGVKGKVSTSYAQQQLNSFQQSLKSWSSYSLGATPNANLDAAQWATQTLDTPMPIKTELTPIYTFISQYQNNADIPLNSTTMAYVVNAMQNY +FSASATNEFSDSSLRKSENEFSRCQQSFDLWSISIPADIARLQNYVSDDFIKLINAINPESKDSIATVFNVYGSHVLMSGVMGGKAHVSASANKLTLTQKFEMSTIVQAKYEQLTSQLSVEDKLKYSEAFDSFSESGSYTYDILGGSPSLGALVFKNNSQGSSDDNLKNWIQSISSMPVLTKFIDQTSLMPVWLLCEDKTKADALKKY +GSFSASTGYKKFINEVSKRTSKTYFIKSNCIKYTIGLPPYVPWEQTTAYMNAVGILPKEFTGLNEDSCAPDVYEQKKMTKQCKNVHQWIQFFKTYGTHIIVEAQLGGKITKIINVSNTAVNQMKKDGVSVKAQIQAQFGFASVGGSTSVSSDNSSKNDNSSYDMSEKLVVIGGNPIKDVTKEENLYEWSKTVSSNPMPIHIKLLPIYKSFDSEELKESYEQAVLYY +KYNINRLLCYPAEIAITTFNMKEGIIYSDSKFVEFDERWAFGQDERDHRTMSERVNENEDLDELMHQLSSTIGIDHLSTDHNPESPFGVFEWLRSRIDIYPYAKILVDMNQFRFVYNGLKNIAKYHGFTGQTYFNENIKFNMVSIQDFTDVLLDYCSLLVARRWSDQDINNQYLRPNLVPNRDKNTICEYHETVPCPTRYNCMKAHNSRLVHHFFTIMKAHRLQNFRYSPPVHEPCIEDM +NGKFSTENQRMKIHQVKDSSVTTRVQIRNFIYKVKVFPDFSLDVRFAQQAKEIADAIENNQSRYADYLSERMVMDFGTHVITSVDAGASLVEEDYLNSKYVSDNVSQSSSISAQAGLNFFDKLKFDISSHNSQQSSTLQGYQSNIRYSLIQSHGGGIPFYPGMTLQKWQESTRNNLVAIDRSGLPLQYFISPNMLPDLPQPTVRKVSHLVRSAIERY +ISLGINHELDQFHQEITQNNKAVSVSQSYWAQYSLTTAPAFLMPLNPMFKQSLDALNRMAKEPTTDTQQTIYNQVINSFGTHYVTSAIMGGAAKIYTTLDQNYLKTVDIEQTKTQIGINFSYNVFQFKFGFNSTDLAQKLDENFKKNSNDIIIFSPEVDHISDPKAWSTWESTVPEKPQPVNTTVSYISDLAYEFPEVQAHLRKTIEFY +KAVNTDIYIPAEFSACEFSLKTGVNSLYSTMIDPSQLIFGQTCDAMLYAAATHQLPLPPAALGESKMTKLYHSIQDYLRSRLERTDKNLKSLVVFTKTDDIDMVKSCFRFIKSGYHDEQSKRYDDDNDEENDQFKFFEAAASKFLPIVVYDIQYLFLALKLAAMDIGGLTLPKPNLYITDAFFSRDFYEFQDGIACWFHEDMDRSKYCTQSKVKRWAYTFCDYMCADLAIKMQPGKHMPPSYKA +KALTGDIYVPAEFSACRYSLKGGISSNYSTMINPGHIIYGQSRDAQDHSKTTHKLPLPPQAFGETNMGKLYIDIFNWLSVRNEEKLDQDPVIVYTTPELMPVVKSCFRYLASEAEIDEDERKIMVFDIHHLFYTLKKSVLDVAGVTNDRINFHVTNNFFVKDFFEYTEGISCDYHEKIDRSKYCTNSMVKRWGFTFSDYMCADLAIPLQPGKHIPLKVKP +NSFTGSLEYKNALMNFKSKRQKIYNKTEQCVRYQVGIPLNLKWGYTEYFNRTLSRLPILSSKVIKNCNIDNKLNLSDEECKSIKPWIKFFEVFGTHFNNQLTLGGKINQTMVFDSSTLEELKKKGIDIEAEVRTELGSGNVKLNLDMGGKKSRLDEIGQKKMSVLGGKMPNFPMDDNEFAHWAETVAENPMPIGVVSTSLKTLMHPAMHQSYDQALHQY +VNGKFSTEFQRMKTLQVKDQAVTTRVQVRNRIYTVKTTPTSELSLGFTKALMDICDQLEKNQTKMATYLAELLILNYGTHVITSVDAGAALVQEDHVRSSFLLDNQNSQNTVTASAGIAFLNIVNFKVETDYISQTSLTKDYLSNRTNSRVQSFGGVPFYPGITLETWQKGITNHLVAIDRAGLPLHFFIKPDKLPGLPGPLVKKLSKTVETAVRHY +SSHNSAFKQAIQASHKKDSSFIRIHKVIKVLNFTMKTKDLQLSDVFLKALNHLPLEYNAALYSRIFDDFGTHYFTSGSLGGVYDLLYQFSNEELKNSGLTQEEAKNCIRIETKKRYFIVTKTKVEHRCTTNRMSEKYEGSFLQGSEKSISLVKGGRSEYAAALAWEKGSSGPGEKTYSEWLESVKENPAVIDFELAPITDLVRNIPCAVTRRNNLRRAFREY +YSGYNNDEYTHDDMLHNLNKHNKLLIKSYKCIVYKANLTSLNFLKNKNNDEIGLNFNGMLILNVLKKLNKNCNSEFDNQKCPISMFRNDPFDANCIRCIMPWMEFFKDYGTFMTKEITMGGVINKFYNIKKYEGSMRKEYKKKTIKQSSTFFHLSKSRSESLNEKKSGETNKEELEELYTLTIGPEPPGNVSNSKVISDWLEKVVHNPTPIDLELVPIKQIIPEKYLKIYENALKYY +SGSRESAFLNKLSKYNEKKYSFIRIFTKVQTASFKMRRDNIMLDEVMLQSLMELPEQYNYGMYAKFIDDYGTHYITSGSMGGVYEYILVLNKENMTKSGVTSDDVTSCFGGSFGIDYDYTDNLQITGSLSGKHCKKLGGGHREDEESNMAVEDIISRVRGGSSGWGGGLTQNGSIITYRAWGRSLKYNPAVIDFEMKPIYEILRHTNLGPLEAKCQNLRRALDQY +KALTTDVYVPAEFSASEYSFNEGIMSVYSTLIDPGQIIFGQGSDAQHHSSTTHNLPLPPNALGEKNMGKLYRNILEYLSKIQEGKDATKPFVVFTKTDMVPVVKSCFRYLACENQDGSYENGDQIQVLDIQYLLFILKKEVLDIAGVSDEKINLYVTDAYFLKDFFEFTPEISCQYHEENDRSKYCTQSLVMRWAYTFSDYMCSDLAISVQPGKHIPPKTKP +SVAGSHSKVANFAAEKTYQDQYNFNSDTVECRMYSFRLVQKPPLHLDFKKALRALPRNFNSSTEHAYHRLISSYGTHFITAVDLGGRISVLTALRTCQLTLNGLTADEVGDCLNVEAQVSIGAQASVSSEYKACEEKKKQHKMATSFHQTYRERHVEVLGGPLDSTHDLLFGNQATPEQFSTWTASLPSNPGLVDYSLEPLHTLLEEQNPKREALRQAISHY +KALTTDVYVPAEFAACEYSLKEGIRSIYSTMIDPGQIIFGQGSDALLHSSTTHDLPLPPNALGEKNMTKLYRNIVDYLSKCQGKGKTLVVFTPAENITMVKSCFRYLECDDDFRDGGEKIQVFDIQYLLFILKKEVMNVADLNDEKINKFATDAFFKKDFFEFTAGIACQYHEDNDRTKYCTQSMVTRWAYTFTDFMCGDLAITVQPGKHIPAQTK +AKFSLSTNYSEISDLLKNNDNKLYVDKSYCFLLEAALPIHNSLKMTRSFATAMSKLTRDFKKHTKDCNAIKYSINKNNKDCKEIKNWMELFDQFGTHFSYNIKLGGRITFITQEEGSKDERGNEKSVDVGVGGKFEKDNKGVGIEGNVKFVFGNKRGESKNLSFKYTNILGGLPVSDISKESEYVKWIKSVYKYPMPIRTQFAPISKIFKSKALKDSYDEAFRFY +GSFSASVGYASASNTISKKKFRMFILKSYCFKYVASLSQYSQWKLSDQFLRAINLLPSYFNSLEHDGKYCNAEELRDNKTGMDSCGKSVESWLYFFKNFGTHVSTVIHLGGKITQQVKISKNEYKSLSESGLSTSVSASVGFGLFKANASSSTDSKESSNEESSNSSIEKETVIIGGTTIYDPNDPSNFEKWADSIKNNPMPIKGQYEPLSRILPERLTKIYDEALSFY +NIDGECMLAEMAMNEFSLFSGIVEKFHAIVGPWMPESESHRRRASRHALETHRIPLQNNFATITKKRLVEEILGRVEPSIACHQGVKVGLYSDACNEKTKIDLNIKNNFKDPGMLCDKNDRRFILVLQSELDLMVDSMKHLANNVGFHYDGFPVTPNCFVIVEAFVEAISDIMNEKIDVETMRWFSLLGQKVDAEDSVSPWETGTDFHCARHSEPKSNFCASVTVGRTCCIVYHVIGSFFRRYHLKKIPTAHQPSSSNS +KALNGDVYQPAELSACRFSLKGGISSNYSTMINPGHIIFGQTSDAQDHSRTTHKLPLPPNAMGEKNLGNLYSDTLKWLSASNDEEDEQYDHPVIVYTTPELMPVVKSCFRYLACEGDTDKHAKKIIVYDICYLFLTLKKTVLDLVGVPSDHMNIHVTNSFFRRDFFEFSSGIACDYHEEVDRTKYCTKSMVLRWGYMISHYICGDLAIPLQPRKHVPIEVKH +RTNTGVHLPAELAVVRYSLEGGVKDKLHMFINPGRLPIGMAYDAQRHAEEDHQLPLPPNAMGVSDYGDVAMRLFSFLLQNDDMPLLFTDETDVPRVESMLEHILSDHLSEIELRICPLAELFFRLKQNVELYMMDQTTFPSVYIAQQIITKDVYDYTKGISCDYHEEKDNVLYCPLSRCIRWAYIISDNCCQDMGIEPIPGKHVPLNANT +FSGSLTCEFVKKSTQHAKNTVTCSTAAHSLYTLKEDDSSNPSEKRLDSCFRNWIENKLSANSPDSWSAFIQKFGTHYIASATFGGIGFQVLKLSFEQVEDLHSKKISLETAAANSLLKGSVSSSTESGYSSYSSTSSSHTVFLGGTVLPSVHDERLDFKDWSESVHLEPVPIQVSLQPITNLLVPLHFPNIGAAELSNKRESLQQAIRVY +WAFTASSEFNHMQQKIEQTSATFVISMATCQIAQITQVPELAEFHQSFIDQLSALPVEYSAPQYLEFLSNFGTHYATDIILGSKVGYVYTLPPAIVDDFDQKKFKEIDLKQAATITSALLKGVIGQQILPKEQEAKAYSDVSKLSTQSFTIEIGPQSTENTPKDWLRETELEPTPIRYTLKSISELVSEGKGQLSSVKEYQKIGQNLKKALTDY +VTSGGTYIPAEMGLVRYSLKDGVMDKLHMFIDPGKLPLGMAYDAKQHSESDHQLPIPPDAKGEKDNDEIILKLFSFLSQQEKMPPLFTETNDIRMVENILKGILNQGSMDENTLLVCPLSELFYQLKRATESFGLDIKTFPSVHIAQAIIQKDVYEYTKDISCEFHEDQGNGKYCPLSRCVRWAYIISDSCCLDLSIEMKPGRHLPMNADT +KSMTNDIYIPAEFSACQFSLKSGICSMYSSHIDPGQLIFGQGSETMHHTKHTHQLPLPPNAMGESDIGRLYANIVEYLRACNPDAKPNDPLVVFATPEFMPIVKGCFRYLESDSEEPLATIHIYDIQYLLYVLKLEVLDSVDIRNVTVNRTATDSLFINDYFCYHLGISCQYHEDIDRCQYCTQSIISRWCYVFSDFMCGDLAITPLPGKHMPPKQEP +SSSRSYTSHTNEIHKGKSYQLLVVENTVEVAQFINNNPEFLQLAEPFWKELSHLPSLYDYSAYRRLIDQYGTHYLQSGSLGGEYRVLFYVDSEKLKQNDFNSVEEKKCKSSGWHFVVKFSSHGCKELENALKAASGTQNNVLRGEPFIRGGGAGFISGLSYLELDNPAGNKRRYSAWAESVTNLPQVIKQKLTPLYELVKEVPCASVKKLYLKWALEEY +KDACTPAELAVVQFTLKHGMRNIYHTLINPDGSQYATQEHVRATHQYPNALGNDDLEGILADLLEFVRLECGPEAELSPMFTLESQISVVNNALEFLNGGVASQLKVHPIEYLFYVLKKATCAAGILPPPASFHITNAQFNLDPHEFLSDIGCEFHKQRDLTAHCAKSYVTRWAFAFADYMCSDLAIKMLPNRHMPNRLDT +IDLANEPLYREAVKASQQKDSVFYRVHQVIATSTFKVKSSDLYLSDPFLQFLNSLPLEYNYALYRHIFQLFGTHYFSSGTLGGKYDLLFQFDREELKTFGLKESDSEYCLSDDDTLVTFFYNRHKQRNTCGNISMKTKYEGSMVKASERCITSVQGGRTEFAAALAWEKKGVSPQSTVYTDWIKSTIENPVVINYELLPLVNLVRGISCAVTKRRHFHRALEEY +HPFNDSNYYKMLVKRINRGDSIIIEKKLCSKYFSFINDINKNDLDTFFLTTLNELGDNYQNIKDDTYKCSLQYYKMNNMNKYSENCLKTITPWISFFNMYGTHVISGVYYGGKIIHNLYFENNNLKKKEYKIRMYKSRLNPFSTINSNLYFGSSLSKEKIIYIRERNLIMDGGVHINPYNINEVNMENKKKNIYVNNVEKNLYDQKKKYRNYYNFYELKDDVRKRNYYNSWKDTIEWEQAKPVKLNLVPLSEFINSEEGKSAYYMALEFY +CEQRFLPCEIGCVKYSLQEGIMADFHSFINPGEIPRGFRFHCQAASDSSHKIPISNFERGHNQATVLQNLYRFIHPNPGNWPPIYCKSDDRTRVNWCLKHMAKASEIRQDLQLLTVEDLVVGIYQQKFLKEPSKTWIRSLLDVAMWDYSSNTRCKWHEENDILFCALAVCKKIAYCISNSLATLFGIQLTEAHVPLQ +GKFSEENTRMKIHQVRGNSVTTRVQVRNHLYTVNAYPDFTLDSRFSQQISELADAIENNQTRQAMYLSEKVILEYGTHVITSIDAGATLVQEDYIKRSYVSDTNSERSSVSASAGINFFNMVNFNFGSKETEQTSETLTYQQNITYSLVQSHGGALFYQGITMQKWQESTQNHLVAIDRSGLPIHYFLNPAVFPDLPVPTLHKLAFSVQKAAERY +GMFNNMFAFSKCWPKDASSVKTLAYDGWFISLYSVEIVRKQLTLRDEVKREVPSSWDSAALAGFIEKYGTHVVVGVTMGGKDVIHVKQMRKSNHEPEEIQKMLKHWGDERFCVDPVESKSPASVYSGKPKEENLLQWGLQPFGTSVSSAVVMHTKNEEIMRVCIRRGGVDLGQSHERWLSTVSQAPNVISMCFVPITSLLSGLPGTGFLSHAVNLY +GNFNATFGFQSGSWATDAANVKSLGLDASVVTLFNLHIHNPNRLRLTDRVRNAVPSSWDPQLLARFIERYGTHVITGVSVGGQDVVVVRQDKSSDLDNDLLRHHLYDLGDQLFTGSCLLSTRRLNKAYHHSHSQPKFPEAFNVFDDKQTVAFNNFSINSQNGITVICAKRGGDGRAKSHSEWLITVPDKPDAINFNFIPITSLLKDVPGSGLLSHAMSLY +KPFSASMPYKSYFADLEIKKKKYALAQNMCVLNYATYDLKESGNNINKDFVLDIEKLPILTKNQMKLCTKVLYMNNNLHCSEGIKSWMKFFEKYGTHVVLSAHFGGMSFNTMEITKRKIEEIKIYKYKYSLWNNPYLNIFKSGSLFQDLSINVDGHKENKKNNSNNNINIDEKKKNDAYIKNDVLIEQYRDNINLEIRGGNNFDEKWRNLTYLVWKNSIYSNIVPIHLDLYSLNTFMPIEKKESYDMALLFY +EFSAEFMFLNNISKYTNKEMGFVQLMSKIQTSQFKMRSKDLVLDEDMLWALSDLPDHYHFGAYSQFFNEYGTHYVTEGTMGGLMDYVAVVNINEMEENQMTGQMIGSCIGGSFGLVFMEKIKATVKGKSCGKFTSNEKTSDESHSAIKDVFGFVKGGNTASSAGSLGIKDAKSYKDWGKSLKYNPALIEFEILPIYELLRLSTAAEQLSSKLPHVKMAWEEY +ELPDDMGYMPCEIGVVEYSLQEGITREFHRFIQPGKPPLGYRYLCQSTSDNTHQIPIEGFELAEGDYHRLWTDLCKFTSPNGRDFPPLYVQVTHTSMCEWCLDWLSEMAGEYNRFHVYELDSLVKDLYEHGEGHAPSLSMIASILNTSVFDYEDGSSCEYHASKEVKYCALGAVKRFCFSISDSMAQVYDLQLTARHLPERPEN +FKFSASAKFKKLQDVSKSGKSKMFINKSYCFKYVAGISTSLKWDFTLGFQSSLGRLSDFKGLEKDSICKPFIYREDPKNENCQELGISDWMELFNTFGTHVATKIYLGGKIFTTLEIKKSQEKKLSDQGLDVRAILSAKIKDTDIDSNVEVSTIKSKNAGDFLLDTKKSTFVLGGDIYGHGKTIEFAEWARSVADHAMPIKAEFTPISHFIDKNLRDAYNKAYLYY +HPFNSSNYYRMLVERIEKGYSIIIDKKICSRYFVALKNVDSSKLDPFFINMLNDLEKNYKNININKYKCSVHSYKKNKYDQNCLRTITPWITFFNLYGTHLVSEVYYGGKIINILYSEYYNNIYNSEQVQIYKKRLNPFTSGSKLGSFYFGSIISKKQNSTNQKDNDNMLTYIKEKNTIYDGGEDIKEYKDGEGKVLMINGMEDEWEKTINGKYAKPIKLILKPFSDFIKTNDGKVAYYKALEYY +GRFRASVDYQNMQNDMASGTYQYIVSNSRCSVFQLDLIDSPTYHPQFSNDILLNLQQLALNQNNANNTEANAYYDFFDNWGTHVVTSVDLGSLFGYKFKMLKTDVQSMQNQGIDVSASATLFNVRGRTNTQLEQNSLNSFSQSIQSWTSYSIGATPDLNNDPANWATQTLTKPMPIKSSITPYHEALKIFTQGGNNILSSTQILQLYSKLRMY +FLGEIENRFDMSDDKSSKRTNEYISYDINNTLYRITLKGNVPLSEQFQEDLNSLDATTLFEKYGTHYLKSTWIGGRISFSTTIDTYGMTDDMRKKFAFVTKRKVGNWTGTSDVELTREEKDISEKMKSNSIVRVWGGDPKLGRDIERAIQGHTVSDIYQQWGQTVEERPYISDFDHGQGLVPIYELATGTRKEQLKEQWEAY +GKFSASSDYQEVQDGLNSANIQYIESQARCSIFQLDVYNSPSQNAQLTPQLQQALFTLAFNQTSQNDYYDFIDTWGTHVVTSVNLGSRFGYKYQMDKYQSNQLTQQGVNLSVSASYFSSSGSASGAYNQTQIQNFTQAMTSWSSYSIGATPDANQDPLSWAQQTLDTPMPINISILSFDDFLNKFSFSVNGLTSSQLNTVISNLSQY +SQSRMTHEVIESAQKIDSKYFKVVNTVELAQFKMRRNGLNPSDIFLRRMKDLPVYYNYLDYSFLIEDFGTHYFSSGSLGGQYEYVYRYSRADLSHSGLTEEEQKSCLSAEAKASFFSFSGSSSGSRCKENALSQRNSGSFTLSASESFSHVKGGSSESAGQLAFANGPNPQKYEAWIQDVKRNPAIISYEITPISELLVGIPYADIKRRNMEKALVEY +YYPTEDKYFICEIAIAAVSLKNGVEDVFHRIVKPGKLPLGYYGGALTHSKETHQMLELVQDEPYENNTREVFNEMTSFLKLWRGKGSDSIVYADEKTHEMITKVIDNFCQEFNYPDEIKVYNFQYLFFALRNSVAARTVWPTETYSSTELEKDLYSYTPDISCEFHEMSDISVYCSKSIVTRYCYTLCDHCCTDLNIQLVAGFHVPKNSRI +ISAEVKSKFSKESLDVKVGKEVYLTSSVSVPRLEFCINPLKVKLSDEFYSKLNNVETHGELIKVFKEYGEFYPKRYILGGMITNHETQKFTTIENLESKLLSLSAGVNAAIGPVKVGGSVGGESATDEKKSKQNEENSSKKDVIGGDPSKTGSEWVSSLSDINNWGIIGIDVYPIMDLIKKNDNTLYKKLEKIKNS +KTSTEAFVPAEIALIKYNLELGVLDKLHELINPVRLPLGLAHEALTYSEQTHELPTPPNAMGETDFYTVLQKILSFTDYNSKPHKKLAIMTDAKEVPVIESLLSQLNDDVKLEYQFLVIPLGEFFFHLKRATEKYGLDICTFPTKTVADILLKKDAYEYTSGIACDFHEKLGNQRFCALSKVVRWSYIISDNCCLDLSIDLIAGRHLPSNADT +GFFNAMFEFTGCWQKDASITKSLAFDGWCITLYTVALSKAHIILKDHVKQAVPSTWEPAALARFIKKFGTHIVVGVKMGGKDVIYLKQQHSSSLQAVDVQKRLKEMSDQRFLDANGHSDISLADSYAKDNKVEAREQRLRFVESNPLNSYSSNEELVMMPKRRGGRDKDIISHSEWLNTVQAEPDVISMSFIPITSLLNGVPGCGFLNHAINLY +SFSASTGYRDFAKEVSKKDTRTYMLKNYCMRYEAGVAQSNHLKWNVTLAFAAGVSQLPDVFDAHNPECACSAEQWRQDQNAEACTKTNVPIWISFIEQFGTHFLVRLFAGGKMTYQVTAKRSEVEKMRNMGIDVKTQLKMQLGGVSGGAGQGTSSKKNQSSSEYQMNVQKETLVIGGRPPGNVSDPAALAAWADTVEELPMPVKFEVQPLYHLLPVEKQEAFKQAVTFY diff --git a/problem1.sh b/problem1.sh new file mode 100644 index 0000000..78d55a0 --- /dev/null +++ b/problem1.sh @@ -0,0 +1,23 @@ +#!/usr/bin/env bash +################################################# + +for reffile in Exercise11_files/Problem1/*.ref + +do + + #../muscle3.8.31_i86darwin64 -in $reffile -out $reffile.aln + + #../hmmer-3.1b2-macosx-intel/binaries/hmmbuild $reffile.hmm $reffile.aln + + for fastafile in Exercise11_files/Problem1/*.fasta + + do + + ../hmmer-3.1b2-macosx-intel/binaries/hmmsearch --tblout $reffile.hits $reffile.hmm $fastafile + + + done + +done + +cat *.hits | grep -v "#" | awk '{print $1, $2}' >> results.txt diff --git a/problem2.py b/problem2.py new file mode 100644 index 0000000..ec6fb8d --- /dev/null +++ b/problem2.py @@ -0,0 +1,31 @@ +import re +import os + +current = os.getcwd() +os.chdir("./Exercise11_files/Problem2/") +inputFile = open("motifsort.fasta","r") +os.chdir(current) +motif1Output = open("motif1.txt","w") +motif2Output = open("motif2.txt","w") +noMotifOutput = open("noMotif.txt","w") + +motif1 = re.compile(r"AKKPRVZE") +motif2 = re.compile(r"AAQWWRNYGG") + +for ln in inputFile: + if ln.startswith(">"): + continue + ln.strip() + if re.search(motif1, ln) is not None: + motif1Output.write(ln) + continue + if re.search(motif2, ln) is not None: + motif2Output.write(ln) + continue + noMotifOutput.write(ln) + + +inputFile.close() +motif1Output.close() +motif2Output.close() +noMotifOutput.close() \ No newline at end of file diff --git a/resultsProblem1.txt b/resultsProblem1.txt new file mode 100644 index 0000000..fea2373 --- /dev/null +++ b/resultsProblem1.txt @@ -0,0 +1,24 @@ +4.9e-23 +1.4e-24 +1.1e-23 +9e-18 +5.8e-22 +6.4e-22 +5.4e-22 +2.8e-22 + +5.9e-35 + + + + + + + +1.8e-06 + +3.5e-09 +2e-09 + +------ +