Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
55 changes: 55 additions & 0 deletions bioinformaticsProject/computingproject.sh
Original file line number Diff line number Diff line change
@@ -0,0 +1,55 @@
# Determine which isolated colonies of methanogens are the best candidates for growth experiments based on the presence of the McrA gene and multiple copies of the HSP70 gene.
# Usage: bash computingproject.sh
# Enter remote crc terminal
# Be sure to have hmmsearch, hmmbuild, and muscle in the same working directory

# Build one profile HMM per gene (hsp70 and mcrA) from the reference sequences.
# For each gene:
#   1. combine the reference .fasta files into <gene>ref.fasta
#   2. align them with muscle, producing <gene>ref.afasta
#   3. feed the alignment to hmmbuild, producing <gene>hmm.txt
for gene in hsp mcrA
do
    combined="${gene}ref.fasta"

    # Start from an empty file: appending would duplicate every sequence on a re-run.
    : > "$combined"
    for ref in "$gene"*.fasta
    do
        # The glob also matches the combined file itself; never feed it back in.
        [ "$ref" = "$combined" ] && continue
        # An unmatched glob is left as literal text; skip it.
        [ -e "$ref" ] || continue
        cat "$ref" >> "$combined"
    done

    # Without reference sequences there is nothing to align or build.
    if [ ! -s "$combined" ]
    then
        echo "No reference sequences found for $gene (${gene}*.fasta)" >&2
        exit 1
    fi

    # Stop at the first failing step instead of building on missing output.
    ./muscle -in "$combined" -out "${gene}ref.afasta" || exit 1
    ./hmmbuild "${gene}hmm.txt" "${gene}ref.afasta" || exit 1
done

# Use hmmsearch to search every proteome against both profile HMMs.
# For each proteome file this writes two tabular result files:
#   hspmatch<proteome file>.txt and mcrAmatch<proteome file>.txt
for file in proteome*.fasta
do
    # If nothing matches, the pattern is left as literal text; do not search it.
    [ -e "$file" ] || continue
    ./hmmsearch --tblout "hspmatch$file.txt" hsphmm.txt "$file"
    ./hmmsearch --tblout "mcrAmatch$file.txt" mcrAhmm.txt "$file"
done

# Interpret results:

# Generate a text file with the names of candidate pH-resistant methanogens based on tabular hmmsearch results.

# tally_hits PREFIX OUTFILE
# Write one "<table name> <hit count>" line to OUTFILE for every hmmsearch table
# named PREFIXproteome*.txt in the current directory. A hit is a table line
# containing "WP_" (presumably the accession prefix of the proteome sequences).
# OUTFILE is rebuilt from scratch so re-running the script does not duplicate lines.
tally_hits() {
    local prefix=$1 outfile=$2 table
    : > "$outfile"
    for table in "$prefix"proteome*.txt
    do
        # An unmatched glob is left as literal text; skip it.
        [ -e "$table" ] || continue
        printf '%s %s\n' "$table" "$(grep -c "WP_" "$table")" >> "$outfile"
    done
}

# pick_candidates
# Summarise the hmmsearch tables in the current directory. Writes:
#   hspresults.txt   - hsp70 hit count per proteome table
#   mcrAresults.txt  - mcrA hit count per proteome table
#   results.txt      - tables with at least 2 hsp70 hits, then tables with at least 1 mcrA hit
#   finalresults.txt - proteome numbers that satisfy both criteria
pick_candidates() {
    # hsp: keep proteomes with two or more hits. The count is compared as a
    # number so that values such as 10 or 20 are not lost.
    tally_hits hspmatch hspresults.txt
    awk '$NF >= 2' hspresults.txt > results.txt

    # mcrA: keep proteomes with at least one hit.
    tally_hits mcrAmatch mcrAresults.txt
    awk '$NF >= 1' mcrAresults.txt >> results.txt

    # Generate final answer: the proteome number is the text between the first
    # "_" and the first "."; a number listed twice passed both filters.
    cut -d _ -f 2 results.txt | cut -d . -f 1 | sort | uniq -d > finalresults.txt
}

pick_candidates

# Rationale: The final results file lists the best 8 isolated candidate colonies because of the presence of the McrA gene to produce methane and the presence of two or greater HSP70 genes to confer pH resistance.

# TODO: generate a summary table of best candidate results with proteome_number, number_of_mcrA_genes, number_of_HSP70_genes (not implemented yet)
54 changes: 54 additions & 0 deletions bioinformaticsProject/computingproject1.sh
Original file line number Diff line number Diff line change
@@ -0,0 +1,54 @@

# Determine which isolated colonies of methanogens are the best candidates for growth experiments based on the presence of the McrA gene and multiple copies of the HSP70 gene.
# Usage: bash computingproject1.sh
# Enter remote crc terminal
# Be sure to have hmmsearch, hmmbuild, and muscle in the same working directory

# Build one profile HMM per gene (hsp70 and mcrA) from the reference sequences.
# For each gene:
#   1. combine the reference .fasta files into <gene>ref.fasta
#   2. align them with muscle, producing <gene>ref.afasta
#   3. feed the alignment to hmmbuild, producing <gene>hmm.txt
for gene in hsp mcrA
do
    combined="${gene}ref.fasta"

    # Start from an empty file: appending would duplicate every sequence on a re-run.
    : > "$combined"
    for ref in "$gene"*.fasta
    do
        # The glob also matches the combined file itself; never feed it back in.
        [ "$ref" = "$combined" ] && continue
        # An unmatched glob is left as literal text; skip it.
        [ -e "$ref" ] || continue
        cat "$ref" >> "$combined"
    done

    # Without reference sequences there is nothing to align or build.
    if [ ! -s "$combined" ]
    then
        echo "No reference sequences found for $gene (${gene}*.fasta)" >&2
        exit 1
    fi

    # Stop at the first failing step instead of building on missing output.
    ./muscle -in "$combined" -out "${gene}ref.afasta" || exit 1
    ./hmmbuild "${gene}hmm.txt" "${gene}ref.afasta" || exit 1
done

# Use hmmsearch to search every proteome against both profile HMMs (hsp70 and mcrA).
# For each proteome file this writes two tabular result files:
#   hspmatch<proteome file>.txt and mcrAmatch<proteome file>.txt
for file in proteome*.fasta
do
    # If nothing matches, the pattern is left as literal text; do not search it.
    [ -e "$file" ] || continue
    ./hmmsearch --tblout "hspmatch$file.txt" hsphmm.txt "$file"
    ./hmmsearch --tblout "mcrAmatch$file.txt" mcrAhmm.txt "$file"
done


# Interpret results:

# Generate a text file with the names of candidate pH-resistant methanogens based on tabular hmmsearch results.

# tally_hits PREFIX OUTFILE
# Write one "<table name> <hit count>" line to OUTFILE for every hmmsearch table
# named PREFIXproteome*.txt in the current directory. A hit is a table line
# containing "WP_" (presumably the accession prefix of the proteome sequences).
# OUTFILE is rebuilt from scratch so re-running the script does not duplicate lines.
tally_hits() {
    local prefix=$1 outfile=$2 table
    : > "$outfile"
    for table in "$prefix"proteome*.txt
    do
        # An unmatched glob is left as literal text; skip it.
        [ -e "$table" ] || continue
        printf '%s %s\n' "$table" "$(grep -c "WP_" "$table")" >> "$outfile"
    done
}

# pick_candidates
# Summarise the hmmsearch tables in the current directory. Writes:
#   hspresults.txt   - hsp70 hit count per proteome table
#   mcrAresults.txt  - mcrA hit count per proteome table
#   results.txt      - tables with at least 2 hsp70 hits, then tables with at least 1 mcrA hit
#   finalresults.txt - proteome numbers that satisfy both criteria
pick_candidates() {
    # hsp: keep proteomes with two or more hits. The count is compared as a
    # number so that values such as 10 or 20 are not lost.
    tally_hits hspmatch hspresults.txt
    awk '$NF >= 2' hspresults.txt > results.txt

    # mcrA: keep proteomes with at least one hit.
    tally_hits mcrAmatch mcrAresults.txt
    awk '$NF >= 1' mcrAresults.txt >> results.txt

    # Generate final answer: the proteome number is the text between the first
    # "_" and the first "."; a number listed twice passed both filters.
    cut -d _ -f 2 results.txt | cut -d . -f 1 | sort | uniq -d > finalresults.txt
}

pick_candidates

# Rationale: The final results file lists the best 8 isolated candidate colonies because of the presence of the McrA gene to produce methane and the presence of two or greater HSP70 genes to confer pH resistance.

# TODO: generate a summary table of best candidate results with proteome_number, number_of_mcrA_genes, number_of_HSP70_genes (not implemented yet)

Binary file added bioinformaticsProject/hmmbuild
Binary file not shown.
Binary file added bioinformaticsProject/hmmsearch
Binary file not shown.
2 changes: 2 additions & 0 deletions bioinformaticsProject/hsp70gene_01.fasta
Original file line number Diff line number Diff line change
@@ -0,0 +1,2 @@
>sp|Q9UXR0.1|DNAK_METTE RecName: Full=Chaperone protein DnaK; AltName: Full=HSP
MGKILGIDLGTTNSCMAVMEGGEAVVIPNAEGARTTPSVVGFSKKGEKLVGQVAKRQAISNPENTVYSIKRHMGEPNYKVTLQGKHNTPQEISAMILQKLKADAEAYLGEEIKQAVITVPAYFNDAQRQATKDAGTIAGLEVLRIINEPTAASLAYGLDKGEVEQTILVYDLGGGTFDVSILEIGGGVFEVKATSGDTHLGGDDFDQRIVNYLLAEFKKTEGIDLSKDRAVLQRLTDAAEKAKIELSGVASTNINLPFLTVGPDGEPKHLDIDLTRAQFQKMTEDLLEKTLVSMRQALSDAKLTPNDIDKVILIGGATRMPAVVELVENFTGKKPYKNINPDEAVAIGAAIQAGVLGGEVKDILLLDVTPLTLGIETLGGIATPLIPRNTTIPTRKSQIFSTAADNQPSVEIHVLQGERGIASENKTLGRFTLDGIPPAPRGVPQIEVTFDIDANGILHVSAKDLGTGREQSISIQKPGGLTDAEIERMIKDAELHAEEDRKRKEEVETRNNAETLINAAEKTLKEAGDVATEDQKSKVNAAIDDLKKALEGKDAEEIKAKTEALQEAIYPISTAMYQKAAQQAQQAAGGAAGRTDAKGPEETVVDAIMR
2 changes: 2 additions & 0 deletions bioinformaticsProject/hsp70gene_02.fasta
Original file line number Diff line number Diff line change
@@ -0,0 +1,2 @@
>sp|Q8TQR2.1|DNAK_METAC RecName: Full=Chaperone protein DnaK; AltName: Full=HSP
MAKILGIDLGTTNSCMAVMEGGDAVVLPNAEGSRTTPSVVGFSKKGEKLVGQVAKRQAISNPENTVYSIKRHMGEANYKVTLNGKTYTPQEISAMILQKLKTEAEAYLGETIKQAVITVPAYFNDAQRQATKDAGSIAGLEVLRIINEPTAASLAYGLDKGDVDQKILVYDLGGGTFDVSILELGGGVFEVKSTSGDTHLGGDDFDQRVIDHLLAEFKKTEGIDLSKDKAILQRLKDAAEKAKIELSGVTVTNINLPFLTVGPDGEPKHMDIDLTRAQFQKMTEDLLEKTLVSMRRALSDSKLTPNDLDKVILVGGATRMPAVVELVENFTGKKPYKNINPDEAVAIGAAIQAGVLGGEVKDVLLLDVTPLTLGIETLGGIATPLIQRNTTIPTKKSQIFSTAADNQPSVEIHVLQGERGIASENKTLGRFTLDGIPPAPRGIPQIEVAFDIDANGILHVNAKDLGTGKEQSISIQKPGGLSDAEIERMVKDAELHAEEDKKRKEEVETRNNAEALINAAEKTIKEAGDVATEDQKSKVNAAIEDLKKALEGKDTEEVKAKTEALQEAVYPISTAMYQKAQQEAQQASGEAGSADARGPDETVVDADYEVVDDEKRK
2 changes: 2 additions & 0 deletions bioinformaticsProject/hsp70gene_03.fasta
Original file line number Diff line number Diff line change
@@ -0,0 +1,2 @@
>sp|Q01100.2|DNAK_HALMA RecName: Full=Chaperone protein DnaK; AltName: Full=HSP
MASNKILGIDLGTTNSAFAVMEGGDPEIIVNGEGERTTPSVVAFDDGERLVGKPAKNQAVKNPDETIQSIKRHMGEDDYSVELDGEEYTPEQVSAMILQKIKHDAEEYLGDEIEKAVITVPAYFNDRQRQATKDAGEIAGFEVERIVNEPTAAAMAYGLDDESDQTVLVYDLGGGTFDVSILDLGGGVYEVVATNGDNDLGGDDWDHAIIDYLADEFEAEHGIDLRDDRQALQRLTEAAEEAKIELSSRKETRINLPFIATTDDGPLDLEQKITRAKFESLTEDLIERTVGPTEQALADADYTKSDIDEVILVGGSTRMPQVQDQVEEMTGQEPKKNVNPDEAVALGAAIQAGVLSGDVDDIVLLDVTPLSLGVEVKGGLFERLIDKNTTIPTEESKIFTTAQDNQTQVQIRVFQGEREIAEENELLGAFALSGIPPAPAGTPQIEVSFNIDENGIVNVEAEDKGSGNKEDITIEGGAGLSDDQIEEMQQEAEQHAEEDEQRRERIEARNEAEASVRRAETLLDENEEEIDEDLQSDIEAKIEDVEEVLEDEDATKEDYEAVTETLSEELQEIGKQMYQDQAQQAAGGAAGAGPGGAAGPGGAAGPGGAAGGAAEQGEEYVDADFEDVEESDEDE
2 changes: 2 additions & 0 deletions bioinformaticsProject/hsp70gene_04.fasta
Original file line number Diff line number Diff line change
@@ -0,0 +1,2 @@
>sp|P50023.2|DNAK_THEAC RecName: Full=Chaperone protein DnaK; AltName: Full=HSP
MSKIIGIDLGTSNSAAAVVISGKPTVIPSSEGVSIGGKAFPSYVAFTKDGQMLVGEPARRQALLNPEGTIFAAKRKMGTDYKFKVFDKEFTPQQISAFILQKIKKDAEAFLGEPVNEAVITVPAYFNDNQRQATKDAGTIAGFDVKRIINEPTAAALAYGVDKSGKSEKILVFDLGGGTLDVTIMDFGDGVFQVLSTSGDTRLGGTDMDEAIVNYIADDFQKKEGIDLRKDRSAYIRLRDAAEKAKIELSTTLSTDIDLPYITVTNSGPKHIKMTLTRAKLEELISPIVERVKGPIDKALEGAKLKKTEITKLLFVGGPTRIPYVRKYVEDYLGIKAEGGVDPMEAVAIGAAIQGAVLKGEIKDIVLLDVTPLTLSVETLGGIATPIIPANTTIPVRKSQIFTTAEDMQTTVTIHVVQGERPLAKDNVSLGMFNLTGIAPAPRGVPQIEVTFDIDSNGILNVTAVDKATGKKQGITITASTKLSKEEIERMKKEAEQYAEQDRKAKEQIELLNNAESLAYSVEKTLNDAGDKVDKETKERLTNEVKDLRKAIEEKNTENVKTLMDKLSKDIQEVGAKMYQQASANTQQSAQSNSQNSGSSDGKTVDAEYKEKS
2 changes: 2 additions & 0 deletions bioinformaticsProject/hsp70gene_05.fasta
Original file line number Diff line number Diff line change
@@ -0,0 +1,2 @@
>sp|Q97BG8.1|DNAK_THEVO RecName: Full=Chaperone protein DnaK; AltName: Full=HSP
MSKIIGIDLGTSNSAAAVVISGKPTVIPSSEGVSIGGKAFPSYVAFTKDGQMLVGEPARRQALLNPEGTIFAAKRKMGTDYKFKVFDKEFTPQQISAFILQKIKKDAEAFLGEPVNEAVITVPAYFNDNQRQATKDAGTIAGFDVKRIINEPTAAALAYGVDKSGKSEKILVFDLGGGTLDVTIIEISKRPNVQVLSTSGDTQLGGTDMDEAIVNYIADDFQKKEGIDLRKDRGAYIRLRDAAEKAKIELSTTLSSDIDLPYITVTSSGPKHIKMTLTRAKLEELISPIVERVKAPIDKALEGAKLKKTDITKLLFVGGPTRIPYVRKYVEDYLGIKAEGGVDPMEAVAIGAAIQGAVLKGEIKDIVLLDVTPLTLSVETLGGIATPIIPANTTIPVRKSQVFTTAEDMQTTVTIHVVQGERPLAKDNVSLGMFNLTGIAPAPRGIPQIEVTFDIDSNGILNVTAVDKATGKKQGITITASTKLSKDEIERMKKEAEQYAEQDRKMKEQIETLNNAESLAYSVEKTLNEAGDKVDKETKDRILSEVKDLRKAIEEKNMDNVKTLMEKISKDIQEVGTKMYQSASSTTQTGSGNQNSSKQENDKTVDAEYKEKS
2 changes: 2 additions & 0 deletions bioinformaticsProject/hsp70gene_06.fasta
Original file line number Diff line number Diff line change
@@ -0,0 +1,2 @@
>sp|O27351.1|DNAK_METTH RecName: Full=Chaperone protein DnaK; AltName: Full=HSP
MAKKEKILGIDLGTSNSAAAVLIGGKPTIIPSAEGASQYGKSFPSCVAFTEDGQMLVGEPARRQAVTNPENTITAIKRSMGTDRKVKVHGKEYTPQEISAFILQKIKKDAEAFLGEEIKKAVITVPAYFDDNQRTATKDAGTIAGLDVVRLVNEPTAASLAYGLDKEDEDMVIMVFDLGGGTLDVTIMEFGGGVFEVRSTSGDTQLGGTDMDNAIMNYLAEEFKMETGIDLMEDDQAVQRLREAAEKAKIELSTTLTTEVNLPYITVAQDGPKHLIKTITRAKLEELVDPIVQKCAGPMEQALRDAGMTREDVDKIILVGGPTRMPIVQKFVEDFIGKPVERGIDPMECVAMGAAIQGGVLAGEIKDLVLLDVTPLSLGIETLGGVFTKLIERNTTIPTRKSQIFSTAADNQTSVDIHVLQGERPMAADNTSLGRFQLVGIPPAPRGVPQIEVTFDIDANGILNVSAKDLGTGKEQAITITAPNKLSEEEIKQKIEEAKKHAEEDRRKQEEIEIRNNADSMIYTAEKTLDELGDKVPAEKKEEVEKQVRELRELIAGDDIQAIKSKTEELTKTVQEIGVSYIPAGSTATSSTAAGR
2 changes: 2 additions & 0 deletions bioinformaticsProject/hsp70gene_07.fasta
Original file line number Diff line number Diff line change
@@ -0,0 +1,2 @@
>sp|A9A135.1|DNAK_NITMS RecName: Full=Chaperone protein DnaK; AltName: Full=HSP
MGKVIGIDLGTSNSAAAVMMGGKPTIIPAAEGQTAAGKAFPSVVAFSKEGELLVGEPARRQAVTNPDNTIIAAKRKMGSDYTFKIQDKEYKPQQISSFILQKIKKDAEAFVGETVEKAVITVPAYFDDNQRQATKDAGTIAGLDVVRIINEPTAASLAFGLDKAKEDMKILVFDFGGGTLDVTIMEMGGGVFEVMSTSGDTQLGGTDMDKVLIDYIVDEFKKKEGVDLSQDTTAMTRIREAAEKAKIELSTVMETDVNLPFIAHDPSSGAKNLELRLTRSKLDELIGPIVDRCKPSIQKALEDAKLSNSDINKIVMIGGPTRIPLVKKFVSEVIGKEVESGVDPMEAVAMGAAIQAGIIAGDVTSDIVLLDVTPLTLGIETLGGVREPLIERNTTIPTSKGKVFTTAADNQTAVTIHVVQGERPMATDNVSLGSFNLTDLPPAPRGVPQIEVKFDIDANGIINVTAKDLGTQKEAKITIETKTKLSEEEIEKLKEDAEKFSEEDKKKKEKIDLKNEAESYIYTTEKLVNHDLKDKISQEQGIKITDAVKEVKEVLDKEPEELKPKLEALQSIVNEVTTELYKNAAPPPGADGQQGADGQQGADGQQGADGQQGADGQQGADGQTTESSSNDETKTN
2 changes: 2 additions & 0 deletions bioinformaticsProject/hsp70gene_08.fasta
Original file line number Diff line number Diff line change
@@ -0,0 +1,2 @@
>sp|Q6L0S7.1|DNAK_PICTO RecName: Full=Chaperone protein DnaK; AltName: Full=HSP
MSKIIGIDLGTSNSAAAVVISGKPTVIPAAEGVSLGGKAFPSYVAFTKDGQLLVGEPARRQALLNPEGTVYAAKRKMGTDYKYKIFGKEYTPQQISAFILQKIKRDAEAFLGEPVTDAVITVPAYFNDNQRQATKDAGAIAGLNVRRIINEPTAACLAYGIDKLNQTLKIVIYDLGGGTLDVTIMDFGQGVFQVLSTSGDTHLGGTDMDEAIVNFLADNFQRENGIDLRKDHSAYIRLRDAAEKAKIELSTVLETEINLPYITATQDGPKHLQYTLTRAKFEELIAPIVDRSKVPLDTALEGAKLKKGDIDKIILIGGPTRIPYVRKYVEDYFGRKAEGGVDPMEAVAMGAAIQGAVLAGEVKDIVLLDVTPLTLGIETLGGVMTPLIPANTTIPTKKSQIFTTAADMQTTVTIHVVQGERPLAKDDVSLGMFNLDGIPPAPRGVPQIEVTFDIDANGILNVSAKDLGTGKQQSISITATNKLSKDEIERMKKEAEQYAEQDKKAKEEIETINNAETLAYTAEKTINDAGDKIDESSKESVRSIVKDLRDAISSKDINKIKELSEKLTKEIQEIGTKMYQSQATQGTSQNSSQNNNSQNNNGDTVDADFKESK
2 changes: 2 additions & 0 deletions bioinformaticsProject/hsp70gene_09.fasta
Original file line number Diff line number Diff line change
@@ -0,0 +1,2 @@
>sp|A0RZ01.1|DNAK_CENSY RecName: Full=Chaperone protein DnaK; AltName: Full=HSP
MAKVIGIDLGTSNSAAAVVMGGKPTIIPAAEGATVGGKAFPSVVAFSKDGDLLVGEPARRQAVTNPENTIMAAKRKMGSEHIFKAGGKDYKPQQISSFILQKIKKDAEAFVGEPVGQAVITVPAYFDDNQRQATKDAGTIAGLDVVRIINEPTAASLAFGLDKSKQDMKILVFDFGGGTLDVTVMEMGGGVFEVMSTSGDTQLGGTDMDKAIIDYIVDDFRKREGVDLSQDSTALTRVREAAEKAKIELSTVMETDVNLPFISHDSSGPKNLELRLTRAKLEELVGPIIDRCRPSIEKALADAKVSPSDIAKIVMVGGPTRMPAVKKFVSSVTGKESESGVDPMEAVAMGAAIQAGIIAGDVTSDIVLLDVTPLTLGIDTLGGVREPLIERNTTIPTSKSKVFTTAVDNQTAVTIHVVQGERPMTSDNVSLGSFNLTDLPPAPRGIPQIEVKFDIDANGIINVTAKDLGTQKEAKITIESSSKLSKDEIEKLREDAEKFSDEDEKKKGKVELKNEAESFVYTAEKLINHDLKDKITQEQGIKISDGIREVKEALDQDPDILRPKLDSLKAMVNEITTEMYQQAAAQGAAGGAAGGAAGGAAGGAAGDAAGAAGDSTGDAAGAAGGPSEGPAGDAGAGESAGPEPGDDGQPKPGPAA
2 changes: 2 additions & 0 deletions bioinformaticsProject/hsp70gene_10.fasta
Original file line number Diff line number Diff line change
@@ -0,0 +1,2 @@
>sp|P0CW12.1|DNAK_METMZ RecName: Full=Chaperone protein DnaK; AltName: Full=HSP
MAKILGIDLGTTNSCVAVMEGGEAVVIPNAEGSRTTPSVVGFSKKGEKLVGQVAKRQAISNPDNTVYSIKRHMGEANYKVTLNGKDYTPQEISAMILQKLKADAEAYLGETIKQAVITVPAYFNDSQRQATKDAGAIAGLEVLRIINEPTAASLAYGLDKGDIDQKILVYDLGGGTFDVSILELGGGVFEVKSTSGDTHLGGDDFDQRVIDYLLAEFKKSEGIDLSKDKAVLQRLKDAAEKAKIELSGVANTNINLPFLTVGTDGEPKHMDIDLTRAQFQKMTEDLLEKTLVSMRRALSDAKLTPNDLDKVILVGGATRMPAVVELVENFTGKKPYKNINPDEAVAIGAAIQAGVLGGEVKDVLLLDVTPLTLGIETLGGIATPLIQRNTTIPTKKSQIFSTAADNQPSVEIHVLQGERGIASENKTLGRFILDGIPPAPRGIPQIEVTFDIDANGILHVSAKDLGTGKQQSISIQKPGGLSDDEIERMVKDAEMHAEEDRKRKEEVEIRNNAEALINAAEKTIKEAGDLATEDQKSKVNAAIEDLKKALEGKDAEDIKAKTEALQESVYPISTAMYQKAQQAQQAAGGEGGAAGTDARGPDETVVDADYEVVDDEKRK
2 changes: 2 additions & 0 deletions bioinformaticsProject/hsp70gene_11.fasta
Original file line number Diff line number Diff line change
@@ -0,0 +1,2 @@
>sp|P0CW13.1|DNAK_METMA RecName: Full=Chaperone protein DnaK; AltName: Full=HSP
MAKILGIDLGTTNSCVAVMEGGEAVVIPNAEGSRTTPSVVGFSKKGEKLVGQVAKRQAISNPDNTVYSIKRHMGEANYKVTLNGKDYTPQEISAMILQKLKADAEAYLGETIKQAVITVPAYFNDSQRQATKDAGAIAGLEVLRIINEPTAASLAYGLDKGDIDQKILVYDLGGGTFDVSILELGGGVFEVKSTSGDTHLGGDDFDQRVIDYLLAEFKKSEGIDLSKDKAVLQRLKDAAEKAKIELSGVANTNINLPFLTVGTDGEPKHMDIDLTRAQFQKMTEDLLEKTLVSMRRALSDAKLTPNDLDKVILVGGATRMPAVVELVENFTGKKPYKNINPDEAVAIGAAIQAGVLGGEVKDVLLLDVTPLTLGIETLGGIATPLIQRNTTIPTKKSQIFSTAADNQPSVEIHVLQGERGIASENKTLGRFILDGIPPAPRGIPQIEVTFDIDANGILHVSAKDLGTGKQQSISIQKPGGLSDDEIERMVKDAEMHAEEDRKRKEEVEIRNNAEALINAAEKTIKEAGDLATEDQKSKVNAAIEDLKKALEGKDAEDIKAKTEALQESVYPISTAMYQKAQQAQQAAGGEGGAAGTDARGPDETVVDADYEVVDDEKRK
2 changes: 2 additions & 0 deletions bioinformaticsProject/hsp70gene_12.fasta
Original file line number Diff line number Diff line change
@@ -0,0 +1,2 @@
>sp|A0B747.1|DNAK_METTP RecName: Full=Chaperone protein DnaK; AltName: Full=HSP
MSKIIGIDLGTSNSAAAVLIGGRPTIIPSAEGTSLGGKAFPSYVAFTKDGQVLVGEPARRQAITNPEGTITGIKRKMGTDYKVKVFGKEYTPEEISAHILRKIKQDAEAFLGEKVEKAVITVPAYFNDNQRQATKDAGTIAGLDVVRIINEPTAAALAYGLDKGGEQKIMVFDLGGGTLDVTIMEMGEGVFEVKSTSGDTQLGGRDMDERLLDYIVEKFRQETGINLRNDVMAMQRLREAAEVAKIELSSMLQTTINLPYITADASGPKHLNMTITRAKLEELIQDVLERCRGPMEQALSDAKLSKSDIDKIILVGGPTRMPAVQEFVKRVMGKDVERGVDPMECVAMGAAIQAGVLAGEVKDILLLDVTPLSLGVETLGGIMTRLIERNTTIPTRKSQIFTTAADNQTSVEIHVLQGERPLAKDNISLGRFTLVGIPPAPRGIPQIEVTFDIDANGILHVSAKDLATKKEQRITITAPHRLSKEEIEQKVKEAERYAQEDARRREEIETRNQADNLIYTTEKMLKEAGDVATSEQRERIEKAISELRDALSGKDVQEIKSKMEKLQNAVYELSAAMYQRAAQSQSGSATGSASGSTSGGKTVEADYEVVNDDKR
2 changes: 2 additions & 0 deletions bioinformaticsProject/hsp70gene_13.fasta
Original file line number Diff line number Diff line change
@@ -0,0 +1,2 @@
>sp|Q465Y6.1|DNAK_METBF RecName: Full=Chaperone protein DnaK; AltName: Full=HSP
MAKILGIDLGTTNSCMAVMEGGEAVVIPNAEGARTTPSVVGFSKKGEKLVGQVAKRQAISNPENTVYSIKRHMGDANYTVTLQGTQYKPQEISAMILQKLKTDAEAYLGETIKQAVITVPAYFNDAQRQATKDAGAIAGLDVLRIINEPTSASLAYGLDKGDIEQKILVYDLGGGTFDVSILELGGGVFEVKSTSGDTRLGGDDFDQRIVNYLLAEFRKIEGIDLSKDKAVLQRLTDAAEKAKIELSGVASTNINLPFLTVGADGEPKHLDIDLTRAQFQKMTEDLLEKTLVSMRQALSDAKLTPNDLDKVILVGGATRMPAVVELVENFTGKKPYKNINPDEAVAIGAAIQAGVLGGEVKDVLLLDVTPLTLGIETLGGIATPLIPRNTTIPTKKSQVFSTAADNQPSVEIHVLQGERGVASENKTLGRFTLDGIPPAPRGIPQIEVTFDIDANGILHVGAKDLGTGKEQSISIQKPGGLSDDEIDRMVKDAELHAEEDKKRKEDVETRNNAEALINAAEKTLKEAGDAATEDQKSKVTAAIDDLKKALEGKDSEDIKSKTEALQEAVYPISTAMYQKAQQQAQQAQQAEGEAGSHDAQGPDETVVDADYEVVDDEKRK
2 changes: 2 additions & 0 deletions bioinformaticsProject/hsp70gene_14.fasta
Original file line number Diff line number Diff line change
@@ -0,0 +1,2 @@
>sp|Q9HHB9.1|DNAK_HALMT RecName: Full=Chaperone protein DnaK; AltName: Full=HSP
MASNKILGIDLGTTNSAFAVMEGGDPEIIVNAEGDRTTPSVVAFTDDGERLVGKPAKNQAIQNPEHTIRSIKRHMGDDGYTVDIEGEEYTPEQISAMILQKIKRDAEDYLGDEVEKAVITVPAYFNDKQRQATKDAGEIAGLEVERIVNEPTAASMAYGLDDESNQTVLVYDLGGGTFDVSVLDLGGGVYEVVATNGDNELGGDDWDEAIIDWLATEFKNDHGIDLREDRQALQRLKDAAEEAKIELSSRKETTINLPFITATDSGPVHLEYDLTRAKFESLTKDLIDRTVEPTEQALEDAGYGKDDIDDVILVGGSTRMPQVLDKVEEILGSEPKKSVNPDEAVALGAAIQGGVLGGEVDDIVLLDVTPLSLGIEVKGGLFERLIEKNTTIPTEESKIFTTAADNQTTVQVRVFQGEREMAEDNELLGEFTLSGIPPAPAGTPQIEVGFNIDENGIVNVSAEDKGSGNAESITIEGGAGLSDDEIDRMQREAEQHAEEDKERRRAVEARNEAEGAVQRAETLLEENEENVDDELRADIEAAIEDVEAVLEDDDASTDELEDVTEDLSKELQEIGKRMYQQQAQAQAGGPGGAGGPGGADGPGADADPEDFVDADADFDDEDDDE
2 changes: 2 additions & 0 deletions bioinformaticsProject/hsp70gene_15.fasta
Original file line number Diff line number Diff line change
@@ -0,0 +1,2 @@
>sp|Q9HRY2.1|DNAK_HALSA RecName: Full=Chaperone protein DnaK; AltName: Full=HSP
MASEKILGVDLGTTNSAFAVMEGSDPEIITNEEGDRTTPSIVAHDDGELLVGKPAKNQAVQNPDQTIASIKRHMGEEDYTVALGDDEYTPEEISARILQKIKRDAEEYLGQDVEKAVITVPAYFNDRQRQATKDAGEIAGFDVERIVNEPTAASMAYGLDEDRDQTVLVYDLGGGTFDVSILDLGGGVYEVAATNGDNDLGGDDWDHAIIDHLADNFENEHGIDLREDRQALQRLTEAAEEAKIELSSRKETTVNLPFVTATDSGPVHLEQDITRATFESITEDLIERTVGPTEQALEDAGLSKSDIDDVILVGGSTRMPQVQAQVEDLVGQEPKKNVNPDEAVALGAAVQGGVLSGEVDDIVLVDVTPLSLGIEVKGGLFERLIEKNTAIPTTASKVFTTAADNQTSVQIRVFQGEREIASENELLGDFHLTGIPPAPAGTPQIEVTFEIDADGIVNVEAEDQGSGNAESITIEGGAGLSDEQIDEMQEDAEAHAEEDEQRRRRIEARNEAETAIQRAESLLEENEELVDEDLEADVNDAIDDVQAVLDEDEPEIDALETATEELSDTLQEIGKQAYQQQQDAQAGAAGGAGGMGGMGGMADGPGGAADADGDDEEYVDADFEDVDEE
2 changes: 2 additions & 0 deletions bioinformaticsProject/hsp70gene_16.fasta
Original file line number Diff line number Diff line change
@@ -0,0 +1,2 @@
>sp|Q18GZ4.1|DNAK_HALWD RecName: Full=Chaperone protein DnaK; AltName: Full=HSP
MASNKILGIDLGTTNSAFAVMEGDDPEIIVNAEGDRTTPSVVAMTDDEERLVGKPAKNQVIQNPDQTIRSIKRHMGEEDYTVELGGEDYTPEQVSAMILQKIKRDAEEYLGDEIEKAVITVPAYFNDRQRQATKDAGEIAGFEVDRIVNEPTAASMAYGLDDESNQTILVYDLGGGTFDVSVLDLGGGVYEVVATNGDNDLGGDDWDDAVIDWLAGEFEDNHGIDLRDDRQALQRLKDAAEEAKIELSSRKETTINLPFITATDSGPVHLEETLSRAKFESLTEDLIERTVGPTEQALEDAGYDDSDIDEVILVGGSTRMPQVREKVEDLLGTEPKKNVNPDEAVALGAAIQGGVLAGDVDDIVLLDVTPLSLGIEVKGGLFERLIDKNTTIPTEESKVFTTAAANQTSVNVRVFQGEREIAEENELLGEFQLAGIPPAPAGTPQIEVTFNIDENGIVNVEAEDQGSGNAESITIEGGAGLSDEEIEQMQEEAEAHAEEDERRRERIEARNSAESAVQRAETLLEENEEDIDDDLKESIEDEVESVEAVLEDEDATKEEIEDVTESLSSELQEIGKQMYDAQQAAAGAGAGAAGAGAGAGPGGMGDMGDMGDMGGAAGSGDADNEYVDADFEDVDDDTKDE
2 changes: 2 additions & 0 deletions bioinformaticsProject/hsp70gene_17.fasta
Original file line number Diff line number Diff line change
@@ -0,0 +1,2 @@
>sp|Q12WE6.1|DNAK_METBU RecName: Full=Chaperone protein DnaK; AltName: Full=HSP
MGKILGIDLGTTNSCMAVIEGGKPTVIPNAEGGRTTPSVVGFSKKGDKLVGQVAKRQMIANPGNSVSSIKRHIGEGDYKVNLSGKDYTPQEVSAMILRKLKDDAEAYLGETITQTVITVPAYFNDSQRQATKDAGQIAGLEVLRIINEPTAASLAYGLDKEEGDHKILVYDLGGGTFDVSILELGDGVFEVLSTSGNTHLGGDDFDQRITEFLVEEFKKAEGIDLSNDKAALQRLNDAAEKAKIELSGVASTNVNLPFITADSNGQPKHIDIDITRAQFEKMTEDLVAKTLESMKMALSDAKLTTKDIDRVLLIGGSTRTPAVYNLVKNFIGKDPYKNINPDEAVAVGAAIQAGVLSGEVHDVLLLDVTPLTMGIETLGGVATPLIERNTTIPVKKSQIFSTAADSQPSVEIHILQGERGIASANKTLGRFVLDGIPPAPRGLPQIEVTFDIDSNGILHVNAKDLGTGKEQSISIQKPGGLSDEEIERMVKDAELHAEEDKARKEEVETRNNADSLVNAAENTLKEAGDVATNEQKEQIEAAIADLKTALEGEDLEAIKSKTEALQESVYKVSAAMYEKAQKEASAGAEASEDASGPSSTGSASDDDVVDADYEVVDEDK
2 changes: 2 additions & 0 deletions bioinformaticsProject/hsp70gene_18.fasta
Original file line number Diff line number Diff line change
@@ -0,0 +1,2 @@
>sp|Q3IUI0.1|DNAK_NATPD RecName: Full=Chaperone protein DnaK; AltName: Full=HSP
MASNKILGIDLGTTNSAFAVMEGGDPEIIVNSEGERTTPSVVAFTDDGERLVGKPAKNQAVQNPEDTIQSIKRHMGEDDYTVEVGDDEYTPEQISAMILQKIKRDAEEYLGDDIEKAVITVPAYFNDRQRQATKDAGEIAGFEVERIVNEPTAAAMAYGLDDESDQTVLVYDLGGGTFDVSILDLGGGVYEVVATNGDNDLGGDDWDEAIIDYLADSFEEEHGIDLREDRQALQRLHEAAEEAKIELSSRKETNINLPFIAATDEGPLNLEESISRAKFESLTSDLVERTVGPTEQALDDAGYSKGDIDEVILVGGSTRMPMVQEKVEELTGQEPKKNVNPDEAVGLGAAIQGGVLSGDVDDIVLLDVTPLSLGIEVKGGLFERLIDKNTTIPTEASKVFTTAADNQTSVNIRVFQGEREIAEENELLGAFQLTGIPPAPAGTPQIEVTFNIDENGIVNVEAEDQGSGNKEDITIEGGVGLSDEEIEEMQEEAEKHAEEDEKRRERIEARNEAESTLQRAETLLDENEDAVDDDLRADIEASMDDLREVVEDEDADTDELTEATEALAEALQEIGKQMYQQQAGEGGAGAGAGAAGGMGGAGPGGMGGAGPGGMGGAGPGGMGGAGPGAGAGQQGDGEEFVDADFEDVDDEDDEDE
2 changes: 2 additions & 0 deletions bioinformaticsProject/hsp70gene_19.fasta
Original file line number Diff line number Diff line change
@@ -0,0 +1,2 @@
>sp|B9LUC7.1|DNAK_HALLT RecName: Full=Chaperone protein DnaK; AltName: Full=HSP
MASNKILGIDLGTTNSAFAVMEGDEPEIIANAEGDRTTPSVVAFADDGERLVGKPAKNQAVQNPDRTIQSIKRHMGEDGYTVEIGDEEYTPEQVSAMILQKIKRDAEEYLGDDVEKAVITVPAYFNDKQRQATKDAGEIAGFEVERIVNEPTAASMAYGLDDESDQTVLVYDLGGGTFDVSVLDLGGGVYEVVATNGDNDLGGDDWDEALIDHLAKEFKNNHGIDLREDRQALQRLKDAAEEAKIELSSKKETTVNLPFITATDSGPVHLEQSITRATFENLTSDLIERTVNPTEQALSDADYSKSDIDEVILVGGSTRMPQVQEQVEALVGQEPKKNVNPDEAVALGAAVQGGVLSGDVDDIVLLDVTPLSLGIEVKGGLFERLIEKNTTIPTEESKVFTTAADNQTSVNVRVFQGEREIAEENELLGAFQLSGIPPAPAGTPQIEVSFNIDENGIVNVEAEDQGSGNAESITIEGGVGLSDEEIDQMQEEAEKHKEEDEARRERIEARNEAETSIQRAETLLEENEEELDDDELVADIEAAIEDVEEVLEDEDADTDEIESATEALTEELQEIGKQMYEGQAAQAGPGGAGGAAGAGPGGMGGMGGAAGPGGAGGAGPGGADADDEEYVDADFEDVDDEDDA
2 changes: 2 additions & 0 deletions bioinformaticsProject/hsp70gene_20.fasta
Original file line number Diff line number Diff line change
@@ -0,0 +1,2 @@
>sp|B0R3H4.1|DNAK_HALS3 RecName: Full=Chaperone protein DnaK; AltName: Full=HSP
MASEKILGVDLGTTNSAFAVMEGSDPEIITNEEGDRTTPSIVAHDDGELLVGKPAKNQAVQNPDQTIASIKRHMGEEDYTVALGDDEYTPEEISARILQKIKRDAEEYLGQDVEKAVITVPAYFNDRQRQATKDAGEIAGFDVERIVNEPTAASMAYGLDEDRDQTVLVYDLGGGTFDVSILDLGGGVYEVAATNGDNDLGGDDWDHAIIDHLADNFENEHGIDLREDRQALQRLTEAAEEAKIELSSRKETTVNLPFVTATDSGPVHLEQDITRATFESITEDLIERTVGPTEQALEDAGLSKSDIDDVILVGGSTRMPQVQAQVEDLVGQEPKKNVNPDEAVALGAAVQGGVLSGEVDDIVLVDVTPLSLGIEVKGGLFERLIEKNTAIPTTASKVFTTAADNQTSVQIRVFQGEREIASENELLGDFHLTGIPPAPAGTPQIEVTFEIDADGIVNVEAEDQGSGNAESITIEGGAGLSDEQIDEMQEDAEAHAEEDEQRRRRIEARNEAETAIQRAESLLEENEELVDEDLEADVNDAIDDVQAVLDEDEPEIDALETATEELSDTLQEIGKQAYQQQQDAQAGAAGGAGGMGGMGGMADGPGGAADADGDDEEYVDADFEDVDEE
2 changes: 2 additions & 0 deletions bioinformaticsProject/hsp70gene_21.fasta
Original file line number Diff line number Diff line change
@@ -0,0 +1,2 @@
>sp|Q9UXR0.1|DNAK_METTE RecName: Full=Chaperone protein DnaK; AltName: Full=HSP
MGKILGIDLGTTNSCMAVMEGGEAVVIPNAEGARTTPSVVGFSKKGEKLVGQVAKRQAISNPENTVYSIKRHMGEPNYKVTLQGKHNTPQEISAMILQKLKADAEAYLGEEIKQAVITVPAYFNDAQRQATKDAGTIAGLEVLRIINEPTAASLAYGLDKGEVEQTILVYDLGGGTFDVSILEIGGGVFEVKATSGDTHLGGDDFDQRIVNYLLAEFKKTEGIDLSKDRAVLQRLTDAAEKAKIELSGVASTNINLPFLTVGPDGEPKHLDIDLTRAQFQKMTEDLLEKTLVSMRQALSDAKLTPNDIDKVILIGGATRMPAVVELVENFTGKKPYKNINPDEAVAIGAAIQAGVLGGEVKDILLLDVTPLTLGIETLGGIATPLIPRNTTIPTRKSQIFSTAADNQPSVEIHVLQGERGIASENKTLGRFTLDGIPPAPRGVPQIEVTFDIDANGILHVSAKDLGTGREQSISIQKPGGLTDAEIERMIKDAELHAEEDRKRKEEVETRNNAETLINAAEKTLKEAGDVATEDQKSKVNAAIDDLKKALEGKDAEEIKAKTEALQEAIYPISTAMYQKAAQQAQQAAGGAAGRTDAKGPEETVVDAIMR
2 changes: 2 additions & 0 deletions bioinformaticsProject/hsp70gene_22.fasta
Original file line number Diff line number Diff line change
@@ -0,0 +1,2 @@
>sp|Q0W874.1|DNAK_METAR RecName: Full=Chaperone protein DnaK; AltName: Full=HSP
MSKILGIDLGTSNSEAAIMEGGKPVIIPSAEGARMFPSVVAFTKTGERLVGEAARRQAVTNPERTIIAIKRKMGTDYKVEIDGKKYTPQEISAMILQKIKQDAEAYIGEKITKAVITVPAYFNDNQRQATKDAGTIAGLEVLRVINEPTAAALAFGLDKKGSQKILVFDLGGGTLDVTIMEMGDGVFEVLSTSGDTQLGGTDMDNKIIDYIASQFKKDTGIDLRNDKMAMQRLRDAAEKAKIELSSTLQTQVNLPFITADASGPKHLDMMLTRATLEELVREVVERCYAPMRQAISDAKLTANQIDRIILVGGPTRMPIIIETIKKFFGKEPERGIDPMECVAMGASIQGGVLAGEVKDLLLLDVTPLSLGIETLGNVATRLIERNTTIPTRKSQVFSTAADNQTSVEIHVIQGERPMAYDNTTLGRFHLIGIPPAPRGIPQIEVTFDIDANGILNVKAKDLGTGKEQAITITASTKLDKSDIERMVKDAEKFAAEDAAKKEKAEVMNQADTLLYSAEKTLADAGDKITADQKERVTKGSDALREAQKTGDIEKIKAATADLTKTMNEVATVLYQAAQQQYQQQQAAEQAAQQQSGGQQASGSNPGKDPNVVDADYEVVNDKK
Loading