diff --git a/Q1.sh b/Q1.sh
new file mode 100644
index 0000000..51c9df7
--- /dev/null
+++ b/Q1.sh
@@ -0,0 +1,26 @@
+#!/usr/bin/env bash
+# This script is for Question 1 of EX11.
+# Usage: bash Q1.sh   (run from the directory that holds bin/ and gene_sequences/)
+#
+# For each gene (sporecoat, transporter) it concatenates sequence files
+# 01-04 into one FASTA file and aligns that file with muscle.
+
+set -euo pipefail
+
+# Start the combined file from file 01, then append files 02-04.
+cat gene_sequences/sporecoat01.fasta > gene_sequences/sp.fasta
+for sp in gene_sequences/sporecoat0[234].fasta; do
+  # Separate the files with a real newline. Use printf: an unquoted
+  # `echo \n` prints a literal "n", which would end up in the FASTA data.
+  printf '\n' >> gene_sequences/sp.fasta
+  cat "$sp" >> gene_sequences/sp.fasta
+done
+./bin/muscle -in gene_sequences/sp.fasta -out gene_sequences/sp.align
+
+# Same procedure for the transporter gene.
+cat gene_sequences/transporter01.fasta > gene_sequences/tr.fasta
+for tr in gene_sequences/transporter0[234].fasta; do
+  printf '\n' >> gene_sequences/tr.fasta
+  cat "$tr" >> gene_sequences/tr.fasta
+done
+./bin/muscle -in gene_sequences/tr.fasta -out gene_sequences/tr.align
diff --git a/Q2.sh b/Q2.sh
new file mode 100644
index 0000000..c1bded1
--- /dev/null
+++ b/Q2.sh
@@ -0,0 +1,28 @@
+#!/usr/bin/env bash
+# This script is for Question 2 of EX11.
+# Usage: bash Q2.sh   (run from the directory that holds bin/, gene_sequences/ and proteomes/)
+#
+# Builds an HMM profile from the transporter alignment, searches every
+# proteome FASTA file against it, and writes per-proteome hit counts to
+# proteomes/hit_counts.txt.
+
+set -euo pipefail
+
+# Build an HMM profile for the transporter gene.
+./bin/hmmbuild proteomes/tr.hmm gene_sequences/tr.align
+
+# Search each proteome against the profile; the --tblout table is written
+# next to the input file with the extension replaced by .hits.
+for bp in proteomes/*.fasta; do
+  ./bin/hmmsearch --tblout "${bp%.*}.hits" proteomes/tr.hmm "$bp"
+done
+
+# Count the hits in each table.
+echo "Number of hits to the HMM profile in each proteome:" > proteomes/hit_counts.txt
+for hits in proteomes/*.hits; do
+  printf '%s\n' "${hits##*/}" >> proteomes/hit_counts.txt
+  # Count every line that does not start with '#'. awk is used instead of
+  # `grep -vc` because grep exits 1 on a zero count, which would abort the
+  # script under `set -e`.
+  awk '!/^#/ { n++ } END { print n + 0 }' "$hits" >> proteomes/hit_counts.txt
+done
diff --git a/bin/alimask b/bin/alimask
new file mode 100755
index 0000000..8fb0bb1
Binary files /dev/null and b/bin/alimask differ
diff --git a/bin/hmmalign b/bin/hmmalign
new file mode 100755
index 0000000..cf83ebc
Binary files /dev/null and b/bin/hmmalign differ
diff --git a/bin/hmmbuild b/bin/hmmbuild
new file mode 100755
index 0000000..2327f67
Binary files /dev/null and b/bin/hmmbuild differ
diff --git a/bin/hmmconvert b/bin/hmmconvert
new file mode 100755
index 0000000..5ec9798
Binary files /dev/null and b/bin/hmmconvert differ
diff --git a/bin/hmmemit b/bin/hmmemit new file mode 
100755 index 0000000..9a832dc Binary files /dev/null and b/bin/hmmemit differ diff --git a/bin/hmmfetch b/bin/hmmfetch new file mode 100755 index 0000000..6991b89 Binary files /dev/null and b/bin/hmmfetch differ diff --git a/bin/hmmlogo b/bin/hmmlogo new file mode 100755 index 0000000..f6e2915 Binary files /dev/null and b/bin/hmmlogo differ diff --git a/bin/hmmpgmd b/bin/hmmpgmd new file mode 100755 index 0000000..1057ac1 Binary files /dev/null and b/bin/hmmpgmd differ diff --git a/bin/hmmpress b/bin/hmmpress new file mode 100755 index 0000000..fef4230 Binary files /dev/null and b/bin/hmmpress differ diff --git a/bin/hmmscan b/bin/hmmscan new file mode 100755 index 0000000..408eb8f Binary files /dev/null and b/bin/hmmscan differ diff --git a/bin/hmmsearch b/bin/hmmsearch new file mode 100755 index 0000000..3763311 Binary files /dev/null and b/bin/hmmsearch differ diff --git a/bin/hmmsim b/bin/hmmsim new file mode 100755 index 0000000..5446ca8 Binary files /dev/null and b/bin/hmmsim differ diff --git a/bin/hmmstat b/bin/hmmstat new file mode 100755 index 0000000..94ba67f Binary files /dev/null and b/bin/hmmstat differ diff --git a/bin/jackhmmer b/bin/jackhmmer new file mode 100755 index 0000000..81b9b96 Binary files /dev/null and b/bin/jackhmmer differ diff --git a/bin/makehmmerdb b/bin/makehmmerdb new file mode 100755 index 0000000..17f00fd Binary files /dev/null and b/bin/makehmmerdb differ diff --git a/bin/muscle b/bin/muscle new file mode 100755 index 0000000..569be49 Binary files /dev/null and b/bin/muscle differ diff --git a/bin/nhmmer b/bin/nhmmer new file mode 100755 index 0000000..77aa05c Binary files /dev/null and b/bin/nhmmer differ diff --git a/bin/nhmmscan b/bin/nhmmscan new file mode 100755 index 0000000..847d9b4 Binary files /dev/null and b/bin/nhmmscan differ diff --git a/bin/phmmer b/bin/phmmer new file mode 100755 index 0000000..a8c6031 Binary files /dev/null and b/bin/phmmer differ