Gitlab is now using https://gitlab.lcsb.uni.lu as it's primary address. Please update your bookmarks. FAQ.

annotateHMMs.sh 2.43 KB
Newer Older
Laura Denies's avatar
Laura Denies committed
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68
#! /bin/bash -l

cpus=12 # run on with -l nodes=1
hmmscan_tool="/work/projects/ecosystem_biology/local_tools/hmmer-3.1b1-linux-intel-x86_64/binaries/hmmsearch --cpu $cpus --noali --notextw "
fasta=swissprot.faa # change this to your filename

#KEGG
db=kegg
hmm_file=/work/projects/ecosystem_biology/data/hmm/KEGG/KO.hmm
keggout_file=$fasta.$db.hmmscan
time $hmmscan_tool --tblout $keggout_file $hmm_file $fasta >/dev/null
#out_file=$fasta
#perl /home/users/aheintzbuschart/myScripts/consolidate_hmmscan_results_justKEGG.pl $out_file $keggout_file

#META-cyc
db=metacyc
hmm_file=/work/projects/ecosystem_biology/data/hmm/$db/$db.hmm
metacycout_file=$fasta.$db.hmmscan
time $hmmscan_tool --tblout $metacycout_file $hmm_file $fasta >/dev/null

#Pfam
db=Pfam-A
hmm_file=/work/projects/ecosystem_biology/data/hmm/$db/$db.hmm
pfamout_file=$fasta.$db.hmmscan
time $hmmscan_tool --tblout $pfamout_file $hmm_file $fasta >/dev/null

#TIGR
db=tigrpfam
hmm_file=/work/projects/ecosystem_biology/data/hmm/TIGRPFAM/$db.hmm
tigrpfamout_file=$fasta.$db.hmmscan
time $hmmscan_tool --tblout $tigrpfamout_file $hmm_file $fasta >/dev/null

#swissprot
db=swissprot
hmm_file=/work/projects/ecosystem_biology/data/hmm/SwissProt/$db.hmm
swissprotout_file=$fasta.$db.hmmscan
time $hmmscan_tool --tblout $swissprotout_file $hmm_file $fasta >/dev/null

date

#consolidate
perl /work/projects/ecosystem_biology/local_tools/perlscripts/hmms/consolidate_hmmscan_results.pl $fasta $keggout_file $metacycout_file $pfamout_file $swissprotout_file $tigrpfamout_file

date

input=${fasta}pfam.tsv
idn=pfamID
python /home/users/aheintzbuschart/myScripts/150705_MUST_hmmParsePfam.py $input $idn -g $(grep ">" $fasta | wc -l)

input=${fasta}kegg.tsv
idn=KO
python /home/users/aheintzbuschart/myScripts/150705_MUST_hmmParse.py $input $idn -g $(grep ">" $fasta | wc -l)

input=${fasta}metacyc.tsv
idn=metaCycID
python /home/users/aheintzbuschart/myScripts/150705_MUST_hmmParse.py $input $idn -g $(grep ">" $fasta | wc -l)

input=${fasta}swissprot.tsv
idn=swissprotEC
python /home/users/aheintzbuschart/myScripts/150705_MUST_hmmParse.py $input $idn -g $(grep ">" $fasta | wc -l)

input=${fasta}tigrpfam.tsv
idn=tigrID
python /home/users/aheintzbuschart/myScripts/150705_MUST_hmmParse.py $input $idn -g $(grep ">" $fasta | wc -l)

python /home/users/aheintzbuschart/myScripts/150310_MUST_hmmBestAll.py ${fasta}kegg.tsv ${fasta}metacyc.tsv ${fasta}swissprot.tsv ${fasta}pfam.tsv ${fasta}tigrpfam.tsv -g $(grep ">" $fasta | wc -l)

date