Files
annotate/detectors/rrna/bin/go_rrna.sh
alain viari efb9949075 CDS detector added
Former-commit-id: a72f30f90d22cc3c7ff6059e0254e47911bb5af1
Former-commit-id: db0264bdbe5136b6e6dc44e4788175a257439643
2015-11-08 14:28:57 +01:00

58 lines
1.6 KiB
Bash
Executable File

#!/bin/bash
#
# Annotate rRNA
#
#========================================================================================
#
# Annotate rRNA genes based on HMMER3 profils.
#
# go_rrna.sh <FASTAFILE>
#
# - <FASTAFILE> : The fasta file containing the genome to annotate
#
# Results are printed to the standart output
#
#========================================================================================
# -- CAUTION -- Works as long than the script
# is not called through a symlink
THIS_DIR="$(dirname ${BASH_SOURCE[0]})"
source "${THIS_DIR}/../../../scripts/bash_init.sh"
pushTmpDir ORG.rrna
RRNADB="${RRNA_DATA_DIR}/plast_RRNA.hmm"
export CAUTRNADB
if [[ ! "$1" =~ ^/ ]]; then
QUERY="${CALL_DIR}/$1"
else
QUERY="$1"
fi
RRNA=$(basename ${QUERY})
hmmsearch --max ${RRNADB} ${QUERY} | \
awk '/Query: / { \
profil=$2; \
match($3,"[0-9][0-9]*");\
lprof=substr($3,RSTART,RLENGTH)} \
/ [0-9][0-9]* ! / { \
print profil,lprof,$7,$8,$10,$11}' | \
awk '($3 <=5) && (($2-$4) <=5) { \
full=1;$5=$5-$3+1;$6=$6+($2-$4)}
{loc=$5".."$6} \
($1 ~ /_RC$/) { \
loc="complement("loc")"} \
(full==1) {match($1,"_..*S");\
rrna=substr($1,RSTART+1,RLENGTH-1);\
print "FT rRNA " loc; \
print "FT /gene=\"rrn"rrna"\""
print "FT /product=\""rrna" ribosomal RNA\"";\
full=0
}'
popTmpDir
exit 0