-
Notifications
You must be signed in to change notification settings - Fork 2
/
Copy pathdoRSAT
executable file
·25 lines (21 loc) · 1.09 KB
/
doRSAT
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
#!/bin/bash
# Given a motif file (meme.txt) and a directory full of genomes in fasta format
# launches rsat on each genome
if [ "$#" -lt 5 ]; then
echo 'doRSAT MOTIF_FILE FASTA_DIR GENBANK_DIR RESULTS_DIR REGULATOR_NAME'
exit 65
fi
MOTIF_FILE=$1
FASTA_DIR=$2
GENBANK_DIR=$3
RESULTS_DIR=$4
REGULATOR_NAME=$5
for i in $(ls $FASTA_DIR)
do
org=$(echo $i | awk 'BEGIN { FS = "." } ; {print $1}')
mkdir $RESULTS_DIR/$org'_'$REGULATOR_NAME > /dev/null
matrix-scan -m $MOTIF_FILE -matrix_format meme -i $FASTA_DIR/$i -bginput -markov 3 -return sites -o $RESULTS_DIR/$org'_'$REGULATOR_NAME/rawhits.txt -quick -n skip -uth pval 0.001 -pseudo 0.01
./getRsatEvalue $RESULTS_DIR/$org'_'$REGULATOR_NAME/rawhits.txt $FASTA_DIR/$i > $RESULTS_DIR/$org'_'$REGULATOR_NAME/hits.txt
./parseRSAT -l -t 1e-4 -o $RESULTS_DIR/$org'_'$REGULATOR_NAME/hits.txt $GENBANK_DIR/$org.gbk $REGULATOR_NAME > $RESULTS_DIR/$org'_'$REGULATOR_NAME'_orientation.tab'
./parseRSAT -l -t 1e-4 $RESULTS_DIR/$org'_'$REGULATOR_NAME/hits.txt $GENBANK_DIR/$org.gbk $REGULATOR_NAME > $RESULTS_DIR/$org'_'$REGULATOR_NAME'_noorientation.tab'
done