comparison wrapper.sh @ 19:c518cf0d4adb draft

Uploaded
author davidvanzessen
date Wed, 01 Apr 2015 05:09:59 -0400
parents 2bb24ebbbc38
children 850857bc8605
comparison
equal deleted inserted replaced
18:9dd557f17153 19:c518cf0d4adb
1 #!/bin/bash 1 #!/bin/bash
2 set -e 2 set -e
3 dir="$(cd "$(dirname "$0")" && pwd)" 3 dir="$(cd "$(dirname "$0")" && pwd)"
4 input=$1 4 input=$1
5 output=$2 5 method=$2
6 outdir=$3 6 output=$3
7 title=$4 7 outdir=$4
8 title=$5
8 mkdir $outdir 9 mkdir $outdir
9 10
10 unzip $input -d $PWD/files/ > $PWD/unziplog.log 11 unzip $input -d $PWD/files/ > $PWD/unziplog.log
11 cat $PWD/files/*/1_* > $PWD/summary.txt 12 cat $PWD/files/*/1_* > $PWD/summary.txt
12 cat $PWD/files/*/7_* > $PWD/mutationanalysis.txt 13 cat $PWD/files/*/7_* > $PWD/mutationanalysis.txt
13 cat $PWD/files/*/8_* > $PWD/mutationstats.txt 14 cat $PWD/files/*/8_* > $PWD/mutationstats.txt
14 cat $PWD/files/*/10_* > $PWD/hotspots.txt 15 cat $PWD/files/*/10_* > $PWD/hotspots.txt
15 16
16 echo "${BLASTN}" 17 BLASTN_DIR="/home/galaxy/tmp/blast/ncbi-blast-2.2.30+/bin"
18
19 echo "${BLASTN_DIR}"
17 20
18 21
19 echo "identification" 22
20 python $dir/gene_identification.py --input $PWD/summary.txt --output $outdir/annotatedsummary.txt 23
24 echo "identification ($method)"
25
26 if [[ "${method}" == "custom" ]] ; then
27 python $dir/gene_identification.py --input $PWD/summary.txt --output $outdir/identified_genes.txt
28 else
29 ID_index=$(cat $PWD/summary.txt | grep -o -P ".+Sequence ID" | grep -o -P "\t" | wc -l)
30 ID_index=$((ID_index+1))
31 sequence_index=$(cat $PWD/summary.txt | grep -o -P ".+\tSequence" | grep -o -P "\t" | wc -l)
32 sequence_index=$((sequence_index+1))
33
34 echo "$ID_index ${sequence_index}"
35
36 cat $PWD/summary.txt | tail -n+2 | cut -f ${ID_index},${sequence_index} | awk '{print ">" $1 "\n" $2}' > $PWD/sequences.fasta
37
38 echo -e "qseqid\tsseqid\tpident\tlength\tmismatch\tgapopen\tqstart\tqend\tsstart\tsend\tevalue\tbitscore" > $outdir/identified_genes.txt
39 ${BLASTN_DIR}/blastn -task blastn -db $dir/subclass_definition.db -query $PWD/sequences.fasta -outfmt 6 >> $outdir/identified_genes.txt
40 fi
41
42
43
21 echo "merging" 44 echo "merging"
22 Rscript $dir/merge_and_filter.r $outdir/annotatedsummary.txt $PWD/mutationanalysis.txt $PWD/mutationstats.txt $PWD/hotspots.txt $outdir/merged.txt $outdir/unmatched.txt 45 Rscript $dir/merge_and_filter.r $PWD/summary.txt $PWD/mutationanalysis.txt $PWD/mutationstats.txt $PWD/hotspots.txt $outdir/identified_genes.txt $outdir/merged.txt $outdir/unmatched.txt $method
23 46
24 genes="ca,ca1,ca2,cg,cg1,cg2,cg3,cg4,cm" 47 genes="ca,ca1,ca2,cg,cg1,cg2,cg3,cg4,cm"
25 echo "R mutation analysis" 48 echo "R mutation analysis"
26 Rscript $dir/mutation_analysis.r $outdir/merged.txt $genes $outdir 2>&1 49 Rscript $dir/mutation_analysis.r $outdir/merged.txt $genes $outdir 2>&1
27 echo "python mutation analysis" 50 echo "python mutation analysis"