mutation_analysis: wrapper.sh comparison

comparison wrapper.sh @ 89:480fdd383fdb draft

Uploaded

author	davidvanzessen
date	Tue, 31 May 2016 08:30:50 -0400
parents	07f7da724a77
children	f0e8dac22c6e

comparison

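Legend: equal (leading space) · deleted (leading "-") · inserted (leading "+") · replaced (a "-" line followed by its "+" replacement)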

-:d57c624a9aa9
+:480fdd383fdb
 echo "---------------- read parameters ----------------"
 echo "---------------- read parameters ----------------<br />" > $output
 echo "unpacking IMGT file"
 type="`file $input`"
 if [[ "$type" == *"Zip archive"* ]] ; then
 	echo "Zip archive"
 	echo "unzip $input -d $PWD/files/"
 	unzip $input -d $PWD/files/
 cat `find $PWD/files/ -name "6_*"` > $PWD/junction.txt
 cat `find $PWD/files/ -name "7_*"` > $PWD/mutationanalysis.txt
 cat `find $PWD/files/ -name "8_*"` > $PWD/mutationstats.txt
 cat `find $PWD/files/ -name "10_*"` > $PWD/hotspots.txt
 #cat $PWD/files/*/1_* > $PWD/summary.txt
 #cat $PWD/files/*/3_* > $PWD/sequences.txt
 #cat $PWD/files/*/5_* > $PWD/aa.txt
 #cat $PWD/files/*/6_* > $PWD/junction.txt
 #cat $PWD/files/*/7_* > $PWD/mutationanalysis.txt
 #BLASTN_DIR="/home/galaxy/tmp/blast/ncbi-blast-2.2.30+/bin"
 echo "${BLASTN_DIR}"
 echo "identification ($method)"
-echo "identification ($method)<br />" >> $output
+echo "---------------- identification ($method) ----------------"
+echo "---------------- identification ($method) ----------------<br />" >> $output
-echo "blast or custom"
 if [[ "${method}" == "custom" ]] ; then
-	echo "custom"
 	python $dir/gene_identification.py --input $PWD/summary.txt --output $outdir/identified_genes.txt
 else
-	echo "blast"
 	ID_index=$(cat $PWD/summary.txt | grep -o -P ".+Sequence ID" | grep -o -P "\t" | wc -l)
 	ID_index=$((ID_index+1))
 	sequence_index=$(cat $PWD/summary.txt | grep -o -P ".+\tSequence" | grep -o -P "\t" | wc -l)
 	sequence_index=$((sequence_index+1))
-	echo "$ID_index ${sequence_index}"
 	cat $PWD/summary.txt | tail -n+2 | cut -f ${ID_index},${sequence_index} | awk '{print ">" $1 "\n" $2}' > $PWD/sequences.fasta
 	echo -e "qseqid\tsseqid\tpident\tlength\tmismatch\tgapopen\tqstart\tqend\tsstart\tsend\tevalue\tbitscore" > $outdir/identified_genes.txt
 	${BLASTN_DIR}/blastn -task blastn -db $dir/subclass_definition.db -query $PWD/sequences.fasta -outfmt 6 >> $outdir/identified_genes.txt
 fi
 echo "---------------- sequence_overview.r ----------------"
 mkdir $outdir/sequence_overview
 Rscript $dir/sequence_overview.r $outdir/identified_genes.txt $PWD/sequences.txt $outdir/merged.txt $outdir/sequence_overview $classes $outdir/hotspot_analysis_sum.txt 2>&1
+#Rscript $dir/sequence_overview.r $outdir/before_unique_filter.txt $outdir/sequence_overview $classes $outdir/hotspot_analysis_sum.txt 2>&1
 echo "<table border='1'>" > $outdir/base_overview.html
 while read ID class seq A C G T
 do
 	done
 	tmp=`cat $outdir/unmatched_${func}_n.txt`
 	echo "<th><a href='unmatched.txt'>unmatched (N = ${unmatched_count})</a></th>" >> $output
 	tmp=`cat $outdir/all_${func}_n.txt`
-	echo "<th><a href='matched_${func}_all.txt'>all (N = $tmp)</a></th>" >> $output
+	echo "<th><a href='matched_all_${func}.txt'>all (N = $tmp)</a></th>" >> $output
 	while IFS=, read name cax cay caz ca1x ca1y ca1z ca2x ca2y ca2z cgx cgy cgz cg1x cg1y cg1z cg2x cg2y cg2z cg3x cg3y cg3z cg4x cg4y cg4z cmx cmy cmz unx uny unz allx ally allz
 	do
 		if [ "$name" == "FR S/R (ratio)" ] || [ "$name" == "CDR S/R (ratio)" ] ; then #meh
 			echo "<tr><td>$name</td><td>${cax}/${cay} (${caz})</td><td>${ca1x}/${ca1y} (${ca1z})</td><td>${ca2x}/${ca2y} (${ca2z})</td><td>${cgx}/${cgy} (${cgz})</td><td>${cg1x}/${cg1y} (${cg1z})</td><td>${cg2x}/${cg2y} (${cg2z})</td><td>${cg3x}/${cg3y} (${cg3z})</td><td>${cg4x}/${cg4y} (${cg4z})</td><td>${cmx}/${cmy} (${cmz})</td><td>${allx}/${ally} (${allz})</td></tr>" >> $output

Mercurial > repos > davidvanzessen > mutation_analysis

comparison wrapper.sh @ 89:480fdd383fdb draft