Mercurial > repos > davidvanzessen > mutation_analysis
diff wrapper.sh @ 120:613278c1bde0 draft
Uploaded
author | davidvanzessen |
---|---|
date | Tue, 16 Aug 2016 09:10:50 -0400 |
parents | 626a956f3811 |
children | 31cca6d3722a |
line wrap: on
line diff
--- a/wrapper.sh Thu Aug 11 10:35:52 2016 -0400 +++ b/wrapper.sh Tue Aug 16 09:10:50 2016 -0400 @@ -45,14 +45,6 @@ cat `find $PWD/files/ -name "8_*"` > $PWD/mutationstats.txt cat `find $PWD/files/ -name "10_*"` > $PWD/hotspots.txt -#cat $PWD/files/*/1_* > $PWD/summary.txt -#cat $PWD/files/*/3_* > $PWD/sequences.txt -#cat $PWD/files/*/5_* > $PWD/aa.txt -#cat $PWD/files/*/6_* > $PWD/junction.txt -#cat $PWD/files/*/7_* > $PWD/mutationanalysis.txt -#cat $PWD/files/*/8_* > $PWD/mutationstats.txt -#cat $PWD/files/*/10_* > $PWD/hotspots.txt - if [[ ${#BLASTN_DIR} -ge 5 ]] ; then echo "On server, using BLASTN_DIR env: ${BLASTN_DIR}" else @@ -66,25 +58,11 @@ if [[ "${method}" == "custom" ]] ; then python $dir/gene_identification.py --input $PWD/summary.txt --output $outdir/identified_genes.txt else - #ID_index=$(cat $PWD/summary.txt | grep -o -P ".+Sequence ID" | grep -o -P "\t" | wc -l) - #ID_index=$((ID_index+1)) - #sequence_index=$(cat $PWD/summary.txt | grep -o -P ".+\tSequence" | grep -o -P "\t" | wc -l) - #sequence_index=$((sequence_index+1)) - - #echo "${ID_index}, ${sequence_index}" - - #cat $PWD/summary.txt | tail -n+2 | cut -f ${ID_index},${sequence_index} | awk '{print ">" $1 "\n" $2}' > $PWD/sequences.tmp - #cat $PWD/summary.txt | tail -n+2 | awk -v id="${ID_index}" -v seq="${sequence_index}" 'BEGIN{FS="\t"} if(NF>10 && length($seq) > 0) {print ">" $id "\n" $seq} {}' > $PWD/sequences.fasta - - #cat $PWD/sequences.tmp | grep -B1 -vE ">.*|^$" | grep -v "^\-\-$" > sequences.fasta #filter out empty sequences - echo "---------------- summary_to_fasta.py ----------------" echo "---------------- summary_to_fasta.py ----------------<br />" >> $log python $dir/summary_to_fasta.py --input $PWD/summary.txt --fasta $PWD/sequences.fasta - #rm $PWD/sequences.tmp - echo -e "qseqid\tsseqid\tpident\tlength\tmismatch\tgapopen\tqstart\tqend\tsstart\tsend\tevalue\tbitscore" > $outdir/identified_genes.txt ${BLASTN_DIR}/blastn -task blastn -db $dir/subclass_definition.db -query $PWD/sequences.fasta -outfmt 6 >> $outdir/identified_genes.txt fi @@ -397,10 +375,6 @@ echo "<tr><td>Baseline cg data</td><td><a href='baseline_cg.txt'>Download</a></td></tr>" >> $output echo "<tr><td>Baseline cm PDF</td><td><a href='baseline_cm.pdf'>Download</a></td></tr>" >> $output echo "<tr><td>Baseline cm data</td><td><a href='baseline_cm.txt'>Download</a></td></tr>" >> $output -#echo "<tr><td></td><td><a href='IgAT.zip'>IgAT zip</a></td></tr>" >> $output -#echo "<tr><td></td><td><a href='IgAT_ca.zip'>IgAT ca zip</a></td></tr>" >> $output -#echo "<tr><td></td><td><a href='IgAT_cg.zip'>IgAT cg zip</a></td></tr>" >> $output -#echo "<tr><td></td><td><a href='IgAT_cm.zip'>IgAT cm zip</a></td></tr>" >> $output echo "<tr><td>An IMGT archive with just the matched and filtered sequences</td><td><a href='new_IMGT.txz'>Download</a></td></tr>" >> $output echo "<tr><td>An IMGT archive with just the matched and filtered ca sequences</td><td><a href='new_IMGT_ca.txz'>Download</a></td></tr>" >> $output echo "<tr><td>An IMGT archive with just the matched and filtered ca1 sequences</td><td><a href='new_IMGT_ca1.txz'>Download</a></td></tr>" >> $output @@ -411,6 +385,8 @@ echo "<tr><td>An IMGT archive with just the matched and filtered cg3 sequences</td><td><a href='new_IMGT_cg3.txz'>Download</a></td></tr>" >> $output echo "<tr><td>An IMGT archive with just the matched and filtered cg4 sequences</td><td><a href='new_IMGT_cg4.txz'>Download</a></td></tr>" >> $output echo "<tr><td>An IMGT archive with just the matched and filtered cm sequences</td><td><a href='new_IMGT_cm.txz'>Download</a></td></tr>" >> $output +echo "<tr><td>The Change-O DB file with defined clones</td><td><a href='change_o/change-o-db-defined_clones.txt'>Download</a></td></tr>" >> $output +echo "<tr><td>The Change-O DB defined clones summary file</td><td><a href='change_o/change-o-defined_clones-summary.txt'>Download</a></td></tr>" >> $output echo "</table>" >> $output echo "</div>" >> $output #downloads tab end @@ -465,15 +441,6 @@ if [[ "$naive_output" != "None" ]] then - #echo "---------------- imgt_loader.r ----------------" - #echo "---------------- imgt_loader.r ----------------<br />" >> $log - #python $dir/imgt_loader.py --summ $PWD/summary.txt --aa $PWD/aa.txt --junction $PWD/junction.txt --output $naive_output - #Rscript --verbose $dir/imgt_loader.r $PWD/summary.txt $PWD/aa.txt $PWD/junction.txt $outdir/loader_output.txt 2>&1 - - #echo "---------------- naive_output.r ----------------" - #echo "---------------- naive_output.r ----------------<br />" >> $log - #Rscript $dir/naive_output.r $outdir/loader_output.txt $outdir/merged.txt ${naive_output_ca} ${naive_output_cg} ${naive_output_cm} $outdir/ntoverview.txt $outdir/ntsum.txt 2>&1 - cp $outdir/new_IMGT_ca.txz ${naive_output_ca} cp $outdir/new_IMGT_cg.txz ${naive_output_cg} cp $outdir/new_IMGT_cm.txz ${naive_output_cm} @@ -481,6 +448,24 @@ echo "</table>" >> $outdir/base_overview.html +echo "---------------- change-o MakeDB ----------------" +echo "---------------- change-o MakeDB ----------------<br />" >> $log + +mkdir $outdir/change_o + +tmp="$PWD" + +cd $outdir/change_o + +bash $dir/change_o/makedb.sh $input false false false $outdir/change_o/change-o-db.txt + +echo "---------------- change-o DefineClones ----------------" +echo "---------------- change-o DefineClones ----------------<br />" >> $log + +bash $dir/change_o/define_clones.sh bygroup $outdir/change_o/change-o-db.txt gene first ham none min complete 3.0 $outdir/change_o/change-o-db-defined_clones.txt $outdir/change_o/change-o-defined_clones-summary.txt + +PWD="$tmp" + mv $log $outdir/log.html echo "<html><center><h1><a href='index.html'>Click here for the results</a></h1>Tip: Open it in a new tab (middle mouse button or right mouse button -> 'open in new tab' on the link above)<br />" > $log