# HG changeset patch # User davidvanzessen # Date 1472455729 14400 # Node ID e87dcca14bd618e564d41b50ce2f789dc2a8936c # Parent 4a93146f87aa84a0326b4c0166eca76da04a6ef3 Uploaded diff -r 4a93146f87aa -r e87dcca14bd6 change_o/define_clones.sh --- a/change_o/define_clones.sh Mon Aug 22 09:11:17 2016 -0400 +++ b/change_o/define_clones.sh Mon Aug 29 03:28:49 2016 -0400 @@ -21,7 +21,8 @@ output=${10} output2=${11} - /data/users/david/anaconda3/bin/python $dir/DefineClones.py bygroup -d $PWD/input.tab --nproc 4 --outdir $PWD/outdir --outname output --mode $mode --act $act --model $model --dist $dist --norm $norm --sym $sym --link $link + python3 $dir/DefineClones.py bygroup -d $PWD/input.tab --nproc 4 --outdir $PWD/outdir --outname output --mode $mode --act $act --model $model --dist $dist --norm $norm --sym $sym --link $link + #/data/users/david/anaconda3/bin/python $dir/DefineClones.py bygroup -d $PWD/input.tab --nproc 4 --outdir $PWD/outdir --outname output --mode $mode --act $act --model $model --dist $dist --norm $norm --sym $sym --link $link #/home/galaxy/anaconda3/bin/python $dir/DefineClones.py bygroup -d $PWD/input.tab --nproc 4 --outdir $PWD/outdir --outname output --mode $mode --act $act --model $model --dist $dist --norm $norm --sym $sym --link $link Rscript $dir/define_clones.r $PWD/outdir/output_clone-pass.tab $output2 2>&1 @@ -30,10 +31,13 @@ output=$4 output2=$5 - /data/users/david/anaconda3/bin/python $dir/DefineClones.py hclust -d $PWD/input.tab --nproc 4 --outdir $PWD/outdir --outname output --method $method + python3 $dir/DefineClones.py hclust -d $PWD/input.tab --nproc 4 --outdir $PWD/outdir --outname output --method $method + #/data/users/david/anaconda3/bin/python $dir/DefineClones.py hclust -d $PWD/input.tab --nproc 4 --outdir $PWD/outdir --outname output --method $method #/home/galaxy/anaconda3/bin/python $dir/DefineClones.py hclust -d $PWD/input.tab --nproc 4 --outdir $PWD/outdir --outname output --method $method Rscript $dir/define_clones.r $PWD/outdir/output_clone-pass.tab $output2 2>&1 fi cp $PWD/outdir/output_clone-pass.tab $output + +rm -rf $PWD/outdir/ diff -r 4a93146f87aa -r e87dcca14bd6 change_o/makedb.sh --- a/change_o/makedb.sh Mon Aug 22 09:11:17 2016 -0400 +++ b/change_o/makedb.sh Mon Aug 29 03:28:49 2016 -0400 @@ -29,7 +29,10 @@ echo "makedb: $PWD/outdir" -/data/users/david/anaconda3/bin/python $dir/MakeDb.py imgt -i $input --outdir $PWD/outdir --outname output $noparse $scores $regions +python3 $dir/MakeDb.py imgt -i $input --outdir $PWD/outdir --outname output $noparse $scores $regions +#/data/users/david/anaconda3/bin/python $dir/MakeDb.py imgt -i $input --outdir $PWD/outdir --outname output $noparse $scores $regions #/home/galaxy/anaconda3/bin/python $dir/MakeDb.py imgt -i $input --outdir $PWD/outdir --outname output $noparse $scores $regions mv $PWD/outdir/output_db-pass.tab $output + +rm -rf $PWD/outdir/ diff -r 4a93146f87aa -r e87dcca14bd6 merge.r --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/merge.r Mon Aug 29 03:28:49 2016 -0400 @@ -0,0 +1,27 @@ +args <- commandArgs(trailingOnly = TRUE) + +input.1 = args[1] +input.2 = args[2] + +fields.1 = args[3] +fields.2 = args[4] + +field.1 = args[5] +field.2 = args[6] + +output = args[7] + +dat1 = read.table(input.1, header=T, sep="\t", quote="", stringsAsFactors=F, fill=T, row.names=NULL) +if(fields.1 != "all"){ + fields.1 = unlist(strsplit(fields.1, ",")) + dat1 = dat1[,fields.1] +} +dat2 = read.table(input.2, header=T, sep="\t", quote="", stringsAsFactors=F, fill=T, row.names=NULL) +if(fields.2 != "all"){ + fields.2 = unlist(strsplit(fields.2, ",")) + dat2 = dat2[,fields.2] +} + +dat3 = merge(dat1, dat2, by.x=field.1, by.y=field.2) + +write.table(dat3, output, sep="\t",quote=F,row.names=F,col.names=T) diff -r 4a93146f87aa -r e87dcca14bd6 wrapper.sh --- a/wrapper.sh Mon Aug 22 09:11:17 2016 -0400 +++ b/wrapper.sh Mon Aug 29 03:28:49 2016 -0400 @@ -374,12 +374,15 @@ echo "The data used to generate the sexond SHM Overview plotDownload" >> $output echo "The data used to generate the third SHM Overview plotDownload" >> $output echo "The alignment info on the unmatched sequencesDownload" >> $output + echo "Motif data per sequence IDDownload" >> $output echo "Mutation data per sequence IDDownload" >> $output echo "AA mutation data per sequence IDDownload" >> $output echo "Absent AA location data per sequence IDDownload" >> $output echo "CDR1+FR2+CDR2+FR3+CDR3 sequences that show up more than onceDownload" >> $output + echo "Base count for every sequenceDownload" >> $output + echo "Baseline PDF (http://selection.med.yale.edu/baseline/)Download" >> $output echo "Baseline dataDownload" >> $output echo "Baseline ca PDFDownload" >> $output @@ -388,6 +391,7 @@ echo "Baseline cg dataDownload" >> $output echo "Baseline cm PDFDownload" >> $output echo "Baseline cm dataDownload" >> $output + echo "An IMGT archive with just the matched and filtered sequencesDownload" >> $output echo "An IMGT archive with just the matched and filtered ca sequencesDownload" >> $output echo "An IMGT archive with just the matched and filtered ca1 sequencesDownload" >> $output @@ -398,8 +402,16 @@ echo "An IMGT archive with just the matched and filtered cg3 sequencesDownload" >> $output echo "An IMGT archive with just the matched and filtered cg4 sequencesDownload" >> $output echo "An IMGT archive with just the matched and filtered cm sequencesDownload" >> $output -echo "The Change-O DB file with defined clonesDownload" >> $output + +echo "The Change-O DB file with defined clones and subclass annotationDownload" >> $output echo "The Change-O DB defined clones summary fileDownload" >> $output +echo "The Change-O DB file with defined clones of caDownload" >> $output +echo "The Change-O DB defined clones summary file of caDownload" >> $output +echo "The Change-O DB file with defined clones of cgDownload" >> $output +echo "The Change-O DB defined clones summary file of cgDownload" >> $output +echo "The Change-O DB file with defined clones of cmDownload" >> $output +echo "The Change-O DB defined clones summary file of cmDownload" >> $output + echo "" >> $output echo "" >> $output #downloads tab end @@ -462,7 +474,6 @@ echo "" >> $outdir/base_overview.html echo "---------------- change-o MakeDB ----------------" -echo "---------------- change-o MakeDB ----------------
" >> $log mkdir $outdir/change_o @@ -471,11 +482,35 @@ cd $outdir/change_o bash $dir/change_o/makedb.sh $input false false false $outdir/change_o/change-o-db.txt +bash $dir/change_o/define_clones.sh bygroup $outdir/change_o/change-o-db.txt gene first ham none min complete 3.0 $outdir/change_o/change-o-db-defined_clones.txt $outdir/change_o/change-o-defined_clones-summary.txt -echo "---------------- change-o DefineClones ----------------" -echo "---------------- change-o DefineClones ----------------
" >> $log +Rscript $dir/merge.r $outdir/change_o/change-o-db-defined_clones.txt $outdir/merged.txt "all" "Sequence.ID,best_match" "SEQUENCE_ID" "Sequence.ID" $outdir/change_o/change-o-db-defined_clones.txt 2>&1 + +echo "Rscript $dir/merge.r $outdir/change_o/change-o-db-defined_clones.txt $outdir/$outdir/merged.txt 'all' 'Sequence.ID,best_match' 'Sequence.ID' 'Sequence.ID' '\t' $outdir/change_o/change-o-db-defined_clones.txt 2>&1" + +if [[ $(wc -l < $outdir/new_IMGT_ca/1_Summary.txt) -gt "1" ]]; then + bash $dir/change_o/makedb.sh $outdir/new_IMGT_ca.txz false false false $outdir/change_o/change-o-db-ca.txt + bash $dir/change_o/define_clones.sh bygroup $outdir/change_o/change-o-db-ca.txt gene first ham none min complete 3.0 $outdir/change_o/change-o-db-defined_clones-ca.txt $outdir/change_o/change-o-defined_clones-summary-ca.txt +else + echo "No ca sequences" > "$outdir/change_o/change-o-db-defined_clones-ca.txt" + echo "No ca sequences" > "$outdir/change_o/change-o-defined_clones-summary-ca.txt" +fi -bash $dir/change_o/define_clones.sh bygroup $outdir/change_o/change-o-db.txt gene first ham none min complete 3.0 $outdir/change_o/change-o-db-defined_clones.txt $outdir/change_o/change-o-defined_clones-summary.txt +if [[ $(wc -l < $outdir/new_IMGT_cg/1_Summary.txt) -gt "1" ]]; then + bash $dir/change_o/makedb.sh $outdir/new_IMGT_cg.txz false false false $outdir/change_o/change-o-db-cg.txt + bash $dir/change_o/define_clones.sh bygroup $outdir/change_o/change-o-db-cg.txt gene first ham none min complete 3.0 $outdir/change_o/change-o-db-defined_clones-cg.txt $outdir/change_o/change-o-defined_clones-summary-cg.txt +else + echo "No cg sequences" > "$outdir/change_o/change-o-db-defined_clones-cg.txt" + echo "No cg sequences" > "$outdir/change_o/change-o-defined_clones-summary-cg.txt" +fi + +if [[ $(wc -l < $outdir/new_IMGT_cm/1_Summary.txt) -gt "1" ]]; then + bash $dir/change_o/makedb.sh $outdir/new_IMGT_cm.txz false false false $outdir/change_o/change-o-db-cm.txt + bash $dir/change_o/define_clones.sh bygroup $outdir/change_o/change-o-db-cm.txt gene first ham none min complete 3.0 $outdir/change_o/change-o-db-defined_clones-cm.txt $outdir/change_o/change-o-defined_clones-summary-cm.txt +else + echo "No cm sequences" > "$outdir/change_o/change-o-db-defined_clones-cm.txt" + echo "No cm sequences" > "$outdir/change_o/change-o-defined_clones-summary-cm.txt" +fi PWD="$tmp"