annotate baseline/wrapper.sh @ 127:afb0937ec0dc draft default tip

Uploaded
author davidvanzessen
date Tue, 13 Sep 2016 08:55:05 -0400
parents e7b550d52eb7
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
114
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
1 #!/bin/bash
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
2 dir="$(cd "$(dirname "$0")" && pwd)"
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
3
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
4 testID=$1
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
5 species=$2
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
6 substitutionModel=$3
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
7 mutabilityModel=$4
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
8 clonal=$5
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
9 fixIndels=$6
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
10 region=$7
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
11 inputs=$8
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
12 inputs=($inputs)
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
13 IDs=$9
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
14 IDs=($IDs)
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
15 ref=${10}
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
16 output=${11}
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
17 selection=${12}
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
18 output_table=${13}
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
19 outID="result"
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
20
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
21 echo "$PWD"
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
22
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
23 echo "testID = $testID"
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
24 echo "species = $species"
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
25 echo "substitutionModel = $substitutionModel"
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
26 echo "mutabilityModel = $mutabilityModel"
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
27 echo "clonal = $clonal"
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
28 echo "fixIndels = $fixIndels"
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
29 echo "region = $region"
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
30 echo "inputs = ${inputs[@]}"
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
31 echo "IDs = ${IDs[@]}"
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
32 echo "ref = $ref"
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
33 echo "output = $output"
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
34 echo "outID = $outID"
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
35
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
36 fasta="$PWD/baseline.fasta"
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
37
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
38
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
39 count=0
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
40 for current in ${inputs[@]}
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
41 do
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
42 f=$(file $current)
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
43 zipType="Zip archive"
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
44 if [[ "$f" == *"$zipType"* ]] || [[ "$f" == *"XZ compressed data"* ]]
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
45 then
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
46 id=${IDs[$count]}
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
47 echo "id=$id"
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
48 if [[ "$f" == *"Zip archive"* ]] ; then
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
49 echo "Zip archive"
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
50 echo "unzip $input -d $PWD/files/"
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
51 unzip $current -d "$PWD/$id/"
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
52 elif [[ "$f" == *"XZ compressed data"* ]] ; then
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
53 echo "ZX archive"
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
54 echo "tar -xJf $input -C $PWD/files/"
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
55 mkdir -p "$PWD/$id/files"
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
56 tar -xJf $current -C "$PWD/$id/files/"
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
57 fi
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
58 summaryfile="$PWD/summary_${id}.txt"
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
59 gappedfile="$PWD/gappednt_${id}.txt"
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
60 filtered="$PWD/filtered_${id}.txt"
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
61 filecount=`ls -l $PWD/$id/ | wc -l`
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
62 if [[ "$filecount" -eq "2" ]]
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
63 then
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
64 cat $PWD/$id/*/1_* > $summaryfile
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
65 cat $PWD/$id/*/2_* > $gappedfile
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
66 else
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
67 cat $PWD/$id/1_* > $summaryfile
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
68 cat $PWD/$id/2_* > $gappedfile
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
69 fi
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
70 Rscript $dir/filter.r $summaryfile $gappedfile "$selection" $filtered 2>&1
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
71
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
72 final="$PWD/final_${id}.txt"
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
73 cat $filtered | cut -f2,4,7 > $final
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
74 python $dir/script_imgt.py --input $final --ref $ref --output $fasta --id $id
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
75 else
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
76 python $dir/script_xlsx.py --input $current --ref $ref --output $fasta
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
77 fi
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
78 count=$((count+1))
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
79 done
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
80
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
81 if [[ $(wc -l < $fasta) -eq "1" ]]; then
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
82 echo "No sequences in the fasta file, exiting"
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
83 exit 0
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
84 fi
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
85
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
86 workdir="$PWD"
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
87 cd $dir
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
88 echo "file: ${inputs[0]}"
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
89 #Rscript --verbose $dir/Baseline_Main.r $testID $species $substitutionModel $mutabilityModel $clonal $fixIndels $region ${inputs[0]} $workdir/ $outID 2>&1
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
90 Rscript --verbose $dir/Baseline_Main.r $testID $species $substitutionModel $mutabilityModel $clonal $fixIndels $region $fasta $workdir/ $outID 2>&1
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
91
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
92 echo "$workdir/${outID}.txt"
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
93
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
94 rows=`tail -n +2 $workdir/${outID}.txt | grep -v "All sequences combined" | grep -n 'Group' | grep -Eoh '^[0-9]+' | tr '\n' ' '`
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
95 rows=($rows)
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
96 #unset rows[${#rows[@]}-1]
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
97
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
98 cd $dir
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
99 Rscript --verbose $dir/comparePDFs.r $workdir/${outID}.RData $output ${rows[@]} 2>&1
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
100 cp $workdir/result.txt ${output_table}
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
101
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
102
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
103
e7b550d52eb7 Uploaded
davidvanzessen
parents:
diff changeset
104