annotate pal_finder_wrapper.sh @ 14:3f8bf1a0403b draft

Uploaded version with bad primer ranger detection (WIP).
author pjbriggs
date Thu, 22 Mar 2018 07:21:26 -0400
parents d26fb5260c67
children a3af1ff4cad1
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
1 #!/bin/sh
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
2 #
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
3 # pal_finder_wrapper.sh: run pal_finder perl script as a Galaxy tool
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
4 #
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
5 # Usage: run_palfinder.sh FASTQ_R1 FASTQ_R2 MICROSAT_SUMMARY PAL_SUMMARY [OPTIONS]
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
6 # run_palfinder.sh --454 FASTA MICROSAT_SUMMARY PAL_SUMMARY [OPTIONS]
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
7 #
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
8 # Options:
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
9 #
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
10 # --primer-prefix PREFIX: prefix added to the beginning of all primer names (prPrefixName)
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
11 # --2merMinReps N: minimum number of 2-mer repeat units to detect (0=ignore units of this size)
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
12 # --3merMinReps N
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
13 # --4merMinReps N
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
14 # --5merMinReps N
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
15 # --6merMinReps N
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
16 # --primer-mispriming-library FASTA: specify a Fasta file with sequences to avoid amplifying
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
17 # --primer-opt-size VALUE: optimum primer length
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
18 # --primer-min-size VALUE: minimum acceptable primer length
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
19 # --primer-max-size VALUE: maximum acceptable primer length
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
20 # --primer-min-gc VALUE: minimum allowable percentage of Gs and Cs in any primer
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
21 # --primer-max-gc VALUE: maximum allowable percentage of Gs and Cs
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
22 # --primer-gc-clamp VALUE: number of consecutive Gs and Cs at 3' end of both left and right primer
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
23 # --primer-max-end-gc VALUE: max number of Gs or Cs in last five 3' bases of left or right primer
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
24 # --primer-min-tm VALUE: minimum acceptable melting temperature (Celsius) for a primer oligo
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
25 # --primer-max-tm VALUE: maximum acceptable melting temperature (Celsius)
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
26 # --primer-opt-tm VALUE: optimum melting temperature (Celsius)
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
27 # --primer-pair-max-diff-tm VALUE: max difference between melting temps of left & right primers
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
28 # --output_config_file FNAME: write a copy of the config.txt file to FNAME
14
3f8bf1a0403b Uploaded version with bad primer ranger detection (WIP).
pjbriggs
parents: 12
diff changeset
29 # --bad_primer_ranges FNAME: write a list of the read IDs generating bad primer ranges to FNAME
3f8bf1a0403b Uploaded version with bad primer ranger detection (WIP).
pjbriggs
parents: 12
diff changeset
30 # --filter_microsats FNAME: write output of filter options to FNAME
3
1cea7b4b838f Uploaded version 0.02.04.3.
pjbriggs
parents: 1
diff changeset
31 # -assembly FNAME: run the 'assembly' filter option and write to FNAME
1cea7b4b838f Uploaded version 0.02.04.3.
pjbriggs
parents: 1
diff changeset
32 # -primers: run the 'primers' filter option
1cea7b4b838f Uploaded version 0.02.04.3.
pjbriggs
parents: 1
diff changeset
33 # -occurrences: run the 'occurrences' filter option
1cea7b4b838f Uploaded version 0.02.04.3.
pjbriggs
parents: 1
diff changeset
34 # -rankmotifs: run the 'rankmotifs' filter option
0
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
35 #
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
36 # pal_finder is available from http://sourceforge.net/projects/palfinder/
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
37 #
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
38 # primer3 is available from http://primer3.sourceforge.net/releases.php
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
39 # (nb needs version 2.0.0-alpha)
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
40 #
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
41 # Explicitly set the locations of the pal_finder script, data files and the primer3
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
42 # executable by setting the following variables in the environment:
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
43 #
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
44 # * PALFINDER_SCRIPT_DIR: location of the pal_finder Perl script (defaults to
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
45 # /usr/bin)
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
46 # * PALFINDER_DATA_DIR: location of the pal_finder data files (specifically
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
47 # config.txt and simple.ref; defaults to /usr/share/pal_finder_v0.02.04)
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
48 # * PRIMER3_CORE_EXE: name of the primer3_core program, which should include the
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
49 # full path if it's not on the Galaxy user's PATH (defaults to primer3_core)
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
50 #
1
288a74cd7a8d Explicitly build and use perl 5.16.3 as a tool dependency.
pjbriggs
parents: 0
diff changeset
51 echo "### $(basename $0) ###"
0
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
52 echo $*
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
53 #
8
67ab365c29a7 Version v0.02.04.5: handle large output files
pjbriggs
parents: 5
diff changeset
54 # Maximum number of lines when reporting log file contents
67ab365c29a7 Version v0.02.04.5: handle large output files
pjbriggs
parents: 5
diff changeset
55 MAX_LINES=500
67ab365c29a7 Version v0.02.04.5: handle large output files
pjbriggs
parents: 5
diff changeset
56 #
14
3f8bf1a0403b Uploaded version with bad primer ranger detection (WIP).
pjbriggs
parents: 12
diff changeset
57 # Get helper functions
3f8bf1a0403b Uploaded version with bad primer ranger detection (WIP).
pjbriggs
parents: 12
diff changeset
58 . $(dirname $0)/pal_finder_wrapper_utils.sh
3f8bf1a0403b Uploaded version with bad primer ranger detection (WIP).
pjbriggs
parents: 12
diff changeset
59 #
0
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
60 # Initialise locations of scripts, data and executables
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
61 #
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
62 # Set these in the environment to override at execution time
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
63 : ${PALFINDER_SCRIPT_DIR:=/usr/bin}
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
64 : ${PALFINDER_DATA_DIR:=/usr/share/pal_finder_v0.02.04}
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
65 : ${PRIMER3_CORE_EXE:=primer3_core}
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
66 #
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
67 # Filter script is in the same directory as this script
5
ef95b26a2407 Uploaded 0.02.04.4.
pjbriggs
parents: 3
diff changeset
68 PALFINDER_FILTER=$(dirname $0)/pal_filter.py
3
1cea7b4b838f Uploaded version 0.02.04.3.
pjbriggs
parents: 1
diff changeset
69 if [ ! -f $PALFINDER_FILTER ] ; then
14
3f8bf1a0403b Uploaded version with bad primer ranger detection (WIP).
pjbriggs
parents: 12
diff changeset
70 fatal No $PALFINDER_FILTER script
0
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
71 fi
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
72 #
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
73 # Check that we have all the components
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
74 if [ "$(have_program $PRIMER3_CORE_EXE)" == "no" ] ; then
14
3f8bf1a0403b Uploaded version with bad primer ranger detection (WIP).
pjbriggs
parents: 12
diff changeset
75 fatal "primer3_core missing: ${PRIMER3_CORE_EXE} not found"
0
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
76 fi
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
77 if [ ! -f "${PALFINDER_DATA_DIR}/config.txt" ] ; then
14
3f8bf1a0403b Uploaded version with bad primer ranger detection (WIP).
pjbriggs
parents: 12
diff changeset
78 fatal "pal_finder config.txt not found in ${PALFINDER_DATA_DIR}"
0
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
79 fi
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
80 if [ ! -f "${PALFINDER_SCRIPT_DIR}/pal_finder_v0.02.04.pl" ] ; then
14
3f8bf1a0403b Uploaded version with bad primer ranger detection (WIP).
pjbriggs
parents: 12
diff changeset
81 fatal "pal_finder_v0.02.04.pl not found in ${PALFINDER_SCRIPT_DIR}"
0
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
82 fi
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
83 #
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
84 # Initialise parameters used in the config.txt file
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
85 PRIMER_PREFIX="test"
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
86 MIN_2_MER_REPS=6
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
87 MIN_3_MER_REPS=0
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
88 MIN_4_MER_REPS=0
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
89 MIN_5_MER_REPS=0
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
90 MIN_6_MER_REPS=0
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
91 PRIMER_MISPRIMING_LIBRARY=$PALFINDER_DATA_DIR/simple.ref
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
92 PRIMER_OPT_SIZE=
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
93 PRIMER_MAX_SIZE=
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
94 PRIMER_MIN_SIZE=
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
95 PRIMER_MAX_GC=
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
96 PRIMER_MIN_GC=
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
97 PRIMER_GC_CLAMP=
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
98 PRIMER_MAX_END_GC=
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
99 PRIMER_OPT_TM=
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
100 PRIMER_MAX_TM=
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
101 PRIMER_MIN_TM=
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
102 PRIMER_PAIR_MAX_DIFF_TM=
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
103 OUTPUT_CONFIG_FILE=
3
1cea7b4b838f Uploaded version 0.02.04.3.
pjbriggs
parents: 1
diff changeset
104 OUTPUT_ASSEMBLY=
0
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
105 FILTERED_MICROSATS=
3
1cea7b4b838f Uploaded version 0.02.04.3.
pjbriggs
parents: 1
diff changeset
106 FILTER_OPTIONS=
14
3f8bf1a0403b Uploaded version with bad primer ranger detection (WIP).
pjbriggs
parents: 12
diff changeset
107 BAD_PRIMER_RANGES=
0
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
108 #
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
109 # Collect command line arguments
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
110 if [ $# -lt 2 ] ; then
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
111 echo "Usage: $0 FASTQ_R1 FASTQ_R2 MICROSAT_SUMMARY PAL_SUMMARY [OPTIONS]"
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
112 echo " $0 --454 FASTA MICROSAT_SUMMARY PAL_SUMMARY [OPTIONS]"
14
3f8bf1a0403b Uploaded version with bad primer ranger detection (WIP).
pjbriggs
parents: 12
diff changeset
113 fatal "Bad command line"
0
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
114 fi
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
115 if [ "$1" == "--454" ] ; then
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
116 PLATFORM="454"
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
117 FNA=$2
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
118 else
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
119 PLATFORM="Illumina"
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
120 FASTQ_R1=$1
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
121 FASTQ_R2=$2
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
122 fi
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
123 MICROSAT_SUMMARY=$3
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
124 PAL_SUMMARY=$4
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
125 shift; shift; shift; shift
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
126 #
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
127 # Collect command line options
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
128 while [ ! -z "$1" ] ; do
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
129 case "$1" in
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
130 --primer-prefix)
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
131 shift
3
1cea7b4b838f Uploaded version 0.02.04.3.
pjbriggs
parents: 1
diff changeset
132 # Convert all non-alphanumeric characters to underscores in prefix
1cea7b4b838f Uploaded version 0.02.04.3.
pjbriggs
parents: 1
diff changeset
133 PRIMER_PREFIX=$(echo -n $1 | tr -s -c "[:alnum:]" "_")
0
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
134 ;;
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
135 --2merMinReps)
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
136 shift
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
137 MIN_2_MER_REPS=$1
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
138 ;;
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
139 --3merMinReps)
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
140 shift
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
141 MIN_3_MER_REPS=$1
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
142 ;;
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
143 --4merMinReps)
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
144 shift
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
145 MIN_4_MER_REPS=$1
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
146 ;;
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
147 --5merMinReps)
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
148 shift
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
149 MIN_5_MER_REPS=$1
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
150 ;;
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
151 --6merMinReps)
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
152 shift
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
153 MIN_6_MER_REPS=$1
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
154 ;;
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
155 --primer-mispriming-library)
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
156 shift
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
157 PRIMER_MISPRIMING_LIBRARY=$1
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
158 ;;
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
159 --primer-opt-size)
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
160 shift
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
161 PRIMER_OPT_SIZE=$1
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
162 ;;
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
163 --primer-max-size)
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
164 shift
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
165 PRIMER_MAX_SIZE=$1
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
166 ;;
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
167 --primer-min-size)
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
168 shift
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
169 PRIMER_MIN_SIZE=$1
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
170 ;;
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
171 --primer-max-gc)
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
172 shift
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
173 PRIMER_MAX_GC=$1
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
174 ;;
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
175 --primer-min-gc)
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
176 shift
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
177 PRIMER_MIN_GC=$1
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
178 ;;
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
179 --primer-gc-clamp)
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
180 shift
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
181 PRIMER_GC_CLAMP=$1
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
182 ;;
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
183 --primer-max-end-gc)
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
184 shift
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
185 PRIMER_MAX_END_GC=$1
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
186 ;;
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
187 --primer-opt-tm)
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
188 shift
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
189 PRIMER_OPT_TM=$1
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
190 ;;
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
191 --primer-max-tm)
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
192 shift
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
193 PRIMER_MAX_TM=$1
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
194 ;;
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
195 --primer-min-tm)
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
196 shift
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
197 PRIMER_MIN_TM=$1
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
198 ;;
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
199 --primer-pair-max-diff-tm)
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
200 shift
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
201 PRIMER_PAIR_MAX_DIFF_TM=$1
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
202 ;;
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
203 --output_config_file)
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
204 shift
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
205 OUTPUT_CONFIG_FILE=$1
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
206 ;;
14
3f8bf1a0403b Uploaded version with bad primer ranger detection (WIP).
pjbriggs
parents: 12
diff changeset
207 --bad_primer_ranges)
3f8bf1a0403b Uploaded version with bad primer ranger detection (WIP).
pjbriggs
parents: 12
diff changeset
208 shift
3f8bf1a0403b Uploaded version with bad primer ranger detection (WIP).
pjbriggs
parents: 12
diff changeset
209 BAD_PRIMER_RANGES=$1
3f8bf1a0403b Uploaded version with bad primer ranger detection (WIP).
pjbriggs
parents: 12
diff changeset
210 ;;
0
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
211 --filter_microsats)
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
212 shift
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
213 FILTERED_MICROSATS=$1
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
214 ;;
3
1cea7b4b838f Uploaded version 0.02.04.3.
pjbriggs
parents: 1
diff changeset
215 -primers|-occurrences|-rankmotifs)
1cea7b4b838f Uploaded version 0.02.04.3.
pjbriggs
parents: 1
diff changeset
216 FILTER_OPTIONS="$FILTER_OPTIONS $1"
1cea7b4b838f Uploaded version 0.02.04.3.
pjbriggs
parents: 1
diff changeset
217 ;;
1cea7b4b838f Uploaded version 0.02.04.3.
pjbriggs
parents: 1
diff changeset
218 -assembly)
1cea7b4b838f Uploaded version 0.02.04.3.
pjbriggs
parents: 1
diff changeset
219 FILTER_OPTIONS="$FILTER_OPTIONS $1"
1cea7b4b838f Uploaded version 0.02.04.3.
pjbriggs
parents: 1
diff changeset
220 shift
1cea7b4b838f Uploaded version 0.02.04.3.
pjbriggs
parents: 1
diff changeset
221 OUTPUT_ASSEMBLY=$1
1cea7b4b838f Uploaded version 0.02.04.3.
pjbriggs
parents: 1
diff changeset
222 ;;
0
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
223 *)
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
224 echo Unknown option: $1 >&2
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
225 exit 1
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
226 ;;
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
227 esac
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
228 shift
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
229 done
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
230 #
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
231 # Check that primer3_core is available
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
232 got_primer3=`which $PRIMER3_CORE_EXE 2>&1 | grep -v "no primer3_core in"`
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
233 if [ -z "$got_primer3" ] ; then
14
3f8bf1a0403b Uploaded version with bad primer ranger detection (WIP).
pjbriggs
parents: 12
diff changeset
234 fatal "primer3_core not found"
0
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
235 fi
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
236 #
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
237 # Set up the working dir
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
238 if [ "$PLATFORM" == "Illumina" ] ; then
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
239 # Paired end Illumina data as input
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
240 if [ $FASTQ_R1 == $FASTQ_R2 ] ; then
14
3f8bf1a0403b Uploaded version with bad primer ranger detection (WIP).
pjbriggs
parents: 12
diff changeset
241 fatal ERROR R1 and R2 fastqs are the same file
0
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
242 fi
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
243 ln -s $FASTQ_R1
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
244 ln -s $FASTQ_R2
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
245 fastq_r1=$(basename $FASTQ_R1)
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
246 fastq_r2=$(basename $FASTQ_R2)
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
247 else
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
248 # 454 data as input
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
249 ln -s $FNA
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
250 fna=$(basename $FNA)
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
251 fi
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
252 ln -s $PRIMER_MISPRIMING_LIBRARY
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
253 PRIMER_MISPRIMING_LIBRARY=$(basename $PRIMER_MISPRIMING_LIBRARY)
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
254 mkdir Output
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
255 #
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
256 # Copy in the default config.txt file
1
288a74cd7a8d Explicitly build and use perl 5.16.3 as a tool dependency.
pjbriggs
parents: 0
diff changeset
257 echo "### Creating config.txt file for pal_finder run ###"
0
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
258 /bin/cp $PALFINDER_DATA_DIR/config.txt .
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
259 #
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
260 # Update the config.txt file with new values
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
261 # Input files
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
262 set_config_value platform $PLATFORM config.txt
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
263 if [ "$PLATFORM" == "Illumina" ] ; then
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
264 set_config_value inputFormat fastq config.txt
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
265 set_config_value pairedEnd 1 config.txt
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
266 set_config_value inputReadFile $fastq_r1 config.txt
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
267 set_config_value pairedReadFile $fastq_r2 config.txt
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
268 else
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
269 set_config_value inputFormat fasta config.txt
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
270 set_config_value pairedEnd 0 config.txt
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
271 set_config_value input454reads $fna config.txt
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
272 fi
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
273 # Output files
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
274 set_config_value MicrosatSumOut Output/microsat_summary.txt config.txt
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
275 set_config_value PALsummaryOut Output/PAL_summary.txt config.txt
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
276 # Microsat info
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
277 set_config_value 2merMinReps $MIN_2_MER_REPS config.txt
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
278 set_config_value 3merMinReps $MIN_3_MER_REPS config.txt
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
279 set_config_value 4merMinReps $MIN_4_MER_REPS config.txt
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
280 set_config_value 5merMinReps $MIN_5_MER_REPS config.txt
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
281 set_config_value 6merMinReps $MIN_6_MER_REPS config.txt
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
282 # Primer3 settings
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
283 set_config_value primer3input Output/pr3in.txt config.txt
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
284 set_config_value primer3output Output/pr3out.txt config.txt
14
3f8bf1a0403b Uploaded version with bad primer ranger detection (WIP).
pjbriggs
parents: 12
diff changeset
285 set_config_value keepPrimer3files 1 config.txt
0
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
286 set_config_value primer3executable $PRIMER3_CORE_EXE config.txt
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
287 set_config_value prNamePrefix ${PRIMER_PREFIX}_ config.txt
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
288 set_config_value PRIMER_MISPRIMING_LIBRARY "$PRIMER_MISPRIMING_LIBRARY" config.txt
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
289 set_config_value PRIMER_OPT_SIZE "$PRIMER_OPT_SIZE" config.txt
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
290 set_config_value PRIMER_MIN_SIZE "$PRIMER_MIN_SIZE" config.txt
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
291 set_config_value PRIMER_MAX_SIZE "$PRIMER_MAX_SIZE" config.txt
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
292 set_config_value PRIMER_MIN_GC "$PRIMER_MIN_GC" config.txt
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
293 set_config_value PRIMER_MAX_GC "$PRIMER_MAX_GC" config.txt
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
294 set_config_value PRIMER_GC_CLAMP "$PRIMER_GC_CLAMP" config.txt
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
295 set_config_value PRIMER_MAX_END_GC "$PRIMER_MAX_END_GC" config.txt
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
296 set_config_value PRIMER_MIN_TM "$PRIMER_MIN_TM" config.txt
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
297 set_config_value PRIMER_MAX_TM "$PRIMER_MAX_TM" config.txt
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
298 set_config_value PRIMER_OPT_TM "$PRIMER_OPT_TM" config.txt
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
299 set_config_value PRIMER_PAIR_MAX_DIFF_TM "$PRIMER_PAIR_MAX_DIFF_TM" config.txt
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
300 #
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
301 # Run pal_finder
1
288a74cd7a8d Explicitly build and use perl 5.16.3 as a tool dependency.
pjbriggs
parents: 0
diff changeset
302 echo "### Running pal_finder ###"
8
67ab365c29a7 Version v0.02.04.5: handle large output files
pjbriggs
parents: 5
diff changeset
303 perl $PALFINDER_SCRIPT_DIR/pal_finder_v0.02.04.pl config.txt 1>pal_finder.log 2>&1
67ab365c29a7 Version v0.02.04.5: handle large output files
pjbriggs
parents: 5
diff changeset
304 echo "### pal_finder finished ###"
67ab365c29a7 Version v0.02.04.5: handle large output files
pjbriggs
parents: 5
diff changeset
305 #
67ab365c29a7 Version v0.02.04.5: handle large output files
pjbriggs
parents: 5
diff changeset
306 # Handle the pal_finder log file
67ab365c29a7 Version v0.02.04.5: handle large output files
pjbriggs
parents: 5
diff changeset
307 echo "### Output from pal_finder ###"
67ab365c29a7 Version v0.02.04.5: handle large output files
pjbriggs
parents: 5
diff changeset
308 if [ $(wc -l pal_finder.log | cut -d" " -f1) -gt $MAX_LINES ] ; then
67ab365c29a7 Version v0.02.04.5: handle large output files
pjbriggs
parents: 5
diff changeset
309 echo WARNING output too long, truncated to last $MAX_LINES lines:
67ab365c29a7 Version v0.02.04.5: handle large output files
pjbriggs
parents: 5
diff changeset
310 echo ...
67ab365c29a7 Version v0.02.04.5: handle large output files
pjbriggs
parents: 5
diff changeset
311 fi
67ab365c29a7 Version v0.02.04.5: handle large output files
pjbriggs
parents: 5
diff changeset
312 tail -$MAX_LINES pal_finder.log
0
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
313 #
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
314 # Check that log ends with "Done!!" message
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
315 if [ -z "$(tail -n 1 pal_finder.log | grep Done!!)" ] ; then
14
3f8bf1a0403b Uploaded version with bad primer ranger detection (WIP).
pjbriggs
parents: 12
diff changeset
316 fatal ERROR pal_finder failed to complete successfully
3f8bf1a0403b Uploaded version with bad primer ranger detection (WIP).
pjbriggs
parents: 12
diff changeset
317 fi
3f8bf1a0403b Uploaded version with bad primer ranger detection (WIP).
pjbriggs
parents: 12
diff changeset
318 echo "### pal_finder finished ###"
3f8bf1a0403b Uploaded version with bad primer ranger detection (WIP).
pjbriggs
parents: 12
diff changeset
319 #
3f8bf1a0403b Uploaded version with bad primer ranger detection (WIP).
pjbriggs
parents: 12
diff changeset
320 # Check for errors in pal_finder output
3f8bf1a0403b Uploaded version with bad primer ranger detection (WIP).
pjbriggs
parents: 12
diff changeset
321 echo "### Checking for errors ###"
3f8bf1a0403b Uploaded version with bad primer ranger detection (WIP).
pjbriggs
parents: 12
diff changeset
322 if [ ! -z "$(grep 'primer3_core: Illegal element in PRIMER_PRODUCT_SIZE_RANGE' pal_finder.log)" ] ; then
3f8bf1a0403b Uploaded version with bad primer ranger detection (WIP).
pjbriggs
parents: 12
diff changeset
323 echo WARNING primer3 terminated prematurely due to bad product size ranges
3f8bf1a0403b Uploaded version with bad primer ranger detection (WIP).
pjbriggs
parents: 12
diff changeset
324 if [ -z "$BAD_PRIMER_RANGES" ] ; then
3f8bf1a0403b Uploaded version with bad primer ranger detection (WIP).
pjbriggs
parents: 12
diff changeset
325 # No output file so report to stderr
3f8bf1a0403b Uploaded version with bad primer ranger detection (WIP).
pjbriggs
parents: 12
diff changeset
326 cat >&2 <<EOF
3f8bf1a0403b Uploaded version with bad primer ranger detection (WIP).
pjbriggs
parents: 12
diff changeset
327 ERROR primer3 terminated prematurely due to bad product size ranges
3f8bf1a0403b Uploaded version with bad primer ranger detection (WIP).
pjbriggs
parents: 12
diff changeset
328
3f8bf1a0403b Uploaded version with bad primer ranger detection (WIP).
pjbriggs
parents: 12
diff changeset
329 Pal_finder generated bad ranges for the following read IDs:
3f8bf1a0403b Uploaded version with bad primer ranger detection (WIP).
pjbriggs
parents: 12
diff changeset
330 EOF
3f8bf1a0403b Uploaded version with bad primer ranger detection (WIP).
pjbriggs
parents: 12
diff changeset
331 echo $(find_bad_primer_ranges Output/pr3in.txt) >&2
3f8bf1a0403b Uploaded version with bad primer ranger detection (WIP).
pjbriggs
parents: 12
diff changeset
332 cat >&2 <<EOF
3f8bf1a0403b Uploaded version with bad primer ranger detection (WIP).
pjbriggs
parents: 12
diff changeset
333
3f8bf1a0403b Uploaded version with bad primer ranger detection (WIP).
pjbriggs
parents: 12
diff changeset
334 This error can occur when input data contains short R1 reads and
3f8bf1a0403b Uploaded version with bad primer ranger detection (WIP).
pjbriggs
parents: 12
diff changeset
335 has not been properly trimmed and filtered.
3f8bf1a0403b Uploaded version with bad primer ranger detection (WIP).
pjbriggs
parents: 12
diff changeset
336
3f8bf1a0403b Uploaded version with bad primer ranger detection (WIP).
pjbriggs
parents: 12
diff changeset
337 EOF
3f8bf1a0403b Uploaded version with bad primer ranger detection (WIP).
pjbriggs
parents: 12
diff changeset
338 else
3f8bf1a0403b Uploaded version with bad primer ranger detection (WIP).
pjbriggs
parents: 12
diff changeset
339 # Dump bad ranges to file
3f8bf1a0403b Uploaded version with bad primer ranger detection (WIP).
pjbriggs
parents: 12
diff changeset
340 echo "### Writing read IDs with bad primer ranges ###"
3f8bf1a0403b Uploaded version with bad primer ranger detection (WIP).
pjbriggs
parents: 12
diff changeset
341 echo $(find_bad_primer_ranges Output/pr3in.txt) >"$BAD_PRIMER_RANGES"
3f8bf1a0403b Uploaded version with bad primer ranger detection (WIP).
pjbriggs
parents: 12
diff changeset
342 fi
0
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
343 fi
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
344 #
12
d26fb5260c67 0.02.04.6: update to use conda to resolve dependencies.
pjbriggs
parents: 11
diff changeset
345 # Sort microsat_summary output
d26fb5260c67 0.02.04.6: update to use conda to resolve dependencies.
pjbriggs
parents: 11
diff changeset
346 echo "### Sorting microsat summary output ###"
d26fb5260c67 0.02.04.6: update to use conda to resolve dependencies.
pjbriggs
parents: 11
diff changeset
347 head -n 7 Output/microsat_summary.txt | sort >microsat_summary.sorted
d26fb5260c67 0.02.04.6: update to use conda to resolve dependencies.
pjbriggs
parents: 11
diff changeset
348 grep "^$" Output/microsat_summary.txt>>microsat_summary.sorted
d26fb5260c67 0.02.04.6: update to use conda to resolve dependencies.
pjbriggs
parents: 11
diff changeset
349 grep "^Microsat Type" Output/microsat_summary.txt >>microsat_summary.sorted
d26fb5260c67 0.02.04.6: update to use conda to resolve dependencies.
pjbriggs
parents: 11
diff changeset
350 tail -n +11 Output/microsat_summary.txt >>microsat_summary.sorted
d26fb5260c67 0.02.04.6: update to use conda to resolve dependencies.
pjbriggs
parents: 11
diff changeset
351 mv microsat_summary.sorted Output/microsat_summary.txt
d26fb5260c67 0.02.04.6: update to use conda to resolve dependencies.
pjbriggs
parents: 11
diff changeset
352 #
d26fb5260c67 0.02.04.6: update to use conda to resolve dependencies.
pjbriggs
parents: 11
diff changeset
353 # Sort PAL_summary output
d26fb5260c67 0.02.04.6: update to use conda to resolve dependencies.
pjbriggs
parents: 11
diff changeset
354 echo "### Sorting PAL summary output ###"
3
1cea7b4b838f Uploaded version 0.02.04.3.
pjbriggs
parents: 1
diff changeset
355 head -1 Output/PAL_summary.txt > Output/PAL_summary.sorted.txt
1cea7b4b838f Uploaded version 0.02.04.3.
pjbriggs
parents: 1
diff changeset
356 if [ "$PLATFORM" == "Illumina" ] ; then
1cea7b4b838f Uploaded version 0.02.04.3.
pjbriggs
parents: 1
diff changeset
357 grep -v "^readPairID" Output/PAL_summary.txt | sort -k 1 >> Output/PAL_summary.sorted.txt
1cea7b4b838f Uploaded version 0.02.04.3.
pjbriggs
parents: 1
diff changeset
358 else
1cea7b4b838f Uploaded version 0.02.04.3.
pjbriggs
parents: 1
diff changeset
359 grep -v "^SequenceID" Output/PAL_summary.txt | sort -k 1 >> Output/PAL_summary.sorted.txt
1cea7b4b838f Uploaded version 0.02.04.3.
pjbriggs
parents: 1
diff changeset
360 fi
1cea7b4b838f Uploaded version 0.02.04.3.
pjbriggs
parents: 1
diff changeset
361 mv Output/PAL_summary.sorted.txt Output/PAL_summary.txt
1cea7b4b838f Uploaded version 0.02.04.3.
pjbriggs
parents: 1
diff changeset
362 #
1cea7b4b838f Uploaded version 0.02.04.3.
pjbriggs
parents: 1
diff changeset
363 # Run the filtering & assembly script
1cea7b4b838f Uploaded version 0.02.04.3.
pjbriggs
parents: 1
diff changeset
364 if [ ! -z "$FILTERED_MICROSATS" ] || [ ! -z "$OUTPUT_ASSEMBLY" ] ; then
1cea7b4b838f Uploaded version 0.02.04.3.
pjbriggs
parents: 1
diff changeset
365 echo "### Running filtering & assembly script ###"
8
67ab365c29a7 Version v0.02.04.5: handle large output files
pjbriggs
parents: 5
diff changeset
366 python $PALFINDER_FILTER -i $fastq_r1 -j $fastq_r2 -p Output/PAL_summary.txt $FILTER_OPTIONS 1>pal_filter.log 2>&1
67ab365c29a7 Version v0.02.04.5: handle large output files
pjbriggs
parents: 5
diff changeset
367 echo "### Output from pal_filter ###"
67ab365c29a7 Version v0.02.04.5: handle large output files
pjbriggs
parents: 5
diff changeset
368 if [ $(wc -l pal_filter.log | cut -d" " -f1) -gt $MAX_LINES ] ; then
67ab365c29a7 Version v0.02.04.5: handle large output files
pjbriggs
parents: 5
diff changeset
369 echo WARNING output too long, truncated to last $MAX_LINES lines:
67ab365c29a7 Version v0.02.04.5: handle large output files
pjbriggs
parents: 5
diff changeset
370 echo ...
67ab365c29a7 Version v0.02.04.5: handle large output files
pjbriggs
parents: 5
diff changeset
371 fi
67ab365c29a7 Version v0.02.04.5: handle large output files
pjbriggs
parents: 5
diff changeset
372 tail -$MAX_LINES pal_filter.log
0
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
373 if [ $? -ne 0 ] ; then
14
3f8bf1a0403b Uploaded version with bad primer ranger detection (WIP).
pjbriggs
parents: 12
diff changeset
374 fatal $PALFINDER_FILTER exited with non-zero status
3
1cea7b4b838f Uploaded version 0.02.04.3.
pjbriggs
parents: 1
diff changeset
375 elif [ ! -f PAL_summary.filtered ] ; then
14
3f8bf1a0403b Uploaded version with bad primer ranger detection (WIP).
pjbriggs
parents: 12
diff changeset
376 fatal no output from $PALFINDER_FILTER
0
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
377 fi
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
378 fi
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
379 #
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
380 # Clean up
1
288a74cd7a8d Explicitly build and use perl 5.16.3 as a tool dependency.
pjbriggs
parents: 0
diff changeset
381 echo "### Handling output files ###"
0
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
382 if [ -f Output/microsat_summary.txt ] ; then
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
383 /bin/mv Output/microsat_summary.txt $MICROSAT_SUMMARY
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
384 fi
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
385 if [ -f Output/PAL_summary.txt ] ; then
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
386 /bin/mv Output/PAL_summary.txt $PAL_SUMMARY
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
387 fi
3
1cea7b4b838f Uploaded version 0.02.04.3.
pjbriggs
parents: 1
diff changeset
388 if [ ! -z "$FILTERED_MICROSATS" ] && [ -f PAL_summary.filtered ] ; then
1cea7b4b838f Uploaded version 0.02.04.3.
pjbriggs
parents: 1
diff changeset
389 /bin/mv PAL_summary.filtered $FILTERED_MICROSATS
1cea7b4b838f Uploaded version 0.02.04.3.
pjbriggs
parents: 1
diff changeset
390 fi
1cea7b4b838f Uploaded version 0.02.04.3.
pjbriggs
parents: 1
diff changeset
391 if [ ! -z "$OUTPUT_ASSEMBLY" ] ; then
5
ef95b26a2407 Uploaded 0.02.04.4.
pjbriggs
parents: 3
diff changeset
392 assembly=${fastq_r1%.*}_pal_filter_assembly_output.txt
3
1cea7b4b838f Uploaded version 0.02.04.3.
pjbriggs
parents: 1
diff changeset
393 if [ -f "$assembly" ] ; then
1cea7b4b838f Uploaded version 0.02.04.3.
pjbriggs
parents: 1
diff changeset
394 /bin/mv $assembly "$OUTPUT_ASSEMBLY"
5
ef95b26a2407 Uploaded 0.02.04.4.
pjbriggs
parents: 3
diff changeset
395 else
14
3f8bf1a0403b Uploaded version with bad primer ranger detection (WIP).
pjbriggs
parents: 12
diff changeset
396 fatal no assembly output found
3
1cea7b4b838f Uploaded version 0.02.04.3.
pjbriggs
parents: 1
diff changeset
397 fi
0
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
398 fi
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
399 if [ ! -z "$OUTPUT_CONFIG_FILE" ] && [ -f config.txt ] ; then
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
400 /bin/mv config.txt $OUTPUT_CONFIG_FILE
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
401 fi
8
67ab365c29a7 Version v0.02.04.5: handle large output files
pjbriggs
parents: 5
diff changeset
402 #
67ab365c29a7 Version v0.02.04.5: handle large output files
pjbriggs
parents: 5
diff changeset
403 echo "### Pal_finder tool completed ###"
0
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
404 ##
1dac42bb7aab First version pushed to test toolshed.
pjbriggs
parents:
diff changeset
405 #