annotate defuse.xml @ 45:aedaa66483f1 draft

Uploaded
author jjohnson
date Wed, 18 Oct 2017 16:55:57 -0400
parents 225750bf3770
children e500b50b72fd
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
44
225750bf3770 Uploaded
jjohnson
parents: 35
diff changeset
1 <tool id="defuse" name="DeFuse" version="@DEFUSE_VERSION@.1">
225750bf3770 Uploaded
jjohnson
parents: 35
diff changeset
2 <description>identify fusion transcripts</description>
225750bf3770 Uploaded
jjohnson
parents: 35
diff changeset
3 <macros>
225750bf3770 Uploaded
jjohnson
parents: 35
diff changeset
4 <import>macros.xml</import>
225750bf3770 Uploaded
jjohnson
parents: 35
diff changeset
5 </macros>
225750bf3770 Uploaded
jjohnson
parents: 35
diff changeset
6 <requirements>
225750bf3770 Uploaded
jjohnson
parents: 35
diff changeset
7 <expand macro="defuse_requirement" />
225750bf3770 Uploaded
jjohnson
parents: 35
diff changeset
8 </requirements>
45
aedaa66483f1 Uploaded
jjohnson
parents: 44
diff changeset
9 <command><![CDATA[
aedaa66483f1 Uploaded
jjohnson
parents: 44
diff changeset
10 #if $defuse_out.__str__ != 'None':
aedaa66483f1 Uploaded
jjohnson
parents: 44
diff changeset
11 ## ln to output_dir in from_work_dir
aedaa66483f1 Uploaded
jjohnson
parents: 44
diff changeset
12 mkdir -p $defuse_out.dataset.extra_files_path &&
aedaa66483f1 Uploaded
jjohnson
parents: 44
diff changeset
13 ln -s $defuse_out.dataset.extra_files_path output_dir &&
aedaa66483f1 Uploaded
jjohnson
parents: 44
diff changeset
14 #else
aedaa66483f1 Uploaded
jjohnson
parents: 44
diff changeset
15 mkdir -p output_dir &&
aedaa66483f1 Uploaded
jjohnson
parents: 44
diff changeset
16 #end if
aedaa66483f1 Uploaded
jjohnson
parents: 44
diff changeset
17 ## Put executable paths in config file
aedaa66483f1 Uploaded
jjohnson
parents: 44
diff changeset
18 $__tool_directory__/config_sub.sh $defuse_config output_dir/defuse.cfg &&
aedaa66483f1 Uploaded
jjohnson
parents: 44
diff changeset
19 ## copy config to output
aedaa66483f1 Uploaded
jjohnson
parents: 44
diff changeset
20 cp defuse.cfg $config_txt &&
aedaa66483f1 Uploaded
jjohnson
parents: 44
diff changeset
21 ## make a data_dir and ln -s the input fastq
aedaa66483f1 Uploaded
jjohnson
parents: 44
diff changeset
22 mkdir -p data_dir &&
aedaa66483f1 Uploaded
jjohnson
parents: 44
diff changeset
23 ln -s "$left_pairendreads" data_dir/reads_1.fastq &&
aedaa66483f1 Uploaded
jjohnson
parents: 44
diff changeset
24 ln -s "$right_pairendreads" data_dir/reads_2.fastq &&
aedaa66483f1 Uploaded
jjohnson
parents: 44
diff changeset
25 ## run
aedaa66483f1 Uploaded
jjohnson
parents: 44
diff changeset
26 perl defuse_run.pl --name "$library_name" --config defuse.cfg -1 data_dir/reads_1.fastq -2 data_dir/reads_2.fastq -o output_dir -p \$GALAXY_SLOTS &&
aedaa66483f1 Uploaded
jjohnson
parents: 44
diff changeset
27 grep -v cluster_id output_dir/results.filtered.tsv | awk '{print $1}' > cluster_id_list &&
aedaa66483f1 Uploaded
jjohnson
parents: 44
diff changeset
28 get_fusion_fastq.pl --list cluster_id_list --output output_dir --fastq1 results.fusions_1.fq --fastq2 results.fusions_2.fq &&
aedaa66483f1 Uploaded
jjohnson
parents: 44
diff changeset
29 cp output_dir/results.* . &&
aedaa66483f1 Uploaded
jjohnson
parents: 44
diff changeset
30 cp `find output_dir -name defuse.log` $defuse_log
aedaa66483f1 Uploaded
jjohnson
parents: 44
diff changeset
31 #if $defuse_out.__str__ != 'None':
aedaa66483f1 Uploaded
jjohnson
parents: 44
diff changeset
32 && $__tool_directory__/make_html.sh $defuse_out $defuse_out.dataset.extra_files_path
aedaa66483f1 Uploaded
jjohnson
parents: 44
diff changeset
33 #end if
aedaa66483f1 Uploaded
jjohnson
parents: 44
diff changeset
34 ]]></command>
0
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
35 <inputs>
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
36 <param name="left_pairendreads" type="data" format="fastq" label="left part of read pairs" help="The left and right reads pairs must be in the same order, and not have any unpaired reads. (FASTQ interlacer will pair reads and remove the unpaired. FASTQ de-interlacer will separate the result into left and right reads.)"/>
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
37 <param name="right_pairendreads" type="data" format="fastq" label="right part of read pairs" help="In the same order as the left reads"/>
27
d57fcac025e2 Add more info fields to defuse_results_to_vcf.py
Jim Johnson <jj@umn.edu>
parents: 25
diff changeset
38 <param name="library_name" type="text" value="unknown" label="library name" help="Value to put in the results library_name column">
d57fcac025e2 Add more info fields to defuse_results_to_vcf.py
Jim Johnson <jj@umn.edu>
parents: 25
diff changeset
39 <validator type="length" min="1"/>
d57fcac025e2 Add more info fields to defuse_results_to_vcf.py
Jim Johnson <jj@umn.edu>
parents: 25
diff changeset
40 </param>
0
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
41 <conditional name="refGenomeSource">
19
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
42 <param name="genomeSource" type="select" label="Will you select a built-in DeFuse Reference Dataset, or supply a configuration from your history" help="">
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
43 <option value="indexed">Use a built-in DeFuse Reference Dataset</option>
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
44 <option value="history">Use a configuration from your history that specifies the DeFuse Reference Dataset</option>
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
45 </param>
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
46 <when value="indexed">
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
47 <param name="index" type="select" label="Select a Reference Dataset" help="if your genome of interest is not listed - contact Galaxy team">
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
48 <options from_file="defuse_reference.loc">
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
49 <column name="name" index="1"/>
22
68494d6aabeb Update datamanager and defuse.xml config file generation
Jim Johnson <jj@umn.edu>
parents: 19
diff changeset
50 <column name="value" index="3"/>
19
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
51 <filter type="sort_by" column="0" />
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
52 <validator type="no_options" message="No indexes are available" />
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
53 </options>
0
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
54 </param>
19
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
55 </when>
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
56 <when value="history">
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
57 <param name="config" type="data" format="defuse.conf" label="Defuse Config file" help=""/>
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
58 </when> <!-- history -->
0
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
59 </conditional> <!-- refGenomeSource -->
19
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
60 <conditional name="defuse_param">
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
61 <param name="settings" type="select" label="Defuse parameter settings" help="">
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
62 <option value="preSet">Default settings</option>
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
63 <option value="full">Full parameter list</option>
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
64 </param>
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
65 <when value="preSet" />
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
66 <when value="full">
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
67 <param name="max_insert_size" type="integer" value="500" optional="true" label="Bowtie max_insert_size" />
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
68 <param name="dna_concordant_length" type="integer" value="2000" optional="true" label="Minimum gene fusion range dna_concordant_length" />
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
69 <param name="discord_read_trim" type="integer" value="50" optional="true" label="Trim length for discordant reads discord_read_trim" help="(split reads are not trimmed)" />
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
70 <param name="calculate_extra_annotations" type="select" label="Calculate extra annotations, fusion splice index and interrupted index" help="">
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
71 <option value="">Use Default</option>
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
72 <option value="no">no</option>
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
73 <option value="yes">yes</option>
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
74 </param>
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
75 <param name="clustering_precision" type="float" value=".95" optional="true" label="Filter clustering_precision">
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
76 <validator type="in_range" message="Choose a value between .1 and 1.0" min=".1" max="1"/>
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
77 </param>
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
78 <param name="span_count_threshold" type="integer" value="5" optional="true" label="Filter span_count_threshold" />
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
79 <param name="percent_identity_threshold" type="float" value=".90" optional="true" label="Filter percent_identity_threshold">
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
80 <validator type="in_range" message="Choose a value between .1 and 1.0" min=".1" max="1"/>
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
81 </param>
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
82 <param name="split_min_anchor" type="integer" value="4" optional="true" label="Filter split_min_anchor" />
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
83 <param name="splice_bias" type="integer" value="10" optional="true" label="Filter splice_bias" />
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
84 <param name="probability_threshold" type="float" value="0.50" optional="true" label="Filter probability_threshold">
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
85 <validator type="in_range" message="Choose a value between 0.0 and 1.0" min="0" max="1"/>
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
86 </param>
45
aedaa66483f1 Uploaded
jjohnson
parents: 44
diff changeset
87 <param name="multi_exon_transcripts_stats" type="select" label="Use multiple exon transcripts for stats calculations" help="should be enabled for very small libraries">
aedaa66483f1 Uploaded
jjohnson
parents: 44
diff changeset
88 <option value="no" select="true">no</option>
aedaa66483f1 Uploaded
jjohnson
parents: 44
diff changeset
89 <option value="yes">yes</option>
aedaa66483f1 Uploaded
jjohnson
parents: 44
diff changeset
90 </param>
19
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
91 <param name="covariance_sampling_density" type="float" value="0.01" optional="true" label="covariance_sampling_density">
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
92 <help>Position density when calculating covariance</help>
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
93 <validator type="in_range" message="Choose a value between 0.0 and 1.0" min="0" max="1"/>
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
94 </param>
45
aedaa66483f1 Uploaded
jjohnson
parents: 44
diff changeset
95 <param name="max_paired_alignments" type="integer" value="10" optional="true" label="max_paired_alignments">
aedaa66483f1 Uploaded
jjohnson
parents: 44
diff changeset
96 <help>Maximum number of alignments for a read pair, Pairs with more alignments are filtered, default is 10</help>
aedaa66483f1 Uploaded
jjohnson
parents: 44
diff changeset
97 <validator type="in_range" message="Choose a value between 0.0 and 1.0" min="1" max="100"/>
aedaa66483f1 Uploaded
jjohnson
parents: 44
diff changeset
98 </param>
19
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
99 <param name="denovo_assembly" type="select" label="denovo_assembly" help="">
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
100 <option value="">Use Default</option>
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
101 <option value="no">no</option>
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
102 <option value="yes">yes</option>
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
103 </param>
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
104 <!--
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
105 <param name="positive_controls" type="data" format="txt" optional=true label="Defuse positive_controls" help=""/>
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
106 -->
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
107 <param name="reads_per_job" type="integer" value="1000000" optional="true" label="Number of reads for each job in split" />
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
108 </when> <!-- full -->
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
109 </conditional> <!-- defuse_param -->
5
87033f379b99 Edit labels and help.
Jim Johnson <jj@umn.edu>
parents: 4
diff changeset
110 <param name="keep_output" type="boolean" checked="true" truevalue="yes" falsevalue="no" label="Save DeFuse working directory files"
87033f379b99 Edit labels and help.
Jim Johnson <jj@umn.edu>
parents: 4
diff changeset
111 help="The defuse output working directory can be helpful for determining errors that may have occurred during the run,
87033f379b99 Edit labels and help.
Jim Johnson <jj@umn.edu>
parents: 4
diff changeset
112 but they require considerable diskspace, and should be deleted and purged when no longer needed."/>
45
aedaa66483f1 Uploaded
jjohnson
parents: 44
diff changeset
113 <param name="breakpoints_bam" type="boolean" checked="false" truevalue="yes" falsevalue="no" label="Generate a Bam file for the fusions"/>
44
225750bf3770 Uploaded
jjohnson
parents: 35
diff changeset
114 <param name="do_get_reads" type="boolean" checked="false" truevalue="yes" falsevalue="no" label="Run get_reads on each cluster"/>
0
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
115 </inputs>
5
87033f379b99 Edit labels and help.
Jim Johnson <jj@umn.edu>
parents: 4
diff changeset
116 <outputs>
87033f379b99 Edit labels and help.
Jim Johnson <jj@umn.edu>
parents: 4
diff changeset
117 <data format="txt" name="config_txt" label="${tool.name} on ${on_string}: config.txt"/>
87033f379b99 Edit labels and help.
Jim Johnson <jj@umn.edu>
parents: 4
diff changeset
118 <data format="txt" name="defuse_log" label="${tool.name} on ${on_string}: defuse.log" />
87033f379b99 Edit labels and help.
Jim Johnson <jj@umn.edu>
parents: 4
diff changeset
119 <data format="html" name="defuse_out" label="${tool.name} on ${on_string}: defuse_output (purge when no longer needed)">
87033f379b99 Edit labels and help.
Jim Johnson <jj@umn.edu>
parents: 4
diff changeset
120 <filter>keep_output == True</filter>
87033f379b99 Edit labels and help.
Jim Johnson <jj@umn.edu>
parents: 4
diff changeset
121 </data>
45
aedaa66483f1 Uploaded
jjohnson
parents: 44
diff changeset
122 <data format="defuse.results.tsv" name="results_classify_tsv" label="${tool.name} on ${on_string}: results.classify.tsv" from_work_dir="results.classify.tsv"/>
aedaa66483f1 Uploaded
jjohnson
parents: 44
diff changeset
123 <data format="defuse.results.tsv" name="results_filtered_tsv" label="${tool.name} on ${on_string}: results.filtered.tsv" from_work_dir="results.filtered.tsv"/>
aedaa66483f1 Uploaded
jjohnson
parents: 44
diff changeset
124 <data format="fastqsanger" name="results_fusions1_fq" label="${tool.name} on ${on_string}: fusions_1.fq" from_work_dir="results.fusions_1.fq" />
aedaa66483f1 Uploaded
jjohnson
parents: 44
diff changeset
125 <data format="fastqsanger" name="results_fusions2_fq" label="${tool.name} on ${on_string}: fusions_2.fq" from_work_dir="results.fusions_2.fq" />
19
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
126 <!--
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
127 expression_plot
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
128 circos plot
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
129 -->
5
87033f379b99 Edit labels and help.
Jim Johnson <jj@umn.edu>
parents: 4
diff changeset
130 </outputs>
0
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
131 <configfiles>
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
132 <configfile name="defuse_config">
19
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
133 #import re
0
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
134 #if $refGenomeSource.genomeSource == "history":
19
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
135 #set config_file = $refGenomeSource.config.__str__
0
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
136 #else
19
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
137 #set config_file = $refGenomeSource.index.value
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
138 #end if
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
139 #set pat = '^\s*([^#=][^=]*?)\s*=\s*(.*?)\s*$'
22
68494d6aabeb Update datamanager and defuse.xml config file generation
Jim Johnson <jj@umn.edu>
parents: 19
diff changeset
140 #set fh = open($config_file)
19
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
141 #set keys = ['dataset_directory','ensembl_organism','ensembl_prefix','ensembl_version','ensembl_genome_version','ucsc_genome_version','ncbi_organism','ncbi_prefix','chromosomes','mt_chromosome','gene_sources','ig_gene_sources','rrna_gene_sources']
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
142 #set kv = []
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
143 #for $line in $fh:
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
144 #set m = $re.match($pat,$line)
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
145 #if $m and len($m.groups()) == 2:
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
146 ## #echo $line
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
147 #if $m.groups()[0] in keys:
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
148 #set k = $m.groups()[0]
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
149 #if k == 'dataset_directory' and $refGenomeSource.genomeSource == "indexed":
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
150 ## The DataManager is conifgured to place the config file in the same directory as the defuse_data: dataset_directory
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
151 #set v = $os.path.dirname($config_file)
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
152 #else:
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
153 #set v = $m.groups()[1]
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
154 #end if
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
155 #set kv = $kv + [[$k, $v]]
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
156 #end if
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
157 #end if
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
158 #end for
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
159 ## #echo $kv
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
160 #set ref_dict = dict($kv)
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
161 ## #echo $ref_dict
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
162 ## include raw $refGenomeSource.config.__str__
0
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
163 #
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
164 # Configuration file for defuse
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
165 #
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
166 # At a minimum, change all values enclused by []
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
167 #
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
168
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
169 # Directory where the defuse code was unpacked
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
170 ## Default location in the tool/defuse directory
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
171 # source_directory = ${__root_dir__}/tools/defuse
19
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
172 source_directory = __DEFUSE_PATH__
0
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
173
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
174 # Directory where you want your dataset
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
175 dataset_directory = #slurp
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
176 #try
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
177 $ref_dict['dataset_directory']
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
178 #except
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
179 /project/db/genomes/Hsapiens/hg19/defuse
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
180 #end try
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
181
22
68494d6aabeb Update datamanager and defuse.xml config file generation
Jim Johnson <jj@umn.edu>
parents: 19
diff changeset
182 # Organism IDs
68494d6aabeb Update datamanager and defuse.xml config file generation
Jim Johnson <jj@umn.edu>
parents: 19
diff changeset
183 ensembl_organism = #slurp
68494d6aabeb Update datamanager and defuse.xml config file generation
Jim Johnson <jj@umn.edu>
parents: 19
diff changeset
184 #try
68494d6aabeb Update datamanager and defuse.xml config file generation
Jim Johnson <jj@umn.edu>
parents: 19
diff changeset
185 $ref_dict['ensembl_organism']
68494d6aabeb Update datamanager and defuse.xml config file generation
Jim Johnson <jj@umn.edu>
parents: 19
diff changeset
186 #except
68494d6aabeb Update datamanager and defuse.xml config file generation
Jim Johnson <jj@umn.edu>
parents: 19
diff changeset
187 homo_sapiens
68494d6aabeb Update datamanager and defuse.xml config file generation
Jim Johnson <jj@umn.edu>
parents: 19
diff changeset
188 #end try
68494d6aabeb Update datamanager and defuse.xml config file generation
Jim Johnson <jj@umn.edu>
parents: 19
diff changeset
189
68494d6aabeb Update datamanager and defuse.xml config file generation
Jim Johnson <jj@umn.edu>
parents: 19
diff changeset
190 ensembl_prefix = #slurp
68494d6aabeb Update datamanager and defuse.xml config file generation
Jim Johnson <jj@umn.edu>
parents: 19
diff changeset
191 #try
68494d6aabeb Update datamanager and defuse.xml config file generation
Jim Johnson <jj@umn.edu>
parents: 19
diff changeset
192 $ref_dict['ensembl_prefix']
68494d6aabeb Update datamanager and defuse.xml config file generation
Jim Johnson <jj@umn.edu>
parents: 19
diff changeset
193 #except
68494d6aabeb Update datamanager and defuse.xml config file generation
Jim Johnson <jj@umn.edu>
parents: 19
diff changeset
194 Homo_sapiens
68494d6aabeb Update datamanager and defuse.xml config file generation
Jim Johnson <jj@umn.edu>
parents: 19
diff changeset
195 #end try
68494d6aabeb Update datamanager and defuse.xml config file generation
Jim Johnson <jj@umn.edu>
parents: 19
diff changeset
196
68494d6aabeb Update datamanager and defuse.xml config file generation
Jim Johnson <jj@umn.edu>
parents: 19
diff changeset
197 ensembl_version = #slurp
68494d6aabeb Update datamanager and defuse.xml config file generation
Jim Johnson <jj@umn.edu>
parents: 19
diff changeset
198 #try
68494d6aabeb Update datamanager and defuse.xml config file generation
Jim Johnson <jj@umn.edu>
parents: 19
diff changeset
199 $ref_dict['ensembl_version']
68494d6aabeb Update datamanager and defuse.xml config file generation
Jim Johnson <jj@umn.edu>
parents: 19
diff changeset
200 #except
68494d6aabeb Update datamanager and defuse.xml config file generation
Jim Johnson <jj@umn.edu>
parents: 19
diff changeset
201 71
68494d6aabeb Update datamanager and defuse.xml config file generation
Jim Johnson <jj@umn.edu>
parents: 19
diff changeset
202 #end try
68494d6aabeb Update datamanager and defuse.xml config file generation
Jim Johnson <jj@umn.edu>
parents: 19
diff changeset
203
68494d6aabeb Update datamanager and defuse.xml config file generation
Jim Johnson <jj@umn.edu>
parents: 19
diff changeset
204 ensembl_genome_version = #slurp
68494d6aabeb Update datamanager and defuse.xml config file generation
Jim Johnson <jj@umn.edu>
parents: 19
diff changeset
205 #try
68494d6aabeb Update datamanager and defuse.xml config file generation
Jim Johnson <jj@umn.edu>
parents: 19
diff changeset
206 $ref_dict['ensembl_genome_version']
68494d6aabeb Update datamanager and defuse.xml config file generation
Jim Johnson <jj@umn.edu>
parents: 19
diff changeset
207 #except
68494d6aabeb Update datamanager and defuse.xml config file generation
Jim Johnson <jj@umn.edu>
parents: 19
diff changeset
208 GRCh37
68494d6aabeb Update datamanager and defuse.xml config file generation
Jim Johnson <jj@umn.edu>
parents: 19
diff changeset
209 #end try
68494d6aabeb Update datamanager and defuse.xml config file generation
Jim Johnson <jj@umn.edu>
parents: 19
diff changeset
210
68494d6aabeb Update datamanager and defuse.xml config file generation
Jim Johnson <jj@umn.edu>
parents: 19
diff changeset
211 ucsc_genome_version = #slurp
68494d6aabeb Update datamanager and defuse.xml config file generation
Jim Johnson <jj@umn.edu>
parents: 19
diff changeset
212 #try
68494d6aabeb Update datamanager and defuse.xml config file generation
Jim Johnson <jj@umn.edu>
parents: 19
diff changeset
213 $ref_dict['ucsc_genome_version']
68494d6aabeb Update datamanager and defuse.xml config file generation
Jim Johnson <jj@umn.edu>
parents: 19
diff changeset
214 #except
68494d6aabeb Update datamanager and defuse.xml config file generation
Jim Johnson <jj@umn.edu>
parents: 19
diff changeset
215 hg19
68494d6aabeb Update datamanager and defuse.xml config file generation
Jim Johnson <jj@umn.edu>
parents: 19
diff changeset
216 #end try
68494d6aabeb Update datamanager and defuse.xml config file generation
Jim Johnson <jj@umn.edu>
parents: 19
diff changeset
217
68494d6aabeb Update datamanager and defuse.xml config file generation
Jim Johnson <jj@umn.edu>
parents: 19
diff changeset
218 ncbi_organism = #slurp
68494d6aabeb Update datamanager and defuse.xml config file generation
Jim Johnson <jj@umn.edu>
parents: 19
diff changeset
219 #try
68494d6aabeb Update datamanager and defuse.xml config file generation
Jim Johnson <jj@umn.edu>
parents: 19
diff changeset
220 $ref_dict['ncbi_organism']
68494d6aabeb Update datamanager and defuse.xml config file generation
Jim Johnson <jj@umn.edu>
parents: 19
diff changeset
221 #except
68494d6aabeb Update datamanager and defuse.xml config file generation
Jim Johnson <jj@umn.edu>
parents: 19
diff changeset
222 Homo_sapiens
68494d6aabeb Update datamanager and defuse.xml config file generation
Jim Johnson <jj@umn.edu>
parents: 19
diff changeset
223 #end try
68494d6aabeb Update datamanager and defuse.xml config file generation
Jim Johnson <jj@umn.edu>
parents: 19
diff changeset
224
68494d6aabeb Update datamanager and defuse.xml config file generation
Jim Johnson <jj@umn.edu>
parents: 19
diff changeset
225 ncbi_prefix = #slurp
68494d6aabeb Update datamanager and defuse.xml config file generation
Jim Johnson <jj@umn.edu>
parents: 19
diff changeset
226 #try
68494d6aabeb Update datamanager and defuse.xml config file generation
Jim Johnson <jj@umn.edu>
parents: 19
diff changeset
227 $ref_dict['ncbi_prefix']
68494d6aabeb Update datamanager and defuse.xml config file generation
Jim Johnson <jj@umn.edu>
parents: 19
diff changeset
228 #except
68494d6aabeb Update datamanager and defuse.xml config file generation
Jim Johnson <jj@umn.edu>
parents: 19
diff changeset
229 Hs
68494d6aabeb Update datamanager and defuse.xml config file generation
Jim Johnson <jj@umn.edu>
parents: 19
diff changeset
230 #end try
68494d6aabeb Update datamanager and defuse.xml config file generation
Jim Johnson <jj@umn.edu>
parents: 19
diff changeset
231
0
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
232 # Input genome and gene models
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
233 gene_models = #slurp
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
234 #try
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
235 $ref_dict['gene_models']
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
236 #except
22
68494d6aabeb Update datamanager and defuse.xml config file generation
Jim Johnson <jj@umn.edu>
parents: 19
diff changeset
237 \$(dataset_directory)/\$(ensembl_prefix).\$(ensembl_genome_version).\$(ensembl_version).gtf
0
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
238 #end try
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
239 genome_fasta = #slurp
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
240 #try
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
241 $ref_dict['genome_fasta']
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
242 #except
22
68494d6aabeb Update datamanager and defuse.xml config file generation
Jim Johnson <jj@umn.edu>
parents: 19
diff changeset
243 \$(dataset_directory)/\$(ensembl_prefix).\$(ensembl_genome_version).\$(ensembl_version).dna.chromosomes.fa
0
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
244 #end try
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
245
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
246 # Repeat table from ucsc genome browser
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
247 repeats_filename = #slurp
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
248 #try
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
249 $ref_dict['repeats_filename']
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
250 #except
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
251 \$(dataset_directory)/rmsk.txt
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
252 #end try
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
253
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
254 # EST info downloaded from ucsc genome browser
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
255 est_fasta = #slurp
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
256 #try
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
257 $ref_dict['est_fasta']
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
258 #except
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
259 \$(dataset_directory)/est.fa
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
260 #end try
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
261 est_alignments = #slurp
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
262 #try
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
263 $ref_dict['est_alignments']
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
264 #except
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
265 \$(dataset_directory)/intronEst.txt
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
266 #end try
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
267
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
268 # Unigene clusters downloaded from ncbi
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
269 unigene_fasta = #slurp
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
270 #try
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
271 $ref_dict['unigene_fasta']
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
272 #except
23
e8fc5de0578b defuse.xml fix unigene_fasta path to use ncbi_prefix
Jim Johnson <jj@umn.edu>
parents: 22
diff changeset
273 \$(dataset_directory)/\$(ncbi_prefix).seq.uniq
0
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
274 #end try
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
275
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
276 # Paths to external tools
19
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
277 bowtie_bin = __BOWTIE_BIN__
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
278 bowtie_build_bin = __BOWTIE_BUILD_BIN__
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
279 blat_bin = __BLAT_BIN__
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
280 fatotwobit_bin = __FATOTWOBIT_BIN__
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
281 gmap_bin = __GMAP_BIN__
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
282 gmap_bin = __GMAP_BIN__
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
283 gmap_setup_bin = __GMAP_SETUP_BIN__
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
284 r_bin = __R_BIN__
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
285 rscript_bin = __RSCRIPT_BIN__
0
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
286
7
f4eadbd2e7c1 Add gmap_setup_bin and gmap_index_directory to defuse.xml config file generation
Jim Johnson <jj@umn.edu>
parents: 6
diff changeset
287 # Directory where you want your dataset
f4eadbd2e7c1 Add gmap_setup_bin and gmap_index_directory to defuse.xml config file generation
Jim Johnson <jj@umn.edu>
parents: 6
diff changeset
288 gmap_index_directory = #slurp
f4eadbd2e7c1 Add gmap_setup_bin and gmap_index_directory to defuse.xml config file generation
Jim Johnson <jj@umn.edu>
parents: 6
diff changeset
289 #try
f4eadbd2e7c1 Add gmap_setup_bin and gmap_index_directory to defuse.xml config file generation
Jim Johnson <jj@umn.edu>
parents: 6
diff changeset
290 $ref_dict['gmap_index_directory']
f4eadbd2e7c1 Add gmap_setup_bin and gmap_index_directory to defuse.xml config file generation
Jim Johnson <jj@umn.edu>
parents: 6
diff changeset
291 #except
12
33e2235bf003 Add create_reference_dataset.xml
Jim Johnson <jj@umn.edu>
parents: 10
diff changeset
292 #raw
33e2235bf003 Add create_reference_dataset.xml
Jim Johnson <jj@umn.edu>
parents: 10
diff changeset
293 $(dataset_directory)/gmap
33e2235bf003 Add create_reference_dataset.xml
Jim Johnson <jj@umn.edu>
parents: 10
diff changeset
294 #end raw
7
f4eadbd2e7c1 Add gmap_setup_bin and gmap_index_directory to defuse.xml config file generation
Jim Johnson <jj@umn.edu>
parents: 6
diff changeset
295 #end try
f4eadbd2e7c1 Add gmap_setup_bin and gmap_index_directory to defuse.xml config file generation
Jim Johnson <jj@umn.edu>
parents: 6
diff changeset
296
0
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
297 #raw
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
298 # Dataset files
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
299 dataset_prefix = $(dataset_directory)/defuse
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
300 chromosome_prefix = $(dataset_prefix).dna.chromosomes
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
301 exons_fasta = $(dataset_prefix).exons.fa
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
302 cds_fasta = $(dataset_prefix).cds.fa
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
303 cdna_regions = $(dataset_prefix).cdna.regions
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
304 cdna_fasta = $(dataset_prefix).cdna.fa
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
305 reference_fasta = $(dataset_prefix).reference.fa
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
306 rrna_fasta = $(dataset_prefix).rrna.fa
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
307 ig_gene_list = $(dataset_prefix).ig.gene.list
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
308 repeats_regions = $(dataset_directory)/repeats.regions
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
309 est_split_fasta1 = $(dataset_directory)/est.1.fa
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
310 est_split_fasta2 = $(dataset_directory)/est.2.fa
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
311 est_split_fasta3 = $(dataset_directory)/est.3.fa
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
312 est_split_fasta4 = $(dataset_directory)/est.4.fa
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
313 est_split_fasta5 = $(dataset_directory)/est.5.fa
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
314 est_split_fasta6 = $(dataset_directory)/est.6.fa
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
315 est_split_fasta7 = $(dataset_directory)/est.7.fa
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
316 est_split_fasta8 = $(dataset_directory)/est.8.fa
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
317 est_split_fasta9 = $(dataset_directory)/est.9.fa
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
318
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
319 # Fasta files with bowtie indices for prefiltering reads for concordantly mapping pairs
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
320 prefilter1 = $(unigene_fasta)
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
321
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
322 # deFuse scripts and tools
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
323 scripts_directory = $(source_directory)/scripts
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
324 tools_directory = $(source_directory)/tools
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
325 data_directory = $(source_directory)/data
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
326 #end raw
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
327
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
328 # Path to samtools, 0.1.8 is compiled for you, use other versions at your own risk
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
329 samtools_bin = #slurp
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
330 #try
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
331 $ref_dict['samtools_bin']
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
332 #except
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
333 \$(source_directory)/external/samtools-0.1.8/samtools
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
334 #end try
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
335
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
336 # Bowtie parameters
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
337 bowtie_threads = #slurp
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
338 #try
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
339 $ref_dict['bowtie_threads']
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
340 #except
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
341 4
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
342 #end try
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
343 bowtie_quals = #slurp
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
344 #try
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
345 $ref_dict['bowtie_quals']
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
346 #except
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
347 --phred33-quals
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
348 #end try
45
aedaa66483f1 Uploaded
jjohnson
parents: 44
diff changeset
349 bowtie_params = #slurp
aedaa66483f1 Uploaded
jjohnson
parents: 44
diff changeset
350 #try
aedaa66483f1 Uploaded
jjohnson
parents: 44
diff changeset
351 $ref_dict['bowtie_params']
aedaa66483f1 Uploaded
jjohnson
parents: 44
diff changeset
352 #except
aedaa66483f1 Uploaded
jjohnson
parents: 44
diff changeset
353 --chunkmbs 200
aedaa66483f1 Uploaded
jjohnson
parents: 44
diff changeset
354 #end try
0
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
355 max_insert_size = #slurp
19
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
356 #if $defuse_param.settings == "full" and $defuse_param.max_insert_size.__str__ != "":
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
357 $defuse_param.max_insert_size
0
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
358 #else
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
359 #try
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
360 $ref_dict['max_insert_size']
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
361 #except
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
362 500
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
363 #end try
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
364 #end if
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
365
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
366 # Parameters for building the dataset
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
367 chromosomes = #slurp
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
368 #try
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
369 $ref_dict.chromosomes
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
370 #except
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
371 1,2,3,4,5,6,7,8,9,10,11,12,13,14,15,16,17,18,19,20,21,22,X,Y,MT
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
372 #end try
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
373 mt_chromosome = #slurp
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
374 #try
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
375 $ref_dict['mt_chromosome']
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
376 #except
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
377 MT
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
378 #end try
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
379 gene_sources = #slurp
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
380 #try
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
381 $ref_dict['gene_sources']
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
382 #except
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
383 IG_C_gene,IG_D_gene,IG_J_gene,IG_V_gene,processed_transcript,protein_coding
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
384 #end try
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
385 ig_gene_sources = #slurp
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
386 #try
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
387 $ref_dict['ig_gene_sources']
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
388 #except
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
389 IG_C_gene,IG_D_gene,IG_J_gene,IG_V_gene,IG_pseudogene
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
390 #end try
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
391 rrna_gene_sources = #slurp
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
392 #try
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
393 $ref_dict['rrna_gene_sources']
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
394 #except
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
395 Mt_rRNA,rRNA,rRNA_pseudogene
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
396 #end try
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
397
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
398 # Blat sequences per job
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
399 num_blat_sequences = #slurp
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
400 #try
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
401 $ref_dict['num_blat_sequences']
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
402 #except
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
403 10000
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
404 #end try
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
405
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
406 # Minimum gene fusion range
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
407 dna_concordant_length = #slurp
19
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
408 #if $defuse_param.settings == "full" and $defuse_param.dna_concordant_length.__str__ != "":
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
409 $defuse_param.dna_concordant_length
0
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
410 #else
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
411 #try
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
412 $ref_dict['dna_concordant_length']
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
413 #except
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
414 2000
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
415 #end try
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
416 #end if
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
417
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
418 # Trim length for discordant reads (split reads are not trimmed)
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
419 discord_read_trim = #slurp
19
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
420 #if $defuse_param.settings == "full" and $defuse_param.discord_read_trim.__str__ != "":
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
421 $defuse_param.discord_read_trim
0
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
422 #else
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
423 #try
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
424 $ref_dict['discord_read_trim']
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
425 #except
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
426 50
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
427 #end try
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
428 #end if
19
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
429 # Calculate extra annotations, fusion splice index and interrupted index
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
430 calculate_extra_annotations = #slurp
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
431 #if $defuse_param.settings == "full" and $defuse_param.calculate_extra_annotations.__str__ != "":
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
432 $defuse_param.calculate_extra_annotations
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
433 #else
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
434 #try
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
435 $ref_dict['calculate_extra_annotations']
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
436 #except
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
437 no
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
438 #end try
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
439 #end if
0
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
440 # Filtering parameters
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
441 clustering_precision = #slurp
19
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
442 #if $defuse_param.settings == "full" and $defuse_param.clustering_precision.__str__ != ""
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
443 $defuse_param.clustering_precision
0
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
444 #else
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
445 #try
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
446 $ref_dict['clustering_precision']
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
447 #except
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
448 0.95
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
449 #end try
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
450 #end if
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
451 span_count_threshold = #slurp
19
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
452 #if $defuse_param.settings == "full" and $defuse_param.span_count_threshold.__str__ != ""
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
453 $defuse_param.span_count_threshold
0
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
454 #else
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
455 #try
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
456 $ref_dict['span_count_threshold']
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
457 #except
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
458 5
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
459 #end try
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
460 #end if
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
461 percent_identity_threshold = #slurp
19
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
462 #if $defuse_param.settings == "full" and $defuse_param.percent_identity_threshold.__str__ != ""
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
463 $defuse_param.percent_identity_threshold
0
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
464 #else
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
465 #try
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
466 $ref_dict['percent_identity_threshold']
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
467 #except
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
468 0.90
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
469 #end try
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
470 #end if
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
471 split_min_anchor = #slurp
19
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
472 #if $defuse_param.settings == "full" and $defuse_param.split_min_anchor.__str__ != ""
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
473 $defuse_param.split_min_anchor
0
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
474 #else
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
475 #try
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
476 $ref_dict['split_min_anchor']
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
477 #except
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
478 4
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
479 #end try
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
480 #end if
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
481 splice_bias = #slurp
19
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
482 #if $defuse_param.settings == "full" and $defuse_param.splice_bias.__str__ != ""
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
483 $defuse_param.splice_bias
0
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
484 #else
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
485 #try
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
486 $ref_dict['splice_bias']
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
487 #except
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
488 10
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
489 #end try
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
490 #end if
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
491 denovo_assembly = #slurp
19
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
492 #if $defuse_param.settings == "full" and $defuse_param.denovo_assembly.__str__ != ""
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
493 $defuse_param.denovo_assembly
0
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
494 #else
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
495 #try
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
496 $ref_dict['denovo_assembly']
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
497 #except
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
498 no
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
499 #end try
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
500 #end if
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
501 probability_threshold = #slurp
19
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
502 #if $defuse_param.settings == "full" and $defuse_param.probability_threshold.__str__ != ""
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
503 $defuse_param.probability_threshold
0
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
504 #else
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
505 #try
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
506 $ref_dict['probability_threshold']
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
507 #except
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
508 0.50
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
509 #end try
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
510 #end if
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
511 positive_controls = \$(data_directory)/controls.txt
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
512
45
aedaa66483f1 Uploaded
jjohnson
parents: 44
diff changeset
513 # Use multiple exon transcripts for stats calculations (yes/no)
aedaa66483f1 Uploaded
jjohnson
parents: 44
diff changeset
514 # should be enabled for very small libraries
aedaa66483f1 Uploaded
jjohnson
parents: 44
diff changeset
515 multi_exon_transcripts_stats = #slurp
aedaa66483f1 Uploaded
jjohnson
parents: 44
diff changeset
516 #if $defuse_param.settings == "full" and $defuse_param.multi_exon_transcripts_stats.__str__ != ""
aedaa66483f1 Uploaded
jjohnson
parents: 44
diff changeset
517 $defuse_param.multi_exon_transcripts_stats
aedaa66483f1 Uploaded
jjohnson
parents: 44
diff changeset
518 #else
aedaa66483f1 Uploaded
jjohnson
parents: 44
diff changeset
519 #try
aedaa66483f1 Uploaded
jjohnson
parents: 44
diff changeset
520 $ref_dict['multi_exon_transcripts_stats']
aedaa66483f1 Uploaded
jjohnson
parents: 44
diff changeset
521 #except
aedaa66483f1 Uploaded
jjohnson
parents: 44
diff changeset
522 no
aedaa66483f1 Uploaded
jjohnson
parents: 44
diff changeset
523 #end try
aedaa66483f1 Uploaded
jjohnson
parents: 44
diff changeset
524 #end if
aedaa66483f1 Uploaded
jjohnson
parents: 44
diff changeset
525
0
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
526 # Position density when calculating covariance
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
527 covariance_sampling_density = #slurp
19
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
528 #if $defuse_param.settings == "full" and $defuse_param.covariance_sampling_density.__str__ != ""
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
529 $defuse_param.covariance_sampling_density
0
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
530 #else
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
531 #try
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
532 $ref_dict['covariance_sampling_density']
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
533 #except
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
534 0.01
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
535 #end try
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
536 #end if
45
aedaa66483f1 Uploaded
jjohnson
parents: 44
diff changeset
537
aedaa66483f1 Uploaded
jjohnson
parents: 44
diff changeset
538 # Maximum number of alignments for a read pair
aedaa66483f1 Uploaded
jjohnson
parents: 44
diff changeset
539 # Pairs with more alignments are filtered
aedaa66483f1 Uploaded
jjohnson
parents: 44
diff changeset
540 max_paired_alignments = #slurp
aedaa66483f1 Uploaded
jjohnson
parents: 44
diff changeset
541 #if $defuse_param.settings == "full" and $defuse_param.max_paired_alignments.__str__ != ""
aedaa66483f1 Uploaded
jjohnson
parents: 44
diff changeset
542 $defuse_param.max_paired_alignments
aedaa66483f1 Uploaded
jjohnson
parents: 44
diff changeset
543 #else
aedaa66483f1 Uploaded
jjohnson
parents: 44
diff changeset
544 #try
aedaa66483f1 Uploaded
jjohnson
parents: 44
diff changeset
545 $ref_dict['max_paired_alignments']
aedaa66483f1 Uploaded
jjohnson
parents: 44
diff changeset
546 #except
aedaa66483f1 Uploaded
jjohnson
parents: 44
diff changeset
547 10
aedaa66483f1 Uploaded
jjohnson
parents: 44
diff changeset
548 #end try
aedaa66483f1 Uploaded
jjohnson
parents: 44
diff changeset
549 #end if
aedaa66483f1 Uploaded
jjohnson
parents: 44
diff changeset
550
0
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
551 # Number of reads for each job in split
19
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
552 reads_per_job = #slurp
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
553 #if $defuse_param.settings == "full" and $defuse_param.reads_per_job.__str__ != ""
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
554 $defuse_param.reads_per_job
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
555 #else
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
556 #try
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
557 $ref_dict['reads_per_job']
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
558 #except
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
559 1000000
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
560 #end try
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
561 #end if
0
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
562
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
563 #raw
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
564 # If you have command line 'mail' and wish to be notified
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
565 # mailto = andrew.mcpherson@gmail.com
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
566
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
567 # Remove temp files
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
568 remove_job_files = yes
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
569 remove_job_temp_files = yes
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
570
45
aedaa66483f1 Uploaded
jjohnson
parents: 44
diff changeset
571 qsub_params = ""
aedaa66483f1 Uploaded
jjohnson
parents: 44
diff changeset
572
0
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
573 #end raw
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
574
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
575 </configfile>
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
576 </configfiles>
5
87033f379b99 Edit labels and help.
Jim Johnson <jj@umn.edu>
parents: 4
diff changeset
577
0
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
578 <tests>
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
579 </tests>
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
580 <help>
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
581 **DeFuse**
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
582
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
583 DeFuse_ is a software package for gene fusion discovery using RNA-Seq data. The software uses clusters of discordant paired end alignments to inform a split read alignment analysis for finding fusion boundaries. The software also employs a number of heuristic filters in an attempt to reduce the number of false positives and produces a fully annotated output for each predicted fusion.
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
584
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
585 Journal reference: http://www.ploscompbiol.org/article/info%3Adoi%2F10.1371%2Fjournal.pcbi.1001138
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
586
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
587 .. _DeFuse: http://sourceforge.net/apps/mediawiki/defuse/index.php?title=Main_Page
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
588
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
589 ------
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
590
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
591 **Inputs**
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
592
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
593 DeFuse requires 2 fastq files for paried reads, one with the left mate of the paired reads, and a second fastq with the the right mate of the paired reads (**with reads in the same order as in the first fastq dataset**).
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
594
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
595 If your fastq files have reads in different orders or include unpaired reads, you can preprocess them with **FASTQ interlacer** to create a single interlaced fastq dataset with only the paired reads and input that to **FASTQ de-interlacer** to separate the reads into a left fastq and right fastq.
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
596
19
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
597 DeFuse uses a Reference Dataset to search for gene fusions. The Reference Dataset is generated from the following sources in DeFuse_Version_0.4_:
0
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
598 - genome_fasta from Ensembl
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
599 - gene_models from Ensembl
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
600 - repeats_filename from UCSC RepeatMasker rmsk.txt
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
601 - est_fasta from UCSC
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
602 - est_alignments from UCSC intronEst.txt
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
603 - unigene_fasta from NCBI
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
604
19
1af6f32ff592 Add datamanager, move to defuse_reference.loc
Jim Johnson <jj@umn.edu>
parents: 18
diff changeset
605 .. _DeFuse_Version_0.4: http://sourceforge.net/apps/mediawiki/defuse/index.php?title=DeFuse_Version_0.4.2
0
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
606
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
607 ------
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
608
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
609 **Outputs**
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
610
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
611 The galaxy history will contain 5 outputs: the config.txt file that provides DeFuse with its parameters, the defuse.log which details what DeFuse has done and can be useful in determining any errors, and the 3 results files that defuse generates.
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
612
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
613 DeFuse generates 3 results files: results.txt, results.filtered.txt, and results.classify.txt. All three files have the same format, though results.classify.txt has a probability column from the application of the classifier to results.txt, and results.filtered.txt has been filtered according to the threshold probability as set in config.txt.
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
614
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
615 The file format is tab delimited with one prediction per line, and the following fields per prediction (not necessarily in this order):
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
616
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
617 - **Identification**
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
618 - cluster_id : random identifier assigned to each prediction
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
619 - library_name : library name given on the command line of defuse
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
620 - gene1 : ensembl id of gene 1
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
621 - gene2 : ensembl id of gene 2
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
622 - gene_name1 : name of gene 1
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
623 - gene_name2 : name of gene 2
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
624 - **Evidence**
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
625 - break_predict : breakpoint prediction method, denovo or splitr, that is considered most reliable
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
626 - concordant_ratio : proportion of spanning reads considered concordant by blat
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
627 - denovo_min_count : minimum kmer count across denovo assembled sequence
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
628 - denovo_sequence : fusion sequence predicted by debruijn based denovo sequence assembly
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
629 - denovo_span_pvalue : p-value, lower values are evidence the prediction is a false positive
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
630 - gene_align_strand1 : alignment strand for spanning read alignments to gene 1
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
631 - gene_align_strand2 : alignment strand for spanning read alignments to gene 2
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
632 - min_map_count : minimum of the number of genomic mappings for each spanning read
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
633 - max_map_count : maximum of the number of genomic mappings for each spanning read
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
634 - mean_map_count : average of the number of genomic mappings for each spanning read
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
635 - num_multi_map : number of spanning reads that map to more than one genomic location
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
636 - span_count : number of spanning reads supporting the fusion
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
637 - span_coverage1 : coverage of spanning reads aligned to gene 1 as a proportion of expected coverage
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
638 - span_coverage2 : coverage of spanning reads aligned to gene 2 as a proportion of expected coverage
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
639 - span_coverage_min : minimum of span_coverage1 and span_coverage2
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
640 - span_coverage_max : maximum of span_coverage1 and span_coverage2
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
641 - splitr_count : number of split reads supporting the prediction
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
642 - splitr_min_pvalue : p-value, lower values are evidence the prediction is a false positive
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
643 - splitr_pos_pvalue : p-value, lower values are evidence the prediction is a false positive
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
644 - splitr_sequence : fusion sequence predicted by split reads
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
645 - splitr_span_pvalue : p-value, lower values are evidence the prediction is a false positive
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
646 - **Annotation**
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
647 - adjacent : fusion between adjacent genes
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
648 - altsplice : fusion likely the product of alternative splicing between adjacent genes
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
649 - break_adj_entropy1 : di-nucleotide entropy of the 40 nucleotides adjacent to the fusion splice in gene 1
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
650 - break_adj_entropy2 : di-nucleotide entropy of the 40 nucleotides adjacent to the fusion splice in gene 2
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
651 - break_adj_entropy_min : minimum of break_adj_entropy1 and break_adj_entropy2
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
652 - breakpoint_homology : number of nucleotides at the fusion splice that align equally well to gene 1 or gene 2
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
653 - breakseqs_estislands_percident : maximum percent identity of fusion sequence alignments to est islands
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
654 - cdna_breakseqs_percident : maximum percent identity of fusion sequence alignments to cdna
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
655 - deletion : fusion produced by a genomic deletion
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
656 - est_breakseqs_percident : maximum percent identity of fusion sequence alignments to est
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
657 - eversion : fusion produced by a genomic eversion
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
658 - exonboundaries : fusion splice at exon boundaries
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
659 - expression1 : expression of gene 1 as number of concordant pairs aligned to exons
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
660 - expression2 : expression of gene 2 as number of concordant pairs aligned to exons
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
661 - gene_chromosome1 : chromosome of gene 1
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
662 - gene_chromosome2 : chromosome of gene 2
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
663 - gene_end1 : end position for gene 1
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
664 - gene_end2 : end position for gene 2
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
665 - gene_location1 : location of breakpoint in gene 1
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
666 - gene_location2 : location of breakpoint in gene 2
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
667 - gene_start1 : start of gene 1
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
668 - gene_start2 : start of gene 2
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
669 - gene_strand1 : strand of gene 1
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
670 - gene_strand2 : strand of gene 2
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
671 - genome_breakseqs_percident : maximum percent identity of fusion sequence alignments to genome
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
672 - genomic_break_pos1 : genomic position in gene 1 of fusion splice / breakpoint
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
673 - genomic_break_pos2 : genomic position in gene 2 of fusion splice / breakpoint
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
674 - genomic_strand1 : genomic strand in gene 1 of fusion splice / breakpoint, retained sequence upstream on this strand, breakpoint is downstream
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
675 - genomic_strand2 : genomic strand in gene 2 of fusion splice / breakpoint, retained sequence upstream on this strand, breakpoint is downstream
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
676 - interchromosomal : fusion produced by an interchromosomal translocation
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
677 - interrupted_index1 : ratio of coverage before and after the fusion splice / breakpoint in gene 1
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
678 - interrupted_index2 : ratio of coverage before and after the fusion splice / breakpoint in gene 2
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
679 - inversion : fusion produced by genomic inversion
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
680 - orf : fusion combines genes in a way that preserves a reading frame
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
681 - probability : probability produced by classification using adaboost and example positives/negatives (only given in results.classified.txt)
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
682 - read_through : fusion involving adjacent potentially resulting from co-transcription rather than genome rearrangement
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
683 - repeat_proportion1 : proportion of the spanning reads in gene 1 that span a repeat region
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
684 - repeat_proportion2 : proportion of the spanning reads in gene 2 that span a repeat region
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
685 - max_repeat_proportion : max of repeat_proportion1 and repeat_proportion2
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
686 - splice_score : number of nucleotides similar to GTAG at fusion splice
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
687 - num_splice_variants : number of potential splice variants for this gene pair
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
688 - splicing_index1 : number of concordant pairs in gene 1 spanning the fusion splice / breakpoint, divided by number of spanning reads supporting the fusion with gene 2
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
689 - splicing_index2 : number of concordant pairs in gene 2 spanning the fusion splice / breakpoint, divided by number of spanning reads supporting the fusion with gene 1
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
690
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
691
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
692 **Example**
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
693
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
694 results.tsv::
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
695
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
696 cluster_id splitr_sequence splitr_count splitr_span_pvalue splitr_pos_pvalue splitr_min_pvalue adjacent altsplice break_adj_entropy1 break_adj_entropy2 break_adj_entropy_min break_predict breakpoint_homology breakseqs_estislands_percident cdna_breakseqs_percident concordant_ratio deletion est_breakseqs_percident eversion exonboundaries expression1 expression2 gene1 gene2 gene_align_strand1 gene_align_strand2 gene_chromosome1 gene_chromosome2 gene_end1 gene_end2 gene_location1 gene_location2 gene_name1 gene_name2 gene_start1 gene_start2 gene_strand1 gene_strand2 genome_breakseqs_percident genomic_break_pos1 genomic_break_pos2 genomic_strand1 genomic_strand2 interchromosomal interrupted_index1 interrupted_index2 inversion library_name max_map_count max_repeat_proportion mean_map_count min_map_count num_multi_map num_splice_variants orf read_through repeat_proportion1 repeat_proportion2 span_count span_coverage1 span_coverage2 span_coverage_max span_coverage_min splice_score splicing_index1 splicing_index2
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
697 1169 GCTTACTGTATGCCAGGCCCCAGAGGGGCAACCACCCTCTAAAGAGAGCGGCTCCTGCCTCCCAGAAAGCTCACAGACTGTGGGAGGGAAACAGGCAGCAGGTGAAGATGCCAAATGCCAGGATATCTGCCCTGTCCTTGCTTGATGCAGCTGCTGGCTCCCACGTTCTCCCCAGAATCCCCTCACACTCCTGCTGTTTTCTCTGCAGGTTGGCAGAGCCCCATGAGGGCAGGGCAGCCACTTTGTTCTTGGGCGGCAAACCTCCCTGGGCGGCACGGAAACCACGGTGAGAAGGGGGCAGGTCGGGCACGTGCAGGGACCACGCTGCAGG|TGTACCCAACAGCTCCGAAGAGACAGCGACCATCGAGAACGGGCCATGATGACGATGGCGGTTTTGTCGAAAAGAAAAGGGGGAAATGTGGGGAAAAGCAAGAGAGATCAGATTGTTACTGTGTCTGTGTAGAAAGAAGTAGACATGGGAGACTCCATTTTGTTCTGTACTAAGAAAAATTCTTCTGCCTTGAGATTCGGTGACCCCACCCCCAACCCCGTGCTCTCTGAAACATGTGCTGTGTCCACTCAGGGTTGAATGGATTAAGGGCGGTGCGAGACGTGCTTT 2 0.000436307890680442 0.110748295953850 0.0880671602973091 N Y 3.19872427442695 3.48337348351473 3.19872427442695 splitr 0 0 0 0 Y 0 N N 0 0 ENSG00000105549 ENSG00000213753 + - 19 19 376013 59111168 intron upstream THEG AC016629.2 361750 59084870 - + 0 375099 386594 + - N 8.34107429512245 - N output_dir 82 0.677852348993289 40.6666666666667 1 11 1 N N 0.361271676300578 0.677852348993289 12 0.758602776578432 0.569678713445872 0.758602776578432 0.569678713445872 2 0.416666666666667 -
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
698 3596 TGGGGGTTGAGGCTTCTGTTCCCAGGTTCCATGACCTCAGAGGTGGCTGGTGAGGTTATGACCTTTGCCCTCCAGCCCTGGCTTAAAACCTCAGCCCTAGGACCTGGTTAAAGGAAGGGGAGATGGAGCTTTGCCCCGACCCCCCCCCGTTCCCCTCACCTGTCAGCCCGAGCTGGGCCAGGGCCCCTAGGTGGGGAACTGGGCCGGGGGGCGGGCACAAGCGGAGGTGGTGCCCCCAAAAGGGCTCCCGGTGGGGTCTTGCTGAGAAGGTGAGGGGTTCCCGGGGCCGCAGCAGGTGGTGGTGGAGGAGCCAAGCGGCTGTAGAGCAAGGGGTGAGCAGGTTCCAGACCGTAGAGGCGGGCAGCGGCCACGGCCCCGGGTCCAGTTAGCTCCTCACCCGCCTCATAGAAGCGGGGTGGCCTTGCCAGGCGTGGGGGTGCTGCC|TTCCTTGGATGTGGTAGCCGTTTCTCAGGCTCCCTCTCCGGAATCGAACCCTGATTCCCCGTCACCCGTGGTCACCATGGTAGGCACGGCGACTACCATCGAAAGTTGATAGGGCAGACGTTCGAATGGGTCGTCGCCGCCACGGGGGGCGTGCGATCAGCCCGAGGTTATCTAGAGTCACCAAAGCCGCCGGCGCCCGCCCCCCGGCCGGGGCCGGAGAGGGGCTGACCGGGTTGGTTTTGATCTGATAAATGCACGCATCCCCCCCGCGAAGGGGGTCAGCGCCCGTCGGCATGTATTAGCTCTAGAATTACCACAGTTATCCAAGTAGGAGAGGAGCGAGCGACCAAAGGAACCATAACTGATTTAATGAGCCATTCGCAGTTTCACTGTACCGGCCGTGCGTACTTAGACATGCATGGCTTAATCTTTGAGACAAGCATATGCTACTGGCAGG 250 7.00711162298275e-72 0.00912124762512338 0.00684237452309549 N N 3.31745197152461 3.47233119514066 3.31745197152461 splitr 7 0.0157657657657656 0 0 N 0.0135135135135136 N N 0 0 ENSG00000156860 ENSG00000212932 - + 16 21 30682131 48111157 coding upstream FBRS RPL23AP4 30670289 48110676 + + 0.0157657657657656 30680678 9827473 - + Y - - N output_dir 2 1 1.11111111111111 1 1 1 N N 0 1 9 0.325530693397641 0.296465452915709 0.325530693397641 0.296465452915709 2 - -
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
699
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
700 </help>
44
225750bf3770 Uploaded
jjohnson
parents: 35
diff changeset
701 <expand macro="citations"/>
0
b75ea9927793 Uploaded
jjohnson
parents:
diff changeset
702 </tool>