diff transit_hmm.xml @ 7:1cb8d9b0b9b7 draft

"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/transit/ commit f63413d629e4de3c69984b3a96ad8ccfe0d47ada"
author iuc
date Tue, 08 Oct 2019 08:22:31 -0400
parents 029555804ec2
children 1a615b00dbd0
line wrap: on
line diff
--- a/transit_hmm.xml	Tue Jun 25 17:43:34 2019 -0400
+++ b/transit_hmm.xml	Tue Oct 08 08:22:31 2019 -0400
@@ -27,10 +27,10 @@
     <tests>
         <test>
             <param name="inputs" ftype="wig" value="transit-in1-rep1.wig,transit-in1-rep2.wig" />
-            <param name="annotation" ftype="gff3" value="transit-in1.gff3" />
+            <param name="annotation" ftype="tabular" value="transit-in1.prot" />
             <param name="replicates" value="Replicates" />
-            <output name="sites" file="hmm-sites1.txt" ftype="tabular" lines_diff="2" />
-            <output name="genes" file="hmm-genes1.txt" ftype="tabular" />
+            <output name="sites" file="hmm-sites1.txt" ftype="tabular" compare="sim_size" />
+            <output name="genes" file="hmm-genes1.txt" ftype="tabular" compare="sim_size" />
         </test>
     </tests>
     <help>
@@ -60,15 +60,25 @@
 
 -------------------
 
-| python transit.py hmm <comma-separated .wig files> <annotation .prot_table or GFF3> <output file>
-| Optional Arguments:
+
+Optional Arguments:
 |    -r <string>     :=  How to handle replicates. Sum, Mean. Default: -r Mean
 |    -l              :=  Perform LOESS Correction; Helps remove possible genomic position bias. Default: Off.
 |    -iN <float>     :=  Ignore TAs occuring at given fraction of the N terminus. Default: -iN 0.0
 |    -iC <float>     :=  Ignore TAs occuring at given fraction of the C terminus. Default: -iC 0.0
+|    -n <string>      := Determines which normalization method to use. Default -n TTR
 
 The HMM method automatically estimates the necessary statistical parameters from the datasets. You can change how the method handles replicate datasets:
 -   Replicates: Determines how the HMM deals with replicate datasets by either averaging the read-counts or summing read counts across datasets. For regular datasets (i.e. mean-read count > 100) the recommended setting is to average read-counts together. For sparse datasets, it summing read-counts may produce more accurate results.
+-   Normalization Method: Determines which normalization method to use when comparing datasets. Proper normalization is important as it ensures that other sources of variability are not mistakenly treated as real differences. See the Normalization section for a description of normalization method available in TRANSIT.
+-    - TTR (Default) : Trimmed Total Reads (TTR), normalized by the total read-counts (like totreads), but trims top and bottom 5% of read-counts. This is the recommended normalization method for most cases as it has the beneffit of normalizing for difference in saturation in the context of resampling.
+-    - nzmean : Normalizes datasets to have the same mean over the non-zero sites.
+-    - totreads : Normalizes datasets by total read-counts, and scales them to have the same mean over all counts.
+-    - zinfnb : Fits a zero-inflated negative binomial model, and then divides read-counts by the mean. The zero-inflated negative binomial model will treat some empty sites as belonging to the “true” negative binomial distribution responsible for read-counts while treating the others as “essential” (and thus not influencing its parameters).
+-    - quantile : Normalizes datasets using the quantile normalization method described by Bolstad et al. (2003). In this normalization procedure, datasets are sorted, an empirical distribution is estimated as the mean across the sorted datasets at each site, and then the original (unsorted) datasets are assigned values from the empirical distribution based on their quantiles.
+-    - betageom : Normalizes the datasets to fit an “ideal” Geometric distribution with a variable probability parameter p. Specially useful for datasets that contain a large skew. See Beta-Geometric Correction .
+-    - nonorm : No normalization is performed.
+
 
 -----------