annotate datamash-ops.xml @ 9:4b7dd5ff6497 draft

planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 384736acb5d2ae31d796c53031fad0e5da5424e3
author iuc
date Fri, 01 Jul 2022 16:15:57 +0000
parents f11dedb74b83
children 67d9cf45e802
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
8
f11dedb74b83 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 206ac70388ea11b168366f1e30bb44157e371c6e"
iuc
parents: 7
diff changeset
1 <tool id="datamash_ops" name="Datamash" version="@TOOL_VERSION@+galaxy@VERSION_SUFFIX@" profile="@PROFILE@">
0
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
2 <description>(operations on tabular data)</description>
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
3 <macros>
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
4 <import>macros.xml</import>
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
5 </macros>
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
6 <expand macro="requirements" />
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
7 <expand macro="stdio" />
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
8 <command>
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
9 <![CDATA[
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
10 datamash
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
11 $header_in
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
12 $header_out
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
13 $need_sort
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
14 $print_full_line
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
15 $ignore_case
9
4b7dd5ff6497 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 384736acb5d2ae31d796c53031fad0e5da5424e3
iuc
parents: 8
diff changeset
16 $narm
8
f11dedb74b83 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 206ac70388ea11b168366f1e30bb44157e371c6e"
iuc
parents: 7
diff changeset
17 @FIELD_SEPARATOR@
f11dedb74b83 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 206ac70388ea11b168366f1e30bb44157e371c6e"
iuc
parents: 7
diff changeset
18 #if str($grouping) != ''
f11dedb74b83 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 206ac70388ea11b168366f1e30bb44157e371c6e"
iuc
parents: 7
diff changeset
19 --group '$grouping'
0
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
20 #end if
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
21 #for $oper in $operations
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
22 ${oper.op_name}
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
23 ${oper.op_column}
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
24 #end for
6
9bd21de9455b planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit fd00f13c26d6d6e108a558ad8ef234eb86967b4b
iuc
parents: 5
diff changeset
25 < $in_file > '$out_file'
0
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
26 ]]>
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
27 </command>
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
28 <expand macro="inputs_outputs">
8
f11dedb74b83 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 206ac70388ea11b168366f1e30bb44157e371c6e"
iuc
parents: 7
diff changeset
29 <param argument="--group" name="grouping" type="text" label="Group by fields" help="Group consecutive rows with equal values in the chosen fields. If no columns are specified, each operation is performed on the entire input file. Comma separated list of column indices, e.g. 1,5">
f11dedb74b83 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 206ac70388ea11b168366f1e30bb44157e371c6e"
iuc
parents: 7
diff changeset
30 <sanitizer invalid_char="">
f11dedb74b83 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 206ac70388ea11b168366f1e30bb44157e371c6e"
iuc
parents: 7
diff changeset
31 <valid initial="string.digits">
f11dedb74b83 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 206ac70388ea11b168366f1e30bb44157e371c6e"
iuc
parents: 7
diff changeset
32 <add value="," />
f11dedb74b83 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 206ac70388ea11b168366f1e30bb44157e371c6e"
iuc
parents: 7
diff changeset
33 </valid>
f11dedb74b83 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 206ac70388ea11b168366f1e30bb44157e371c6e"
iuc
parents: 7
diff changeset
34 <mapping initial="none">
f11dedb74b83 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 206ac70388ea11b168366f1e30bb44157e371c6e"
iuc
parents: 7
diff changeset
35 <add source=" " target=""/>
f11dedb74b83 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 206ac70388ea11b168366f1e30bb44157e371c6e"
iuc
parents: 7
diff changeset
36 </mapping>
f11dedb74b83 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 206ac70388ea11b168366f1e30bb44157e371c6e"
iuc
parents: 7
diff changeset
37 </sanitizer>
f11dedb74b83 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 206ac70388ea11b168366f1e30bb44157e371c6e"
iuc
parents: 7
diff changeset
38 <validator message="Invalid value in field. Allowed is a comma separated list of integer values or the empty string" type="regex">(^$)|(^\s*\d+\s*(,\s*\d+\s*)*$)</validator>
0
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
39 </param>
8
f11dedb74b83 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 206ac70388ea11b168366f1e30bb44157e371c6e"
iuc
parents: 7
diff changeset
40 <param argument="--sort" name="need_sort" type="boolean" truevalue="--sort" falsevalue="" label="Sort input" help="Input file must be sorted by the grouping columns. Enable this option to automatically sort the input."/>
f11dedb74b83 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 206ac70388ea11b168366f1e30bb44157e371c6e"
iuc
parents: 7
diff changeset
41 <param argument="--header-in" type="boolean" truevalue="--header-in" falsevalue="" label="Input file has a header line" />
f11dedb74b83 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 206ac70388ea11b168366f1e30bb44157e371c6e"
iuc
parents: 7
diff changeset
42 <param argument="--header-out" type="boolean" truevalue="--header-out" falsevalue="" label="Print header line" />
f11dedb74b83 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 206ac70388ea11b168366f1e30bb44157e371c6e"
iuc
parents: 7
diff changeset
43 <param argument="--full" name="print_full_line" type="boolean" truevalue="--full" falsevalue="" label="Print all fields from input file" />
f11dedb74b83 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 206ac70388ea11b168366f1e30bb44157e371c6e"
iuc
parents: 7
diff changeset
44 <param argument="--ignore-case" type="boolean" truevalue="--ignore-case" falsevalue="" label="Ignore case when grouping" />
9
4b7dd5ff6497 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 384736acb5d2ae31d796c53031fad0e5da5424e3
iuc
parents: 8
diff changeset
45 <param argument="--narm" type="boolean" truevalue="--narm" falsevalue="" label="Skip NA or NaN values" />
8
f11dedb74b83 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 206ac70388ea11b168366f1e30bb44157e371c6e"
iuc
parents: 7
diff changeset
46 <repeat name="operations" default="1" min="1" title="Operation to perform on each group">
4
7ae1fa51bacf planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 5a6df0b54ca66fb588886b4610bbd837cd624fed
iuc
parents: 0
diff changeset
47 <param name="op_name" type="select" label="Type">
0
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
48 <option value="count">count</option>
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
49 <option value="sum">sum</option>
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
50 <option value="min">minimum</option>
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
51 <option value="max">maximum</option>
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
52 <option value="absmin">Absolute minimum</option>
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
53 <option value="absmax">Absolute maximum</option>
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
54 <option value="mean">Mean</option>
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
55 <option value="pstdev">Population Standard deviation</option>
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
56 <option value="sstdev">Sample Standard deviation</option>
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
57 <option value="median">Median</option>
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
58 <option value="q1">1st quartile</option>
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
59 <option value="q3">3rd quartile</option>
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
60 <option value="iqr">Inter-quartile range</option>
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
61 <option value="mad">Median Absolute Deviation</option>
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
62 <option value="pvar">Variance (population)</option>
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
63 <option value="svar">Variance (sample)</option>
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
64 <option value="sskew">Skewness (sample)</option>
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
65 <option value="pskew">Skewness (population)</option>
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
66 <option value="skurt">Kurtosis (sample)</option>
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
67 <option value="pkurt">Kurtosis (population)</option>
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
68 <option value="jarque">Jarque-Bera Normality test</option>
6
9bd21de9455b planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit fd00f13c26d6d6e108a558ad8ef234eb86967b4b
iuc
parents: 5
diff changeset
69 <option value="dpo">D'Agostino-Pearson Omnibus Normality Test</option>
0
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
70 <option value="mode">Mode</option>
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
71 <option value="antimode">Anti-Mode</option>
6
9bd21de9455b planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit fd00f13c26d6d6e108a558ad8ef234eb86967b4b
iuc
parents: 5
diff changeset
72 <option value="rand">One random value from the group</option>
0
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
73 <option value="unique">Combine all unique values</option>
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
74 <option value="collapse">Combine all values</option>
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
75 <option value="countunique">Count Unique values</option>
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
76 </param>
4
7ae1fa51bacf planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 5a6df0b54ca66fb588886b4610bbd837cd624fed
iuc
parents: 0
diff changeset
77 <param name="op_column" data_ref="in_file" label="On column" type="data_column" />
0
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
78 </repeat>
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
79 </expand>
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
80 <tests>
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
81 <test>
4
7ae1fa51bacf planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 5a6df0b54ca66fb588886b4610bbd837cd624fed
iuc
parents: 0
diff changeset
82 <param name="in_file" value="group_compute_input.txt" ftype="tabular" />
0
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
83 <param name="grouping" value="2" />
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
84 <param name="header_in" value="true" />
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
85 <param name="header_out" value="true" />
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
86 <param name="need_sort" value="true" />
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
87 <param name="print_full_line" value="false" />
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
88 <param name="ignore_case" value="false" />
4
7ae1fa51bacf planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 5a6df0b54ca66fb588886b4610bbd837cd624fed
iuc
parents: 0
diff changeset
89 <repeat name="operations">
7ae1fa51bacf planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 5a6df0b54ca66fb588886b4610bbd837cd624fed
iuc
parents: 0
diff changeset
90 <param name="op_name" value="sum" />
7ae1fa51bacf planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 5a6df0b54ca66fb588886b4610bbd837cd624fed
iuc
parents: 0
diff changeset
91 <param name="op_column" value="3" />
7ae1fa51bacf planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 5a6df0b54ca66fb588886b4610bbd837cd624fed
iuc
parents: 0
diff changeset
92 </repeat>
5
90ff417a72fc planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 7409e73927c65e293ad19d54bb2572b4a289929d
iuc
parents: 4
diff changeset
93 <output file="group_compute_output.txt" name="out_file" ftype="tabular" />
0
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
94 </test>
8
f11dedb74b83 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 206ac70388ea11b168366f1e30bb44157e371c6e"
iuc
parents: 7
diff changeset
95 <test>
f11dedb74b83 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 206ac70388ea11b168366f1e30bb44157e371c6e"
iuc
parents: 7
diff changeset
96 <param name="in_file" value="group_compute_input.txt" ftype="tsv" />
f11dedb74b83 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 206ac70388ea11b168366f1e30bb44157e371c6e"
iuc
parents: 7
diff changeset
97 <param name="grouping" value="2" />
f11dedb74b83 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 206ac70388ea11b168366f1e30bb44157e371c6e"
iuc
parents: 7
diff changeset
98 <param name="header_in" value="true" />
f11dedb74b83 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 206ac70388ea11b168366f1e30bb44157e371c6e"
iuc
parents: 7
diff changeset
99 <param name="header_out" value="true" />
f11dedb74b83 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 206ac70388ea11b168366f1e30bb44157e371c6e"
iuc
parents: 7
diff changeset
100 <param name="need_sort" value="true" />
f11dedb74b83 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 206ac70388ea11b168366f1e30bb44157e371c6e"
iuc
parents: 7
diff changeset
101 <param name="print_full_line" value="false" />
f11dedb74b83 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 206ac70388ea11b168366f1e30bb44157e371c6e"
iuc
parents: 7
diff changeset
102 <param name="ignore_case" value="false" />
f11dedb74b83 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 206ac70388ea11b168366f1e30bb44157e371c6e"
iuc
parents: 7
diff changeset
103 <repeat name="operations">
f11dedb74b83 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 206ac70388ea11b168366f1e30bb44157e371c6e"
iuc
parents: 7
diff changeset
104 <param name="op_name" value="sum" />
f11dedb74b83 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 206ac70388ea11b168366f1e30bb44157e371c6e"
iuc
parents: 7
diff changeset
105 <param name="op_column" value="3" />
f11dedb74b83 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 206ac70388ea11b168366f1e30bb44157e371c6e"
iuc
parents: 7
diff changeset
106 </repeat>
f11dedb74b83 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 206ac70388ea11b168366f1e30bb44157e371c6e"
iuc
parents: 7
diff changeset
107 <output file="group_compute_output.txt" name="out_file" ftype="tsv" />
f11dedb74b83 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 206ac70388ea11b168366f1e30bb44157e371c6e"
iuc
parents: 7
diff changeset
108 </test>
f11dedb74b83 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 206ac70388ea11b168366f1e30bb44157e371c6e"
iuc
parents: 7
diff changeset
109 <test>
f11dedb74b83 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 206ac70388ea11b168366f1e30bb44157e371c6e"
iuc
parents: 7
diff changeset
110 <param name="in_file" value="group_compute_input.csv" ftype="csv" />
f11dedb74b83 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 206ac70388ea11b168366f1e30bb44157e371c6e"
iuc
parents: 7
diff changeset
111 <param name="grouping" value="2" />
f11dedb74b83 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 206ac70388ea11b168366f1e30bb44157e371c6e"
iuc
parents: 7
diff changeset
112 <param name="header_in" value="true" />
f11dedb74b83 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 206ac70388ea11b168366f1e30bb44157e371c6e"
iuc
parents: 7
diff changeset
113 <param name="header_out" value="true" />
f11dedb74b83 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 206ac70388ea11b168366f1e30bb44157e371c6e"
iuc
parents: 7
diff changeset
114 <param name="need_sort" value="true" />
f11dedb74b83 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 206ac70388ea11b168366f1e30bb44157e371c6e"
iuc
parents: 7
diff changeset
115 <param name="print_full_line" value="false" />
f11dedb74b83 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 206ac70388ea11b168366f1e30bb44157e371c6e"
iuc
parents: 7
diff changeset
116 <param name="ignore_case" value="false" />
f11dedb74b83 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 206ac70388ea11b168366f1e30bb44157e371c6e"
iuc
parents: 7
diff changeset
117 <repeat name="operations">
f11dedb74b83 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 206ac70388ea11b168366f1e30bb44157e371c6e"
iuc
parents: 7
diff changeset
118 <param name="op_name" value="sum" />
f11dedb74b83 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 206ac70388ea11b168366f1e30bb44157e371c6e"
iuc
parents: 7
diff changeset
119 <param name="op_column" value="3" />
f11dedb74b83 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 206ac70388ea11b168366f1e30bb44157e371c6e"
iuc
parents: 7
diff changeset
120 </repeat>
f11dedb74b83 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 206ac70388ea11b168366f1e30bb44157e371c6e"
iuc
parents: 7
diff changeset
121 <output name="out_file" ftype="csv">
f11dedb74b83 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 206ac70388ea11b168366f1e30bb44157e371c6e"
iuc
parents: 7
diff changeset
122 <assert_contents>
f11dedb74b83 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 206ac70388ea11b168366f1e30bb44157e371c6e"
iuc
parents: 7
diff changeset
123 <has_n_lines n="7"/>
f11dedb74b83 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 206ac70388ea11b168366f1e30bb44157e371c6e"
iuc
parents: 7
diff changeset
124 <has_line line="Arts,1310"/>
f11dedb74b83 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 206ac70388ea11b168366f1e30bb44157e371c6e"
iuc
parents: 7
diff changeset
125 </assert_contents>
f11dedb74b83 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 206ac70388ea11b168366f1e30bb44157e371c6e"
iuc
parents: 7
diff changeset
126 </output>
f11dedb74b83 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 206ac70388ea11b168366f1e30bb44157e371c6e"
iuc
parents: 7
diff changeset
127 </test>
9
4b7dd5ff6497 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 384736acb5d2ae31d796c53031fad0e5da5424e3
iuc
parents: 8
diff changeset
128 <test><!-- test with a file containing NA and NaN values and the -narm parameter -->
4b7dd5ff6497 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 384736acb5d2ae31d796c53031fad0e5da5424e3
iuc
parents: 8
diff changeset
129 <param name="in_file" value="na_values_input.tsv" ftype="tabular" />
4b7dd5ff6497 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 384736acb5d2ae31d796c53031fad0e5da5424e3
iuc
parents: 8
diff changeset
130 <param name="grouping" value="2" />
4b7dd5ff6497 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 384736acb5d2ae31d796c53031fad0e5da5424e3
iuc
parents: 8
diff changeset
131 <param name="header_in" value="true" />
4b7dd5ff6497 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 384736acb5d2ae31d796c53031fad0e5da5424e3
iuc
parents: 8
diff changeset
132 <param name="print_full_line" value="false" />
4b7dd5ff6497 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 384736acb5d2ae31d796c53031fad0e5da5424e3
iuc
parents: 8
diff changeset
133 <param name="need_sort" value="true" />
4b7dd5ff6497 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 384736acb5d2ae31d796c53031fad0e5da5424e3
iuc
parents: 8
diff changeset
134 <param name="narm" value="true" />
4b7dd5ff6497 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 384736acb5d2ae31d796c53031fad0e5da5424e3
iuc
parents: 8
diff changeset
135 <repeat name="operations">
4b7dd5ff6497 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 384736acb5d2ae31d796c53031fad0e5da5424e3
iuc
parents: 8
diff changeset
136 <param name="op_name" value="mean" />
4b7dd5ff6497 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 384736acb5d2ae31d796c53031fad0e5da5424e3
iuc
parents: 8
diff changeset
137 <param name="op_column" value="3" />
4b7dd5ff6497 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 384736acb5d2ae31d796c53031fad0e5da5424e3
iuc
parents: 8
diff changeset
138 </repeat>
4b7dd5ff6497 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 384736acb5d2ae31d796c53031fad0e5da5424e3
iuc
parents: 8
diff changeset
139 <output name="out_file" ftype="tabular">
4b7dd5ff6497 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 384736acb5d2ae31d796c53031fad0e5da5424e3
iuc
parents: 8
diff changeset
140 <assert_contents>
4b7dd5ff6497 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 384736acb5d2ae31d796c53031fad0e5da5424e3
iuc
parents: 8
diff changeset
141 <has_n_lines n="2"/>
4b7dd5ff6497 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 384736acb5d2ae31d796c53031fad0e5da5424e3
iuc
parents: 8
diff changeset
142 <has_line_matching expression="DE\t173.5"/>
4b7dd5ff6497 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 384736acb5d2ae31d796c53031fad0e5da5424e3
iuc
parents: 8
diff changeset
143 <has_line_matching expression="NL\t177.5"/>
4b7dd5ff6497 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 384736acb5d2ae31d796c53031fad0e5da5424e3
iuc
parents: 8
diff changeset
144 </assert_contents>
4b7dd5ff6497 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 384736acb5d2ae31d796c53031fad0e5da5424e3
iuc
parents: 8
diff changeset
145 </output>
4b7dd5ff6497 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 384736acb5d2ae31d796c53031fad0e5da5424e3
iuc
parents: 8
diff changeset
146 </test>
0
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
147 </tests>
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
148 <help>
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
149 <![CDATA[
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
150 @HELP_HEADER@
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
151
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
152 **Syntax**
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
153
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
154 This tool performs common operations (such as summing, counting, mean, standard-deviation) on a tabular input file. The tool can also optionally group the input based on a given field.
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
155
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
156 -----
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
157
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
158 **Example 1**
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
159
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
160 - Find the average score in a statistics course for college students, grouped by their college major. The input file has three fields (Name,Major,Score) and a header line::
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
161
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
162 Name Major Score
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
163 Bryan Arts 68
8
f11dedb74b83 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 206ac70388ea11b168366f1e30bb44157e371c6e"
iuc
parents: 7
diff changeset
164 Gabriel Health-Medicine 100
0
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
165 Isaiah Arts 80
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
166 Tysza Business 92
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
167 Zackery Engineering 54
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
168 ...
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
169 ...
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
170
8
f11dedb74b83 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 206ac70388ea11b168366f1e30bb44157e371c6e"
iuc
parents: 7
diff changeset
171 - Grouping the input by the second column (*Major*), sorting the input, and performing operations **mean** and **sample standard deviation** on the third column (*Score*), gives::
0
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
172
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
173 GroupBy(Major) mean(Score) sstdev(Score)
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
174 Arts 68.9474 10.4215
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
175 Business 87.3636 5.18214
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
176 Engineering 66.5385 19.8814
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
177 Health-Medicine 90.6154 9.22441
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
178 Life-Sciences 55.3333 20.606
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
179 Social-Sciences 60.2667 17.2273
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
180
8
f11dedb74b83 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 206ac70388ea11b168366f1e30bb44157e371c6e"
iuc
parents: 7
diff changeset
181 Note that input needs sorting here, since the column used for grouping (*Major*) is not sorted.
f11dedb74b83 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 206ac70388ea11b168366f1e30bb44157e371c6e"
iuc
parents: 7
diff changeset
182
0
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
183 This sample file is available at http://www.gnu.org/software/datamash .
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
184
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
185 **Example 2**
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
186
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
187 - Using the UCSC RefSeq Human Gene Track, available at: http://hgdownload.soe.ucsc.edu/goldenPath/hg38/database/refGene.txt.gz
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
188
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
189 - List the number and identifiers of isoforms per gene. The gene identifier is in column 13, the isoform/transcript identifier is in column 2. Grouping by column 13 and performing **count** and **Combine all values** on column 2, gives::
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
190
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
191 GroupBy(field-13) count(field-2) collapse(field-2)
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
192 A1BG 1 NM_130786
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
193 A1BG-AS1 1 NR_015380
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
194 A1CF 6 NM_001198818,NM_001198819,NM_001198820,NM_014576,NM_138932,NM_138933
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
195 A2M 1 NM_000014
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
196 A2M-AS1 1 NR_026971
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
197 A2ML1 2 NM_001282424,NM_144670
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
198 ...
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
199
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
200 - Count how many transcripts are listed for each chromosome and strand. The chromosome is in column 3, the strand is in column 4, and the transcript identifiers are in column 2. Grouping by columns **3,4** and performing operation **count** on column 2, gives::
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
201
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
202 GroupBy(field-3) GroupBy(field-4) count(field-2)
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
203 chr1 + 2456
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
204 chr1 - 2431
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
205 chr2 + 1599
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
206 chr2 - 1419
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
207 chr3 + 1287
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
208 chr3 - 1249
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
209 ...
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
210
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
211 @HELP_FOOTER@
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
212 ]]>
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
213 </help>
2d03f8df7806 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/datamash commit 1fa5e1a5cfac88256d484ec20c35fc319e6ceb3b
iuc
parents:
diff changeset
214 </tool>