annotate perf.xml @ 1:7aa26fb0ac9e draft default tip

Uploaded
author bgruening
date Thu, 15 May 2014 16:58:26 -0400
parents e390b5b6b89c
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
1 <tool id="stats_perf_tool" name="Performance metrics" version="5.11.0">
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
2 <description>suitable for boolean classification problems (perf)</description>
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
3 <requirements>
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
4 <requirement type="package" version="5.11">perf</requirement>
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
5 </requirements>
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
6 <command>
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
7 perf
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
8 -t $threshold
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
9 #echo ' '.join(str($performance_measures).split(','))#
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
10 $plot
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
11 -file "${infile}"
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
12 2>/dev/null
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
13 > perf.out;
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
14
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
15 #if str($plot):
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
16 csplit --prefix 'perf' -s perf.out '/^$/';
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
17 cat perf00 | tr ' ' \\t > perf_plotting_data.out;
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
18 cat perf01 | awk '{printf("%s\t%s\n",$1,$2)}' > perf_results.out;
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
19 #else:
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
20 cat perf.out | awk '{printf("%s\t%s\n",$1,$2)}' > perf_results.out;
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
21 #end if
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
22
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
23 </command>
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
24 <inputs>
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
25 <param name="infile" format="tabular" type="data" label="File to select" help="1st col targets, 2nd col predictions (-file)"/>
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
26
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
27 <param name="performance_measures" multiple="True" type="select" display="checkboxes" label="Performance measures to compute"> <!-- checked values are space-joined and placed on the perf command line -->
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
28 <option value="-ACC" selected="True">Accuracy</option>
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
29 <option value="-RMS">Root Mean Squared Error</option>
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
30 <option value="-CXE">Mean Cross-Entropy</option>
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
31 <option value="-ROC" selected="True">ROC area</option>
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
32 <option value="-R50">ROC area up to 50 negative examples</option>
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
33 <option value="-SEN">Sensitivity</option>
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
34 <option value="-SPC">Specificity</option>
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
35 <option value="-NPV">Negative Predictive Value</option>
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
36 <option value="-PPV">Positive Predictive Value</option>
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
37 <option value="-PRE">Precision</option>
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
38 <option value="-REC">Recall</option>
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
39 <option value="-PRF">F1 score</option>
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
40 <option value="-PRB">Precision/Recall Break Even Point</option>
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
41 <option value="-APR" selected="True">Mean Average Precision</option>
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
42 <!--option value="-LFT">Lift (at threshold)</option>
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
43 <option value="-TOP1">Top 1: is the top ranked case positive</option>
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
44 <option value="-TOP10">Top 10: is there a positive in the top 10 ranked cases</option>
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
45 <option value="-NTOP"> How many positives in the top N ranked cases</option>
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
46 <option value="-RKL">Rank of *last* (poorest ranked) positive case</option>
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
47 <option value="-NRM">Norm error using metric</option>
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
48 <option value="-CST">Total cost using these cost values, plus min-cost results</option-->
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
49 <!--option value="-SAR">typically wACC = wROC = wRMS = 1.0</option-->
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
50 <!--option value="-CAL">CA1/CA2 scores</option-->
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
51 <!--option value="-SLQ">Slac Q-score</option-->
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
52 </param>
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
53
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
54 <param name="plot" type="select" label="Plotting type"> <!-- the chosen value is inserted verbatim into the perf command line, so each must be a valid "-plot <kind>" flag -->
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
55 <option value="" selected="True">No plot</option>
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
56 <option value="-plot roc">ROC plot</option>
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
57 <option value="-plot pr">Precision/Recall plot</option>
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
58 <option value="-plot lift">Lift versus threshold plot</option>
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
59 <option value="-plot cost">Cost versus threshold plot</option>
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
60 <option value="-plot acc">Accuracy versus threshold plot</option>
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
61 </param>
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
62
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
63 <param name="threshold" size="4" type="float" min="0" value="0.5" label="Threshold"/>
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
64
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
65 </inputs>
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
66
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
67 <outputs>
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
68 <data format="tabular" name="outfile" from_work_dir="perf_results.out" label="Performance measures from ${on_string}" />
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
69 <data format="tabular" name="outfile_plotting" from_work_dir="perf_plotting_data.out" label="Performance values from ${on_string}"> <!-- plotting data; only produced when a plot type is selected -->
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
70 <filter>plot != ''</filter> <!-- compare by value: identity ("is not") on strings is implementation-dependent -->
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
71 </data>
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
72 </outputs>
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
73 <tests>
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
74 <test>
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
75 <param name="infile" ftype="tabular" value="testperf.dat"/>
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
76 <param name="performance_measures" value="-ACC,-ROC,-APR" />
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
77 <output name="outfile" ftype="tabular" file="testperf.results" />
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
78 <output name="outfile_plotting" ftype="tabular" file="testperf.results.plot" />
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
79 </test>
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
80 </tests>
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
81 <help>
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
82
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
83 **What it does**
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
84
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
85 Perf calculates a variety of performance metrics suitable for boolean classification problems. Metrics include: accuracy, root-mean-squared-error, cross-entropy, precision, recall, precision/recall break-even point and F-score, area under the ROC curve, lift, weighted cost, top 1, top 10, rank of lowest positive case, q-score, several measures of probability calibration, etc.
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
86
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
87 For more information please refer to:
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
88
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
89 http://osmot.cs.cornell.edu/kddcup/software.html
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
90
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
91 </help>
e390b5b6b89c Uploaded
bgruening
parents:
diff changeset
92 </tool>