annotate linear_regression.xml @ 1:2e7bc1bb2dbe draft default tip

Uploaded
author iuc
date Fri, 09 Jan 2015 12:56:07 -0500
parents ffcdde989859
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
1
2e7bc1bb2dbe Uploaded
iuc
parents: 0
diff changeset
1 <tool id="LinearRegression1" name="Perform Linear Regression" version="1.1.0">
2e7bc1bb2dbe Uploaded
iuc
parents: 0
diff changeset
2 <description> </description>
2e7bc1bb2dbe Uploaded
iuc
parents: 0
diff changeset
3 <expand macro="requirements" />
2e7bc1bb2dbe Uploaded
iuc
parents: 0
diff changeset
4 <macros>
2e7bc1bb2dbe Uploaded
iuc
parents: 0
diff changeset
5 <import>statistic_tools_macros.xml</import>
2e7bc1bb2dbe Uploaded
iuc
parents: 0
diff changeset
6 </macros>
2e7bc1bb2dbe Uploaded
iuc
parents: 0
diff changeset
7 <command interpreter="python">
2e7bc1bb2dbe Uploaded
iuc
parents: 0
diff changeset
8 <![CDATA[
2e7bc1bb2dbe Uploaded
iuc
parents: 0
diff changeset
9 linear_regression.py
2e7bc1bb2dbe Uploaded
iuc
parents: 0
diff changeset
10 $input1
2e7bc1bb2dbe Uploaded
iuc
parents: 0
diff changeset
11 $response_col
2e7bc1bb2dbe Uploaded
iuc
parents: 0
diff changeset
12 $predictor_cols
2e7bc1bb2dbe Uploaded
iuc
parents: 0
diff changeset
13 $out_file1
2e7bc1bb2dbe Uploaded
iuc
parents: 0
diff changeset
14 $out_file2
2e7bc1bb2dbe Uploaded
iuc
parents: 0
diff changeset
15 1>/dev/null
2e7bc1bb2dbe Uploaded
iuc
parents: 0
diff changeset
16 ]]>
2e7bc1bb2dbe Uploaded
iuc
parents: 0
diff changeset
17 </command>
2e7bc1bb2dbe Uploaded
iuc
parents: 0
diff changeset
18 <inputs>
2e7bc1bb2dbe Uploaded
iuc
parents: 0
diff changeset
19 <param format="tabular" name="input1" type="data" label="Select data" help="Dataset missing? See TIP below."/>
2e7bc1bb2dbe Uploaded
iuc
parents: 0
diff changeset
20 <param name="response_col" label="Response column (Y)" type="data_column" data_ref="input1" numerical="True"/>
2e7bc1bb2dbe Uploaded
iuc
parents: 0
diff changeset
21 <param name="predictor_cols" label="Predictor columns (X)" type="data_column" data_ref="input1" numerical="True" multiple="true" >
2e7bc1bb2dbe Uploaded
iuc
parents: 0
diff changeset
22 <validator type="no_options" message="Please select at least one column."/>
2e7bc1bb2dbe Uploaded
iuc
parents: 0
diff changeset
23 </param>
2e7bc1bb2dbe Uploaded
iuc
parents: 0
diff changeset
24 </inputs>
2e7bc1bb2dbe Uploaded
iuc
parents: 0
diff changeset
25 <outputs>
2e7bc1bb2dbe Uploaded
iuc
parents: 0
diff changeset
26 <data format="input" name="out_file1" metadata_source="input1" />
2e7bc1bb2dbe Uploaded
iuc
parents: 0
diff changeset
27 <data format="pdf" name="out_file2" />
2e7bc1bb2dbe Uploaded
iuc
parents: 0
diff changeset
28 </outputs>
2e7bc1bb2dbe Uploaded
iuc
parents: 0
diff changeset
29 <tests>
2e7bc1bb2dbe Uploaded
iuc
parents: 0
diff changeset
30 <test>
2e7bc1bb2dbe Uploaded
iuc
parents: 0
diff changeset
31 <param name="input1" value="regr_inp.tabular"/>
2e7bc1bb2dbe Uploaded
iuc
parents: 0
diff changeset
32 <param name="response_col" value="3"/>
2e7bc1bb2dbe Uploaded
iuc
parents: 0
diff changeset
33 <param name="predictor_cols" value="1,2"/>
2e7bc1bb2dbe Uploaded
iuc
parents: 0
diff changeset
34 <output name="out_file1" file="regr_out.tabular"/>
2e7bc1bb2dbe Uploaded
iuc
parents: 0
diff changeset
35 <output name="out_file2" file="regr_out.pdf"/>
2e7bc1bb2dbe Uploaded
iuc
parents: 0
diff changeset
36 </test>
2e7bc1bb2dbe Uploaded
iuc
parents: 0
diff changeset
37 </tests>
2e7bc1bb2dbe Uploaded
iuc
parents: 0
diff changeset
38 <help>
2e7bc1bb2dbe Uploaded
iuc
parents: 0
diff changeset
39 <![CDATA[
2e7bc1bb2dbe Uploaded
iuc
parents: 0
diff changeset
40
2e7bc1bb2dbe Uploaded
iuc
parents: 0
diff changeset
41
2e7bc1bb2dbe Uploaded
iuc
parents: 0
diff changeset
42 .. class:: infomark
2e7bc1bb2dbe Uploaded
iuc
parents: 0
diff changeset
43
2e7bc1bb2dbe Uploaded
iuc
parents: 0
diff changeset
44 **TIP:** If your data is not TAB delimited, use *Edit Datasets->Convert characters*
2e7bc1bb2dbe Uploaded
iuc
parents: 0
diff changeset
45
2e7bc1bb2dbe Uploaded
iuc
parents: 0
diff changeset
46 -----
2e7bc1bb2dbe Uploaded
iuc
parents: 0
diff changeset
47
2e7bc1bb2dbe Uploaded
iuc
parents: 0
diff changeset
48 .. class:: infomark
2e7bc1bb2dbe Uploaded
iuc
parents: 0
diff changeset
49
2e7bc1bb2dbe Uploaded
iuc
parents: 0
diff changeset
50 **What it does**
2e7bc1bb2dbe Uploaded
iuc
parents: 0
diff changeset
51
2e7bc1bb2dbe Uploaded
iuc
parents: 0
diff changeset
52 This tool uses the 'lm' function from the R statistical package to perform linear regression on the input data. It outputs two files: one containing the summary statistics of the performed regression, and the other containing diagnostic plots to check whether the model assumptions are satisfied.
2e7bc1bb2dbe Uploaded
iuc
parents: 0
diff changeset
53
2e7bc1bb2dbe Uploaded
iuc
parents: 0
diff changeset
54 *R Development Core Team (2009). R: A language and environment for statistical computing. R Foundation for Statistical Computing, Vienna, Austria. ISBN 3-900051-07-0, URL http://www.R-project.org.*
2e7bc1bb2dbe Uploaded
iuc
parents: 0
diff changeset
55
2e7bc1bb2dbe Uploaded
iuc
parents: 0
diff changeset
56 -----
2e7bc1bb2dbe Uploaded
iuc
parents: 0
diff changeset
57
2e7bc1bb2dbe Uploaded
iuc
parents: 0
diff changeset
58 .. class:: warningmark
2e7bc1bb2dbe Uploaded
iuc
parents: 0
diff changeset
59
2e7bc1bb2dbe Uploaded
iuc
parents: 0
diff changeset
60 **Note**
2e7bc1bb2dbe Uploaded
iuc
parents: 0
diff changeset
61
2e7bc1bb2dbe Uploaded
iuc
parents: 0
diff changeset
62 - This tool currently treats all predictor and response variables as continuous numeric variables. Running the tool on categorical variables might produce incorrect results.
2e7bc1bb2dbe Uploaded
iuc
parents: 0
diff changeset
63
2e7bc1bb2dbe Uploaded
iuc
parents: 0
diff changeset
64 - Rows containing non-numeric (or missing) data in any of the chosen columns will be excluded from the analysis.
2e7bc1bb2dbe Uploaded
iuc
parents: 0
diff changeset
65
2e7bc1bb2dbe Uploaded
iuc
parents: 0
diff changeset
66 - The summary statistics in the output are described below:
2e7bc1bb2dbe Uploaded
iuc
parents: 0
diff changeset
67
2e7bc1bb2dbe Uploaded
iuc
parents: 0
diff changeset
68 - sigma: the square root of the estimated variance of the random error (standard error of the residuals)
2e7bc1bb2dbe Uploaded
iuc
parents: 0
diff changeset
69 - R-squared: the fraction of variance explained by the model
2e7bc1bb2dbe Uploaded
iuc
parents: 0
diff changeset
70 - Adjusted R-squared: the R-squared statistic above, adjusted to penalize for the number of predictors (p)
2e7bc1bb2dbe Uploaded
iuc
parents: 0
diff changeset
71 - p-value: p-value for the t-test of the null hypothesis that the corresponding slope is equal to zero against the two-sided alternative.
2e7bc1bb2dbe Uploaded
iuc
parents: 0
diff changeset
72
2e7bc1bb2dbe Uploaded
iuc
parents: 0
diff changeset
73
2e7bc1bb2dbe Uploaded
iuc
parents: 0
diff changeset
74 ]]>
2e7bc1bb2dbe Uploaded
iuc
parents: 0
diff changeset
75 </help>
2e7bc1bb2dbe Uploaded
iuc
parents: 0
diff changeset
76 </tool>