annotate cluster.tools/hclust.xml @ 9:a3c03541fe6f draft default tip

Uploaded
author peter-waltman
date Mon, 11 Mar 2013 17:30:48 -0400
parents a58527c632b7
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
1 <tool id="hcluster" name="Hierarchical Clustering (HAC)" force_history_refresh="True">
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
2 <command interpreter="python">hclust.py
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
3 -d $dataset
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
4 ${dist_obj}
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
5 -n ${direction}
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
6 -m ${distance_metric}
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
7 -l ${linkage}
8
a58527c632b7 Uploaded
peter-waltman
parents: 0
diff changeset
8
a58527c632b7 Uploaded
peter-waltman
parents: 0
diff changeset
9 #if str($numk) != "-1":
0
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
10 -k ${numk}
8
a58527c632b7 Uploaded
peter-waltman
parents: 0
diff changeset
11 #end if
a58527c632b7 Uploaded
peter-waltman
parents: 0
diff changeset
12
a58527c632b7 Uploaded
peter-waltman
parents: 0
diff changeset
13 #if str($direction) == "rows":
a58527c632b7 Uploaded
peter-waltman
parents: 0
diff changeset
14 -o ${rdata_output_rows}
a58527c632b7 Uploaded
peter-waltman
parents: 0
diff changeset
15 #end if
a58527c632b7 Uploaded
peter-waltman
parents: 0
diff changeset
16
a58527c632b7 Uploaded
peter-waltman
parents: 0
diff changeset
17 #if str($direction) == "cols":
a58527c632b7 Uploaded
peter-waltman
parents: 0
diff changeset
18 -o ${rdata_output_cols}
a58527c632b7 Uploaded
peter-waltman
parents: 0
diff changeset
19 #end if
0
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
20
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
21 </command>
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
22 <inputs>
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
23 <param name="dataset" type="data" format='tabular' label="Data Set" help="Specify the data matrix (tab-delimited) to be clustered"/>
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
24 <param name="dist_obj" type="boolean" label="Distance Object (R dist object)?" truevalue="-D" falsevalue="" checked="False" help="Check if the matrix contains the pairwise distances between a set of objects"/>
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
25 <param name="direction" type="select" label="Cluster Samples or Genes?" help="Specify the matrix dimension to cluster (see help below)">
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
26 <option value="cols">Columns (Samples)</option>
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
27 <option value="rows" selected='true'>Rows (Genes)</option>
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
28 </param>
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
29
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
30 <param name="distance_metric" type="select" label="Distance Metric" help="Specify the distance metric to use (see help below)">
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
31 <option value="cosine" selected='true'>Cosine</option>
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
32 <option value="abscosine">Absolute Cosine</option>
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
33 <option value="pearson">Pearson</option>
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
34 <option value="abspearson">Absolute Pearson</option>
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
35 <option value="spearman">Spearman</option>
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
36 <option value="kendall">Kendall</option>
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
37 <option value="euclidean">Euclidean</option>
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
38 <option value="maximum">Maximum</option>
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
39 <option value="manhattan">Manhattan (AKA city block)</option>
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
40 <option value="canberra">Canberra</option>
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
41 <option value="binary">Binary</option>
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
42 </param>
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
43
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
44 <param name="linkage" type="select" label="Linkage" help="Specify the linkage to use when clustering (see help below)">
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
45 <option value="average">Average</option>
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
46 <option value="centroid">Centroid</option>
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
47 <option value="complete" selected='true'>Complete</option>
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
48 <option value="mcquitty">McQuitty</option>
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
49 <option value="median">Median</option>
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
50 <option value="single">Single</option>
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
51 <option value="ward">Ward</option>
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
52 </param>
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
53
8
a58527c632b7 Uploaded
peter-waltman
parents: 0
diff changeset
54 <param name="numk" type="integer" label="Number of Clusters" value="-1" help="Specify the number of clusters to use (-1 to use default. See help below)."/>
0
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
55
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
56 </inputs>
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
57 <outputs>
8
a58527c632b7 Uploaded
peter-waltman
parents: 0
diff changeset
58 <data format="rdata" name="rdata_output_rows" label="Hierarchical Clustering Results; Gene Clusters (RData)">
a58527c632b7 Uploaded
peter-waltman
parents: 0
diff changeset
59 <filter>(direction)=="rows"</filter>
a58527c632b7 Uploaded
peter-waltman
parents: 0
diff changeset
60 </data>
a58527c632b7 Uploaded
peter-waltman
parents: 0
diff changeset
61 <data format="rdata" name="rdata_output_cols" label="Hierarchical Clustering Results; Sample Clusters (RData)">
a58527c632b7 Uploaded
peter-waltman
parents: 0
diff changeset
62 <filter>(direction)=="cols"</filter>
a58527c632b7 Uploaded
peter-waltman
parents: 0
diff changeset
63 </data>
0
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
64 </outputs>
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
65 <help>
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
66 .. class:: infomark
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
67
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
68 **Perform Hierarchical Clustering (Cluster Samples or Genes) on a specified data set**
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
69
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
70 ----
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
71
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
72 **Parameters**
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
73
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
74 - **Data Set** - Specify the data matrix to be clustered. Data must be formatted as follows:
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
75
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
76 * Tab-delimited
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
77 * Use row/column headers
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
78
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
79 - **Cluster Samples or Genes** - Specify the dimension of the matrix to cluster:
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
80
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
81 * Rows (Genes)
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
82 * Columns (Samples)
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
83
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
84 - **Distance Object** Specify whether or not the data set is a pairwise distance matrix
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
85
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
86 - **Distance Metric** Specify the distance metric to use. Choice of:
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
87
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
88 * Cosine (AKA uncentered pearson)
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
89 * Absolute Cosine (AKA uncentered pearson, absolute value)
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
90 * Pearson (pearson correlation)
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
91 * Absolute Pearson (pearson correlation, absolute value)
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
92 * Spearman (spearman correlation)
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
93 * Kendall (Kendall's Tau)
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
94 * Euclidean (euclidean distance)
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
95 * Maximum
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
96 * Manhattan (AKA city block)
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
97 * Canberra
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
98 * Binary
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
99
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
100 - **Linkage** Specify the linkage to use when clustering. Choice of:
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
101
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
102 * Average (see documentation for R's hclust function for explanation of choices)
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
103 * Single
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
104 * Complete
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
105 * Median
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
106 * Centroid
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
107 * McQuitty
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
108 * Ward
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
109
8
a58527c632b7 Uploaded
peter-waltman
parents: 0
diff changeset
110 - **Number of Clusters** Specify the number of clusters to use. If set to -1, default values will be used, with the default set as follows:
a58527c632b7 Uploaded
peter-waltman
parents: 0
diff changeset
111 * if samples/columns are being clustered, the **default** is 5.
a58527c632b7 Uploaded
peter-waltman
parents: 0
diff changeset
112 * if genes/rows are being clustered, the **default** is set to num_rows/30, e.g. if there are 600 rows/genes in the matrix, the default will be 20 clusters.
0
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
113
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
114 </help>
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
115 </tool>