annotate cluster.tools/partition.xml @ 9:a3c03541fe6f draft default tip

Uploaded
author peter-waltman
date Mon, 11 Mar 2013 17:30:48 -0400
parents a58527c632b7
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
1 <tool id="partiton_clust" name="Partition Clustering" force_history_refresh="True">
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
2 <command interpreter="python">partition.py
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
3 -d $dataset
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
4 ${dist_obj}
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
5 -n ${direction}
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
6 -a $alg_cond.algorithm
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
7 #if $alg_cond.algorithm == 'pam' # -m ${alg_cond.distance_metric}
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
8 #end if
8
a58527c632b7 Uploaded
peter-waltman
parents: 0
diff changeset
9
a58527c632b7 Uploaded
peter-waltman
parents: 0
diff changeset
10 #if str($numk) != "-1":
0
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
11 -k ${numk}
8
a58527c632b7 Uploaded
peter-waltman
parents: 0
diff changeset
12 #end if
a58527c632b7 Uploaded
peter-waltman
parents: 0
diff changeset
13
a58527c632b7 Uploaded
peter-waltman
parents: 0
diff changeset
14 #if str($direction) == "rows":
a58527c632b7 Uploaded
peter-waltman
parents: 0
diff changeset
15 -o ${rdata_output_rows}
a58527c632b7 Uploaded
peter-waltman
parents: 0
diff changeset
16 #end if
a58527c632b7 Uploaded
peter-waltman
parents: 0
diff changeset
17
a58527c632b7 Uploaded
peter-waltman
parents: 0
diff changeset
18 #if str($direction) == "cols":
a58527c632b7 Uploaded
peter-waltman
parents: 0
diff changeset
19 -o ${rdata_output_cols}
a58527c632b7 Uploaded
peter-waltman
parents: 0
diff changeset
20 #end if
a58527c632b7 Uploaded
peter-waltman
parents: 0
diff changeset
21
0
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
22
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
23 </command>
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
24 <inputs>
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
25 <param name="dataset" type="data" format='tabular' label="Data Set" help="Specify the data matrix (tab-delimited) to be clustered"/>
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
26 <param name="dist_obj" type="boolean" label="Distance Object (R dist object)?" truevalue="-D" falsevalue="" checked="False" help="Check if the matrix contains the pairwise distances between a set of objects"/>
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
27
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
28 <param name="direction" type="select" label="Cluster Columns or Rows?" help="Specify the matrix dimension to cluster (see help below)">
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
29 <option value="cols">Columns (Samples)</option>
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
30 <option value="rows" selected='true'>Rows (Genes)</option>
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
31 </param>
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
32
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
33 <conditional name='alg_cond'>
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
34 <param name="algorithm" type="select" label="PAM or K-means?" help="Specify the partition cluster method to use (see help below)">
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
35 <option value="km">K-means</option>
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
36 <option value="pam" selected='true'>PAM</option>
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
37 </param>
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
38 <when value='pam'>
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
39 <param name="distance_metric" type="select" label="Distance Metric" help="Specify the distance metric to use (see help below)">
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
40 <option value="cosine" selected='true'>Cosine</option>
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
41 <option value="abscosine">Absolute Cosine</option>
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
42 <option value="pearson">Pearson</option>
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
43 <option value="abspearson">Absolute Pearson</option>
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
44 <option value="spearman">Spearman</option>
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
45 <option value="kendall">Kendall</option>
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
46 <option value="euclidean">Euclidean</option>
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
47 <option value="maximum">Maximum</option>
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
48 <option value="manhattan">Manhattan (AKA city block)</option>
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
49 <option value="canberra">Canberra</option>
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
50 <option value="binary">Binary</option>
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
51 </param>
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
52 </when>
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
53 </conditional>
8
a58527c632b7 Uploaded
peter-waltman
parents: 0
diff changeset
54 <param name="numk" type="integer" label="Number of Clusters" value="-1" help="Specify the number of clusters to use (-1 to use default. See help below)."/>
0
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
55
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
56 </inputs>
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
57 <outputs>
8
a58527c632b7 Uploaded
peter-waltman
parents: 0
diff changeset
58 <data format="rdata" name="rdata_output_rows" label="Partition Clustering Results; Gene Clusters (RData)">
a58527c632b7 Uploaded
peter-waltman
parents: 0
diff changeset
59 <filter>(direction)=="rows"</filter>
a58527c632b7 Uploaded
peter-waltman
parents: 0
diff changeset
60 </data>
a58527c632b7 Uploaded
peter-waltman
parents: 0
diff changeset
61 <data format="rdata" name="rdata_output_cols" label="Partition Clustering Results; Sample Clusters (RData)">
a58527c632b7 Uploaded
peter-waltman
parents: 0
diff changeset
62 <filter>(direction)=="cols"</filter>
a58527c632b7 Uploaded
peter-waltman
parents: 0
diff changeset
63 </data>
0
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
64 </outputs>
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
65 <help>
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
66 .. class:: infomark
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
67
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
68 **Perform Partition Clustering (of samples or genes) on a specified data set**
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
69
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
70 ----
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
71
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
72 **Parameters**
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
73
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
74 - **Data Set** - Specify the data matrix to be clustered. Data must be formatted as follows:
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
75
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
76 * Tab-delimited
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
77 * Use row/column headers
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
78
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
79 - **Distance Object** Specify whether or not the data set is a pairwise distance matrix
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
80
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
81 - **Cluster Columns or Rows?** - Specify the dimension of the matrix to cluster:
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
82
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
83 * Rows (Genes)
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
84 * Columns (Samples)
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
85
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
86 - **PAM or K-means?** Specify which partition clustering method to use - users have choice of:
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
87
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
88 * PAM (Partitioning Around Medoids)
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
89 * K-means
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
90
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
91 - **Distance Metric** Specify the distance metric to use. Note, this is ONLY AVAILABLE IF PAM IS THE ALGORITHM BEING USED. Choice of:
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
92
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
93 * Cosine (AKA uncentered pearson)
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
94 * Absolute Cosine (AKA uncentered pearson, absolute value)
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
95 * Pearson (pearson correlation)
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
96 * Absolute Pearson (pearson correlation, absolute value)
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
97 * Spearman (spearman correlation)
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
98 * Kendall (Kendall's Tau)
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
99 * Euclidean (euclidean distance)
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
100 * Maximum
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
101 * Manhattan (AKA city block)
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
102 * Canberra
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
103 * Binary
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
104
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
105
8
a58527c632b7 Uploaded
peter-waltman
parents: 0
diff changeset
106 - **Number of Clusters** Specify the number of clusters to use. If set to -1, default values will be used, with the default set as follows:
a58527c632b7 Uploaded
peter-waltman
parents: 0
diff changeset
107 * if samples/columns are being clustered, the **default** is 5.
a58527c632b7 Uploaded
peter-waltman
parents: 0
diff changeset
108 * if genes/rows are being clustered, the **default** is set to num_rows/30, e.g. if there are 600 rows/genes in the matrix, the default will be 20 clusters.
0
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
109
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
110 </help>
0decf3fd54bc Uploaded
peter-waltman
parents:
diff changeset
111 </tool>