annotate kmersvm/index.html @ 11:3b0c30b3baf1 draft default tip

Uploaded
author test-svm
date Wed, 08 Aug 2012 19:20:14 -0400
parents
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
11
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
1 <!doctype html>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
2 <!-- paulirish.com/2008/conditional-stylesheets-vs-css-hacks-answer-neither/ -->
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
3 <!--[if lt IE 7]> <html class="no-js lt-ie9 lt-ie8 lt-ie7" lang="en"> <![endif]-->
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
4 <!--[if IE 7]> <html class="no-js lt-ie9 lt-ie8" lang="en"> <![endif]-->
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
5 <!--[if IE 8]> <html class="no-js lt-ie9" lang="en"> <![endif]-->
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
6 <!-- Consider adding a manifest.appcache: h5bp.com/d/Offline -->
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
7 <!--[if gt IE 8]><!--> <html class="no-js" lang="en"> <!--<![endif]-->
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
8 <head>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
9 <meta charset="utf-8">
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
10
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
11 <!-- Use the .htaccess and remove these lines to avoid edge case issues.
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
12 More info: h5bp.com/i/378 -->
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
13 <meta http-equiv="X-UA-Compatible" content="IE=edge,chrome=1">
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
14
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
15 <title>Installation for KmerSVM Tool from Galaxy ToolShed</title>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
16 <meta name="description" content="">
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
17
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
18 <!-- Mobile viewport optimized: h5bp.com/viewport -->
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
19 <meta name="viewport" content="width=device-width">
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
20
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
21 <!-- Place favicon.ico and apple-touch-icon.png in the root directory: mathiasbynens.be/notes/touch-icons -->
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
22
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
23 <link rel="stylesheet" href="css/style.css">
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
24
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
25 <!-- More ideas for your <head> here: h5bp.com/d/head-Tips -->
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
26
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
27 <!-- All JavaScript at the bottom, except this Modernizr build.
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
28 Modernizr enables HTML5 elements & feature detects for optimal performance.
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
29 Create your own custom Modernizr build: www.modernizr.com/download/ -->
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
30 <script src="js/libs/modernizr-2.5.3.min.js"></script>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
31 </head>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
32 <body>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
33 <!-- Prompt IE 6 users to install Chrome Frame. Remove this if you support IE 6.
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
34 chromium.org/developers/how-tos/chrome-frame-getting-started -->
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
35 <!--[if lt IE 7]><p class=chromeframe>Your browser is <em>ancient!</em> <a href="http://browsehappy.com/">Upgrade to a different browser</a> or <a href="http://www.google.com/chromeframe/?redirect=true">install Google Chrome Frame</a> to experience this site.</p><![endif]-->
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
36 <header>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
37
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
38 </header>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
39 <div role="main">
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
40 <header>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
41 <h1>Installation for KmerSVM Tool from Galaxy ToolShed</h1>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
42 </header>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
43
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
44 <p>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
45 Christopher Fletez-Brant, Dongwon Lee, Andrew McCallion and Michael A. Beer
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
46 </p>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
47 <p>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
48 KmerSVM can be downloaded from the Galaxy Tool Shed, located at <a>Dummy Link</a>. To install KmerSVM, download files from LINK BELOW. Untar/unzip the archive and move the resulting directory 'kmersvm' to '~/galaxy-dist/tools/'.
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
49 </p>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
50 <section>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
51 <h2>Dependencies</h2>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
52 <h3>Mac Users:</h3>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
53 <ol>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
54 <li>Xcode (Mac App Store)</li>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
55 <li>Fortran compiler (http://gcc.gnu.org/wiki/GFortran/)</li>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
56 </ol>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
57 <h3>Everyone:</h3>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
58 <ol>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
59 <li>Swig (http://www.swig.org)</li>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
60 <li>Numpy (numpy.scipy.org)</li>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
61 <li>Shogun Toolbox, v0.9.3 - v1.10 (http://www.shogun-toolbox.org/)</li>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
62 <li>Bitarray (http://pypi.python.org/pypi/bitarray/)</li>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
63 <li>R (http://www.r-project.org)</li>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
64 <li>ROCR R Package (Available through CRAN)</li>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
65 </ol>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
66 <p>Note that binaries are provided for Mac users. However, if difficulties in installation are encountered, it may be beneficial to compile the Fortran compiler from source. Additionally, be sure to add the location of your Shogun installation to the PYTHONPATH.</p>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
67 <p>Further, KmerSVM has been tested on Python 2.6 and 2.7 on Linux and Mac OS X. At this time KmerSVM has not been tested on Windows.</p>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
68 </section>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
69 <section>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
70 <h2>Required Files</h2>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
71 <p>For efficient access to genome-wide data "Generate Null Sequence" and
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
72 "Sequence Profiles" rely on access to binary files (indices) generated
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
73 by using the script 'nullseq_build_indices.py'. Download the *.tar or
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
74 *.zip files for each genome to be analyzed. To create indices for a
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
75 specific genome, call nullseq_build_indices.py as follows:</p>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
76 <pre>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
77 python nullseq_build_indices.py &lt;GENOME ARCHIVE FILE&gt; &lt;GENOME BUILD&gt;
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
78 </pre>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
79 <p>Next copy nullseq_indices.loc.sample to tool-data/nullseq_indices.loc
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
80 and add the path to the created indices following the instructions
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
81 included in that file.</p>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
82 <p>To generate FASTA files for training or scoring purposes, KmerSVM uses
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
83 the built-in tool "Fetch Sequences", which looks for genomes in *.nib or
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
84 *.2bit format. Download genomes related to your data and update the
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
85 'alignseq.loc' file to include the location of these genomes according
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
86 to directions in that file. FASTA files can also be provided by the user.</p>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
87 <p>Move the file sample_roc_chen.png to the 'tool-data' directory.</p>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
88 </section>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
89 <section>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
90 <h2>tool_conf.xml</h2>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
91 <p>Add the following lines to tool_conf.xml to make tools visible in Galaxy:</p>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
92 <pre>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
93 &lt;section name="SVM Tools" id="kmersvm"&gt;
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
94 &lt;tool file="kmersvm/classify.xml"/&gt;
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
95 &lt;tool file="kmersvm/nullseq.xml"/&gt;
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
96 &lt;tool file="kmersvm/rocprcurve.xml"/&gt;
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
97 &lt;tool file="kmersvm/train.xml"/&gt;
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
98 &lt;tool file="kmersvm/split_genome.xml"/&gt;
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
99 &lt;tool file="kmersvm/seqprofile.xml" /&gt;
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
100 &lt;/section&gt;
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
101 </pre>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
102 </section>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
103 <section>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
104 <h2>Tool Tests</h2>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
105 <p>To run tests on the tools "Train SVM", "Score Sequences of Interest" and
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
106 "Split Genome", move the following files to the 'test-data' directory:</p>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
107 <ul>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
108 <li>classify_output.out</li>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
109 <li>classify_test.fa</li>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
110 <li>kmersvm_output_weights.out</li>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
111 <li>test_positive.fa</li>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
112 <li>test_negative.fa</li>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
113 <li>test_weights.out</li>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
114 <li>train_predictions.out</li>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
115 </ul>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
116 <p>IDs for KmerSVM tests can be found by calling run_functional_tests.sh with the '-list' flag.</p>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
117 </section>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
118 <section>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
119 <h2>Non-Galaxy-Based Usage</h2>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
120 <p>The KmerSVM suite can be run without using the Galaxy framework. Each tool exists as
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
121 a standalone Python script (all located in /scripts) which can be called from the command
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
122 line. Specific documentation can be found within each tool's Python file, or by calling the script with no arguments. A general
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
123 workflow can be found in INSERT_PAPER_TITLE_HERE, which can be followed by calling
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
124 each of the relevant Python scripts as outlined below, with the exception that users will have to provide
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
125 needed FASTA files themselves.</p>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
126 <p>A simple workflow for the KmerSVM suite is as follows: </p>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
127 <ol>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
128 <li>python nullseq_build_indices.py &lt;TARBALL OR ZIP OF GENOME&gt; &lt;GENOME BUILD&gt;</li>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
129 <li>python nullseq_generate &lt;INPUT FILE&gt; &lt;GENOME BUILD&gt; &lt;PATH TO INDEX FILES&gt; #This assumes no negative data sets. Output will need to be converted to FASTA. Skip if negative data is provided.</li>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
130 <li>python kmersvm_train.py &lt;POSITIVE FASTA&gt; &lt;NEGATIVE FASTA&gt; #Outputs will be WEIGHTS, PREDICTIONS</li>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
131 <li>python split_genome.py &lt;INPUT BED FILE&gt; #Skip if you already have a list of regions you want to test. Output is TEST_SEQS, which will need to be converted to FASTA.</li>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
132 <li>python kmersvm_classify.py &lt;WEIGHTS&gt; &lt;TEST_SEQS&gt;</li>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
133 </ol>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
134 <p>Additionally, for any BED file, sequence composition (in terms of length, GC content and repeat fraction) can be obtained by calling 'make profile' as follows:</p>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
135 <p>python make_profile.py &lt;BEDFILE&gt; &lt;BUILDNAME&gt; &lt;BASE_DIR&gt; &lt;OUT_FILE&gt;</p>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
136 <p>Note that each tool has its own parameters, the manipulation of which allows the user to further customize their analysis. To learn more about a particular tool, simply call it without passing it any arguments.</p>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
137 </section>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
138
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
139 </div>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
140 <footer>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
141
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
142 </footer>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
143
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
144
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
145 <!-- JavaScript at the bottom for fast page loading -->
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
146
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
147 <!-- Grab Google CDN's jQuery, with a protocol relative URL; fall back to local if offline -->
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
148 <script src="//ajax.googleapis.com/ajax/libs/jquery/1.7.1/jquery.min.js"></script>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
149 <script>window.jQuery || document.write('<script src="js/libs/jquery-1.7.1.min.js"><\/script>')</script>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
150
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
151 <!-- scripts concatenated and minified via build script -->
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
152 <script src="js/plugins.js"></script>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
153 <script src="js/script.js"></script>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
154 <!-- end scripts -->
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
155
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
156 <!-- Asynchronous Google Analytics snippet. Change UA-XXXXX-X to be your site's ID.
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
157 mathiasbynens.be/notes/async-analytics-snippet -->
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
158 <script>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
159 var _gaq=[['_setAccount','UA-XXXXX-X'],['_trackPageview']];
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
160 (function(d,t){var g=d.createElement(t),s=d.getElementsByTagName(t)[0];
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
161 g.src=('https:'==location.protocol?'//ssl':'//www')+'.google-analytics.com/ga.js';
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
162 s.parentNode.insertBefore(g,s)}(document,'script'));
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
163 </script>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
164 </body>
3b0c30b3baf1 Uploaded
test-svm
parents:
diff changeset
165 </html>