annotate split_fasta.Rmd @ 1:8ef62ca3938b draft default tip

initial tool
author mingchen0919
date Mon, 09 Apr 2018 12:30:44 -0400
parents efd5c022b54d
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
efd5c022b54d planemo upload
mingchen0919
parents:
diff changeset
1 ---
efd5c022b54d planemo upload
mingchen0919
parents:
diff changeset
2 title: 'FASTA splitter'
efd5c022b54d planemo upload
mingchen0919
parents:
diff changeset
3 output:
efd5c022b54d planemo upload
mingchen0919
parents:
diff changeset
4 html_document:
efd5c022b54d planemo upload
mingchen0919
parents:
diff changeset
5 highlight: pygments
efd5c022b54d planemo upload
mingchen0919
parents:
diff changeset
6 ---
efd5c022b54d planemo upload
mingchen0919
parents:
diff changeset
7
efd5c022b54d planemo upload
mingchen0919
parents:
diff changeset
8 ```{r setup, include=FALSE, warning=FALSE, message=FALSE}
efd5c022b54d planemo upload
mingchen0919
parents:
diff changeset
9 knitr::opts_chunk$set(echo = TRUE, error = TRUE)
efd5c022b54d planemo upload
mingchen0919
parents:
diff changeset
10 ```
efd5c022b54d planemo upload
mingchen0919
parents:
diff changeset
11
efd5c022b54d planemo upload
mingchen0919
parents:
diff changeset
12
efd5c022b54d planemo upload
mingchen0919
parents:
diff changeset
13 ```{bash}
efd5c022b54d planemo upload
mingchen0919
parents:
diff changeset
14 # build job-script
efd5c022b54d planemo upload
mingchen0919
parents:
diff changeset
15 mkdir -p ${WORKING_DIR}/fasta_files
efd5c022b54d planemo upload
mingchen0919
parents:
diff changeset
16
efd5c022b54d planemo upload
mingchen0919
parents:
diff changeset
17 # job-script.sh
efd5c022b54d planemo upload
mingchen0919
parents:
diff changeset
18 cat <<EOF >${X_d}/job-script.sh
efd5c022b54d planemo upload
mingchen0919
parents:
diff changeset
19 ${X_t}/split_multifasta.pl \\
efd5c022b54d planemo upload
mingchen0919
parents:
diff changeset
20 --input_file=${X_A} \\
efd5c022b54d planemo upload
mingchen0919
parents:
diff changeset
21 --seqs_per_file=${X_B} \\
efd5c022b54d planemo upload
mingchen0919
parents:
diff changeset
22 --output_dir=${WORKING_DIR}/fasta_files > ${X_d}/fasta_splitter-log.txt 2>&1
efd5c022b54d planemo upload
mingchen0919
parents:
diff changeset
23 EOF
efd5c022b54d planemo upload
mingchen0919
parents:
diff changeset
24 ```
efd5c022b54d planemo upload
mingchen0919
parents:
diff changeset
25
efd5c022b54d planemo upload
mingchen0919
parents:
diff changeset
26 ```{bash, 'run jobs', echo=FALSE}
efd5c022b54d planemo upload
mingchen0919
parents:
diff changeset
27 # run job script, always use absolute path.
efd5c022b54d planemo upload
mingchen0919
parents:
diff changeset
28 # we want to run all jobs within the working path.
efd5c022b54d planemo upload
mingchen0919
parents:
diff changeset
29 sh ${X_d}/job-script.sh
efd5c022b54d planemo upload
mingchen0919
parents:
diff changeset
30 ```
efd5c022b54d planemo upload
mingchen0919
parents:
diff changeset
31
efd5c022b54d planemo upload
mingchen0919
parents:
diff changeset
32 ```{r, 'display output directory contents', results='asis', echo=FALSE}
efd5c022b54d planemo upload
mingchen0919
parents:
diff changeset
33 ## after the job is done, we list all files from the output directory.
efd5c022b54d planemo upload
mingchen0919
parents:
diff changeset
34 ## each file is displayed with its path relative to the output directory.
efd5c022b54d planemo upload
mingchen0919
parents:
diff changeset
35
efd5c022b54d planemo upload
mingchen0919
parents:
diff changeset
36 cat('##All output files')
efd5c022b54d planemo upload
mingchen0919
parents:
diff changeset
37 cat('\n\n')
efd5c022b54d planemo upload
mingchen0919
parents:
diff changeset
38 all_files = list.files(path = opt$X_d,
efd5c022b54d planemo upload
mingchen0919
parents:
diff changeset
39 full.names = TRUE,
efd5c022b54d planemo upload
mingchen0919
parents:
diff changeset
40 recursive = TRUE)
efd5c022b54d planemo upload
mingchen0919
parents:
diff changeset
41
efd5c022b54d planemo upload
mingchen0919
parents:
diff changeset
42 for (f in sub(opt$X_d, '.', all_files) ) {
efd5c022b54d planemo upload
mingchen0919
parents:
diff changeset
43 cat('* [', f, '](', f, ')\n')
efd5c022b54d planemo upload
mingchen0919
parents:
diff changeset
44 }
efd5c022b54d planemo upload
mingchen0919
parents:
diff changeset
45 cat('\n')
efd5c022b54d planemo upload
mingchen0919
parents:
diff changeset
46 ```
efd5c022b54d planemo upload
mingchen0919
parents:
diff changeset
47