annotate 02_per_base_sequence_quality.Rmd @ 8:94762f1cb779 draft

planemo upload commit 76f9ca75d5b1c0c0fad6c10876d9dfeba7d5ecff-dirty
author mingchen0919
date Mon, 30 Apr 2018 16:15:39 -0400
parents b9c9d1dacda6
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
1
645291efd2e7 working version
mingchen0919
parents: 0
diff changeset
1 ---
645291efd2e7 working version
mingchen0919
parents: 0
diff changeset
2 output: html_document
645291efd2e7 working version
mingchen0919
parents: 0
diff changeset
3 ---
645291efd2e7 working version
mingchen0919
parents: 0
diff changeset
4
645291efd2e7 working version
mingchen0919
parents: 0
diff changeset
```{r setup, include=FALSE, warning=FALSE, message=FALSE}
# Report-wide chunk defaults: hide the R source (echo = FALSE) and keep
# rendering when a chunk raises an error (error = TRUE).
knitr::opts_chunk$set(echo = FALSE, error = TRUE)

# Package-level knitr option: turn off progress output while knitting.
knitr::opts_knit$set(progress = FALSE)
```
645291efd2e7 working version
mingchen0919
parents: 0
diff changeset
9
3
b9c9d1dacda6 reformat code
mingchen0919
parents: 1
diff changeset
10 ### Per base sequence quality
1
645291efd2e7 working version
mingchen0919
parents: 0
diff changeset
11
645291efd2e7 working version
mingchen0919
parents: 0
diff changeset
```{r 'per base sequence quality', fig.width=10}
# Per-base sequence quality of the two FastQC runs, drawn as side-by-side
# box plots (one facet per run) with the mean quality overlaid as a line.
#
# `opt` and `extract_data_module()` are defined outside this chunk.
# NOTE(review): the helper presumably returns a data.frame with one row per
# base position (or position bin) and the FastQC columns referenced below
# (X.Base, Mean, Median, Lower.Quartile, ...) -- confirm against its definition.

## reads 1
pbsq_1 <- extract_data_module(
  paste0(opt$X_d, '/read_1_fastqc/fastqc_data.txt'),
  'Per base sequence quality'
)
# seq_len()/rep() instead of 1:length() and scalar recycling, so that a
# zero-row module does not abort the chunk with a row-count mismatch.
pbsq_1$id <- seq_len(nrow(pbsq_1))
pbsq_1$trim <- rep('before', nrow(pbsq_1))

## reads 2
pbsq_2 <- extract_data_module(
  paste0(opt$X_d, '/read_2_fastqc/fastqc_data.txt'),
  'Per base sequence quality'
)
pbsq_2$id <- seq_len(nrow(pbsq_2))
pbsq_2$trim <- rep('after', nrow(pbsq_2))

# Stack both tables; the factor levels fix the facet order (before, after).
comb_pbsq <- rbind(pbsq_1, pbsq_2)
comb_pbsq$trim <- factor(comb_pbsq$trim, levels = c('before', 'after'))

# Both facets share one x scale, so take tick positions and labels from the
# longer table; otherwise the tail of the longer run is left without ticks.
# Behaviour is unchanged when pbsq_2 has at least as many rows as pbsq_1.
pbsq_axis <- if (nrow(pbsq_1) > nrow(pbsq_2)) pbsq_1 else pbsq_2

# The whiskers end at the 90th percentile, not at the upper quartile. Values
# beyond the scale limits are dropped by ggplot2, so the upper limit has to
# clear every statistic that is drawn.
pbsq_y_max <- max(
  comb_pbsq$Upper.Quartile,
  comb_pbsq$X90th.Percentile,
  comb_pbsq$Mean,
  na.rm = TRUE
) + 5

p <- ggplot(data = comb_pbsq) +
  geom_boxplot(
    mapping = aes(
      x = id,
      # One box per position: with stat = 'identity' every row is its own
      # box, and ggplot2 requires exactly one row per group.
      group = id,
      lower = Lower.Quartile,
      upper = Upper.Quartile,
      middle = Median,
      ymin = X10th.Percentile,
      ymax = X90th.Percentile
    ),
    stat = 'identity',
    # Constant appearance is set outside aes(), so no identity scale is needed.
    fill = 'yellow'
  ) +
  geom_line(mapping = aes(x = id, y = Mean), colour = 'red') +
  scale_x_continuous(
    name = 'Position in read (bp)',
    breaks = pbsq_axis$id,
    labels = pbsq_axis$X.Base
  ) +
  scale_y_continuous(limits = c(0, pbsq_y_max)) +
  facet_grid(. ~ trim) +
  theme(
    axis.text.x = element_text(size = 5),
    panel.background = element_rect(fill = NA),
    panel.grid.major.y = element_line(color = 'blue', size = 0.1)
  )
p
```
1
645291efd2e7 working version
mingchen0919
parents: 0
diff changeset
46