annotate 05_per_base_sequence_content.Rmd @ 1:645291efd2e7 draft

working version
author mingchen0919
date Tue, 27 Feb 2018 10:36:24 -0500
parents f74fdae99053
children b9c9d1dacda6
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
1
645291efd2e7 working version
mingchen0919
parents: 0
diff changeset
1 ---
645291efd2e7 working version
mingchen0919
parents: 0
diff changeset
2 output: html_document
645291efd2e7 working version
mingchen0919
parents: 0
diff changeset
3 ---
645291efd2e7 working version
mingchen0919
parents: 0
diff changeset
4
645291efd2e7 working version
mingchen0919
parents: 0
diff changeset
5 ```{r setup, include=FALSE, warning=FALSE, message=FALSE}
645291efd2e7 working version
mingchen0919
parents: 0
diff changeset
6 knitr::opts_chunk$set(
645291efd2e7 working version
mingchen0919
parents: 0
diff changeset
7 echo = as.logical(opt$X_e),
645291efd2e7 working version
mingchen0919
parents: 0
diff changeset
8 error = TRUE,
645291efd2e7 working version
mingchen0919
parents: 0
diff changeset
9 eval = TRUE
645291efd2e7 working version
mingchen0919
parents: 0
diff changeset
10 )
645291efd2e7 working version
mingchen0919
parents: 0
diff changeset
11 ```
645291efd2e7 working version
mingchen0919
parents: 0
diff changeset
12
645291efd2e7 working version
mingchen0919
parents: 0
diff changeset
13
645291efd2e7 working version
mingchen0919
parents: 0
diff changeset
14 # Per base sequence content
645291efd2e7 working version
mingchen0919
parents: 0
diff changeset
15
645291efd2e7 working version
mingchen0919
parents: 0
diff changeset
16 ```{r 'Per base sequence content', fig.width=10}
645291efd2e7 working version
mingchen0919
parents: 0
diff changeset
17 ## reads 1
645291efd2e7 working version
mingchen0919
parents: 0
diff changeset
18 pbsc_1 = extract_data_module(paste0(opt$X_d, '/read_1_fastqc/fastqc_data.txt'), 'Per base sequence content')
645291efd2e7 working version
mingchen0919
parents: 0
diff changeset
19 pbsc_1$id = seq_along(pbsc_1$X.Base)  # positional index for the x axis; seq_along() stays empty for a zero-row module, whereas 1:length() would yield c(1, 0)
645291efd2e7 working version
mingchen0919
parents: 0
diff changeset
20
645291efd2e7 working version
mingchen0919
parents: 0
diff changeset
21 melt_pbsc_1 = melt(pbsc_1, id=c('X.Base', 'id'))
645291efd2e7 working version
mingchen0919
parents: 0
diff changeset
22 melt_pbsc_1$trim = 'before'
645291efd2e7 working version
mingchen0919
parents: 0
diff changeset
23
645291efd2e7 working version
mingchen0919
parents: 0
diff changeset
24
645291efd2e7 working version
mingchen0919
parents: 0
diff changeset
25 ## reads 2
645291efd2e7 working version
mingchen0919
parents: 0
diff changeset
26 pbsc_2 = extract_data_module(paste0(opt$X_d, '/read_2_fastqc/fastqc_data.txt'), 'Per base sequence content')
645291efd2e7 working version
mingchen0919
parents: 0
diff changeset
27 pbsc_2$id = seq_along(pbsc_2$X.Base)  # positional index for the x axis; seq_along() stays empty for a zero-row module, whereas 1:length() would yield c(1, 0)
645291efd2e7 working version
mingchen0919
parents: 0
diff changeset
28
645291efd2e7 working version
mingchen0919
parents: 0
diff changeset
29 melt_pbsc_2 = melt(pbsc_2, id=c('X.Base', 'id'))
645291efd2e7 working version
mingchen0919
parents: 0
diff changeset
30 melt_pbsc_2$trim = 'after'
645291efd2e7 working version
mingchen0919
parents: 0
diff changeset
31
645291efd2e7 working version
mingchen0919
parents: 0
diff changeset
32 comb_pbsc = rbind(melt_pbsc_1, melt_pbsc_2)
645291efd2e7 working version
mingchen0919
parents: 0
diff changeset
33 comb_pbsc$trim = factor(comb_pbsc$trim, levels = c('before', 'after'))  # explicit level order: 'before' first, then 'after'
645291efd2e7 working version
mingchen0919
parents: 0
diff changeset
34
645291efd2e7 working version
mingchen0919
parents: 0
diff changeset
35 p = ggplot(data = comb_pbsc, aes(x = id, y = value, color = variable)) +
645291efd2e7 working version
mingchen0919
parents: 0
diff changeset
36 geom_line() +
645291efd2e7 working version
mingchen0919
parents: 0
diff changeset
37 facet_grid(. ~ trim) +
645291efd2e7 working version
mingchen0919
parents: 0
diff changeset
38 xlim(min(comb_pbsc$id), max(comb_pbsc$id)) +
645291efd2e7 working version
mingchen0919
parents: 0
diff changeset
39 ylim(0, 100) +
645291efd2e7 working version
mingchen0919
parents: 0
diff changeset
40 xlab('Position in read (bp)') +
645291efd2e7 working version
mingchen0919
parents: 0
diff changeset
41 ylab('')
645291efd2e7 working version
mingchen0919
parents: 0
diff changeset
42 ggplotly(p)
645291efd2e7 working version
mingchen0919
parents: 0
diff changeset
43 ```