annotate segmentation_sequenza.R @ 0:0e54da14f831 draft

"planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit fd049d0796cbfaa6c41a7d80e84d3a734b30acc8"
author artbio
date Thu, 18 Feb 2021 18:59:53 +0000
parents
children 9265faa93098
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
0e54da14f831 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit fd049d0796cbfaa6c41a7d80e84d3a734b30acc8"
artbio
parents:
diff changeset
1 # load packages that are provided in the conda env
0e54da14f831 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit fd049d0796cbfaa6c41a7d80e84d3a734b30acc8"
artbio
parents:
diff changeset
# Make any uncaught error fatal for the calling process: R's own error
# printing is switched off, and the handler instead writes the last error
# message to stderr and quits with exit status 1 without saving the workspace.
options(
  show.error.messages = FALSE,
  error = function() {
    cat(geterrmessage(), file = stderr())
    q(save = "no", status = 1, runLast = FALSE)
  }
)

# Set an explicit time zone to work around the tidyverse issue
# "In OlsonNames() : no Olson database found".
Sys.setenv(TZ = "Pacific/Auckland")
0e54da14f831 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit fd049d0796cbfaa6c41a7d80e84d3a734b30acc8"
artbio
parents:
diff changeset
6
0e54da14f831 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit fd049d0796cbfaa6c41a7d80e84d3a734b30acc8"
artbio
parents:
diff changeset
7
0e54da14f831 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit fd049d0796cbfaa6c41a7d80e84d3a734b30acc8"
artbio
parents:
diff changeset
8 library(optparse)
0e54da14f831 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit fd049d0796cbfaa6c41a7d80e84d3a734b30acc8"
artbio
parents:
diff changeset
9 library(sequenza)
0e54da14f831 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit fd049d0796cbfaa6c41a7d80e84d3a734b30acc8"
artbio
parents:
diff changeset
10 library(BiocParallel)
0e54da14f831 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit fd049d0796cbfaa6c41a7d80e84d3a734b30acc8"
artbio
parents:
diff changeset
11 library(tidyverse)
0e54da14f831 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit fd049d0796cbfaa6c41a7d80e84d3a734b30acc8"
artbio
parents:
diff changeset
12
0e54da14f831 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit fd049d0796cbfaa6c41a7d80e84d3a734b30acc8"
artbio
parents:
diff changeset
# Command-line interface of the script. Every option defaults to NA so that
# an option omitted on the command line can be detected after parsing.
option_list <- list(
  make_option(
    c("-i", "--input"),
    default = NA,
    type = "character",
    help = "Path to Sequenza seqz processed segments file"
  ),
  make_option(
    c("-O", "--output_dir"),
    default = NA,
    type = "character",
    help = "Output directory"
  ),
  make_option(
    c("-s", "--sample_name"),
    default = NA,
    type = "character",
    help = "Sample name"
  )
)

opt <- parse_args(OptionParser(option_list = option_list),
                  args = commandArgs(trailingOnly = TRUE))

# Fail early, with an explicit message, when a required option is missing
# rather than letting an NA value reach the sequenza calls further down.
required_opts <- c("input", "output_dir", "sample_name")
is_unset <- vapply(
  required_opts,
  function(opt_name) {
    value <- opt[[opt_name]]
    is.null(value) || is.na(value)
  },
  logical(1)
)
if (any(is_unset)) {
  stop(
    "Missing required option(s): ",
    paste0("--", required_opts[is_unset], collapse = ", "),
    call. = FALSE
  )
}

data_file <- opt$input
output_dir <- opt$output_dir
sample_name <- opt$sample_name
0e54da14f831 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit fd049d0796cbfaa6c41a7d80e84d3a734b30acc8"
artbio
parents:
diff changeset
40
0e54da14f831 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit fd049d0796cbfaa6c41a7d80e84d3a734b30acc8"
artbio
parents:
diff changeset
41
0e54da14f831 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit fd049d0796cbfaa6c41a7d80e84d3a734b30acc8"
artbio
parents:
diff changeset
## Processing the seqz file: extraction step (described in the original
## comment as normalisation and segmentation).
## NOTE(review): the restriction to chromosomes 1 to 22 is disabled here (no
## chromosome.list argument is passed), so sequenza.extract() presumably falls
## back on its own default chromosome selection. To restore the restriction,
## pass chromosome.list = as.character(1:22).
message(sprintf("\nExtraction step for %s", data_file))
segfile <- sequenza.extract(data_file, verbose = TRUE)

## Estimation of cellularity and ploidy.
## The message is emitted before the fit starts so that the log reflects the
## step that is actually running.
message(sprintf("\nEstimation step for %s\n", data_file))
segfile_cp <- sequenza.fit(segfile)

## Writing files and plots using default parameters
message(sprintf("\nWriting files and plots for %s\n", data_file))
sequenza.results(
  sequenza.extract = segfile,
  cp.table = segfile_cp,
  sample.id = sample_name,
  out.dir = output_dir
)
message(sprintf("\nOutput written to %s\n", output_dir))