annotate segmentation_sequenza.R @ 10:0a19b63c521d draft default tip

planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit 116f2555558a283190cd1dd60ee25b359bcda51e
author artbio
date Fri, 20 May 2022 17:07:09 +0000
parents f3bacfd9b670
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
8
67213c4eefa6 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit 10ad3a0ca7cd23ad1e0940844147e1d1b3d069f0"
artbio
parents: 7
diff changeset
1 options(show.error.messages = F, error = function() {
67213c4eefa6 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit 10ad3a0ca7cd23ad1e0940844147e1d1b3d069f0"
artbio
parents: 7
diff changeset
2 cat(geterrmessage(), file = stderr()); q("no", 1, F) })
7
e66b91475343 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit 7df896b940e80984168b1fa6326c4d862e7e208c"
artbio
parents: 6
diff changeset
3
0
0e54da14f831 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit fd049d0796cbfaa6c41a7d80e84d3a734b30acc8"
artbio
parents:
diff changeset
4 # load packages that are provided in the conda env
0e54da14f831 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit fd049d0796cbfaa6c41a7d80e84d3a734b30acc8"
artbio
parents:
diff changeset
5 library(optparse)
0e54da14f831 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit fd049d0796cbfaa6c41a7d80e84d3a734b30acc8"
artbio
parents:
diff changeset
6 library(sequenza)
0e54da14f831 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit fd049d0796cbfaa6c41a7d80e84d3a734b30acc8"
artbio
parents:
diff changeset
7 library(BiocParallel)
0e54da14f831 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit fd049d0796cbfaa6c41a7d80e84d3a734b30acc8"
artbio
parents:
diff changeset
8 library(tidyverse)
8
67213c4eefa6 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit 10ad3a0ca7cd23ad1e0940844147e1d1b3d069f0"
artbio
parents: 7
diff changeset
9 library(readr)
67213c4eefa6 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit 10ad3a0ca7cd23ad1e0940844147e1d1b3d069f0"
artbio
parents: 7
diff changeset
10
0
0e54da14f831 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit fd049d0796cbfaa6c41a7d80e84d3a734b30acc8"
artbio
parents:
diff changeset
11 option_list <- list(
0e54da14f831 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit fd049d0796cbfaa6c41a7d80e84d3a734b30acc8"
artbio
parents:
diff changeset
12 make_option(
0e54da14f831 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit fd049d0796cbfaa6c41a7d80e84d3a734b30acc8"
artbio
parents:
diff changeset
13 c("-i", "--input"),
0e54da14f831 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit fd049d0796cbfaa6c41a7d80e84d3a734b30acc8"
artbio
parents:
diff changeset
14 default = NA,
0e54da14f831 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit fd049d0796cbfaa6c41a7d80e84d3a734b30acc8"
artbio
parents:
diff changeset
15 type = "character",
0e54da14f831 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit fd049d0796cbfaa6c41a7d80e84d3a734b30acc8"
artbio
parents:
diff changeset
16 help = "Path to Sequenza seqz processed segments file"
0e54da14f831 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit fd049d0796cbfaa6c41a7d80e84d3a734b30acc8"
artbio
parents:
diff changeset
17 ),
0e54da14f831 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit fd049d0796cbfaa6c41a7d80e84d3a734b30acc8"
artbio
parents:
diff changeset
18 make_option(
0e54da14f831 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit fd049d0796cbfaa6c41a7d80e84d3a734b30acc8"
artbio
parents:
diff changeset
19 c("-O", "--output_dir"),
0e54da14f831 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit fd049d0796cbfaa6c41a7d80e84d3a734b30acc8"
artbio
parents:
diff changeset
20 default = NA,
0e54da14f831 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit fd049d0796cbfaa6c41a7d80e84d3a734b30acc8"
artbio
parents:
diff changeset
21 type = "character",
0e54da14f831 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit fd049d0796cbfaa6c41a7d80e84d3a734b30acc8"
artbio
parents:
diff changeset
22 help = "Output directory"
0e54da14f831 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit fd049d0796cbfaa6c41a7d80e84d3a734b30acc8"
artbio
parents:
diff changeset
23 ),
0e54da14f831 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit fd049d0796cbfaa6c41a7d80e84d3a734b30acc8"
artbio
parents:
diff changeset
24 make_option(
0e54da14f831 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit fd049d0796cbfaa6c41a7d80e84d3a734b30acc8"
artbio
parents:
diff changeset
25 c("-s", "--sample_name"),
0e54da14f831 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit fd049d0796cbfaa6c41a7d80e84d3a734b30acc8"
artbio
parents:
diff changeset
26 default = NA,
0e54da14f831 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit fd049d0796cbfaa6c41a7d80e84d3a734b30acc8"
artbio
parents:
diff changeset
27 type = "character",
0e54da14f831 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit fd049d0796cbfaa6c41a7d80e84d3a734b30acc8"
artbio
parents:
diff changeset
28 help = "Sample name"
0e54da14f831 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit fd049d0796cbfaa6c41a7d80e84d3a734b30acc8"
artbio
parents:
diff changeset
29 )
0e54da14f831 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit fd049d0796cbfaa6c41a7d80e84d3a734b30acc8"
artbio
parents:
diff changeset
30 )
0e54da14f831 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit fd049d0796cbfaa6c41a7d80e84d3a734b30acc8"
artbio
parents:
diff changeset
31
0e54da14f831 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit fd049d0796cbfaa6c41a7d80e84d3a734b30acc8"
artbio
parents:
diff changeset
32 opt <- parse_args(OptionParser(option_list = option_list),
0e54da14f831 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit fd049d0796cbfaa6c41a7d80e84d3a734b30acc8"
artbio
parents:
diff changeset
33 args = commandArgs(trailingOnly = TRUE))
0e54da14f831 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit fd049d0796cbfaa6c41a7d80e84d3a734b30acc8"
artbio
parents:
diff changeset
34
0e54da14f831 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit fd049d0796cbfaa6c41a7d80e84d3a734b30acc8"
artbio
parents:
diff changeset
35 data_file <- opt$input
0e54da14f831 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit fd049d0796cbfaa6c41a7d80e84d3a734b30acc8"
artbio
parents:
diff changeset
36 output_dir <- opt$output_dir
0e54da14f831 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit fd049d0796cbfaa6c41a7d80e84d3a734b30acc8"
artbio
parents:
diff changeset
37 sample_name <- opt$sample_name
0e54da14f831 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit fd049d0796cbfaa6c41a7d80e84d3a734b30acc8"
artbio
parents:
diff changeset
38
0e54da14f831 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit fd049d0796cbfaa6c41a7d80e84d3a734b30acc8"
artbio
parents:
diff changeset
39
0e54da14f831 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit fd049d0796cbfaa6c41a7d80e84d3a734b30acc8"
artbio
parents:
diff changeset
40 ## Processing seqz files: normalisation and segmentation for chromosomes 1 to 22 and X
0e54da14f831 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit fd049d0796cbfaa6c41a7d80e84d3a734b30acc8"
artbio
parents:
diff changeset
41 message(sprintf("\nExtraction step for %s", data_file))
0e54da14f831 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit fd049d0796cbfaa6c41a7d80e84d3a734b30acc8"
artbio
parents:
diff changeset
42
9
f3bacfd9b670 planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit aa1b68e64cbbdcdd9167134ec2ea61a151333688
artbio
parents: 8
diff changeset
43 chrom_list <- c("chr1", "chr2", "chr3", "chr4", "chr5", "chr6", "chr7", "chr8", "chr9",
f3bacfd9b670 planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit aa1b68e64cbbdcdd9167134ec2ea61a151333688
artbio
parents: 8
diff changeset
44 "chr10", "chr11", "chr12", "chr13", "chr14", "chr15", "chr16", "chr17",
f3bacfd9b670 planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit aa1b68e64cbbdcdd9167134ec2ea61a151333688
artbio
parents: 8
diff changeset
45 "chr18", "chr19", "chr20", "chr21", "chr22", "chrX")
2
9265faa93098 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit fd049d0796cbfaa6c41a7d80e84d3a734b30acc8-dirty"
artbio
parents: 0
diff changeset
46
8
67213c4eefa6 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit 10ad3a0ca7cd23ad1e0940844147e1d1b3d069f0"
artbio
parents: 7
diff changeset
47 Sys.setenv(TZDIR = "/usr/share/zoneinfo/")
67213c4eefa6 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit 10ad3a0ca7cd23ad1e0940844147e1d1b3d069f0"
artbio
parents: 7
diff changeset
48 Sys.setenv(TZ = "US/Eastern")
67213c4eefa6 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit 10ad3a0ca7cd23ad1e0940844147e1d1b3d069f0"
artbio
parents: 7
diff changeset
49 options(tz = "US/Eastern")
67213c4eefa6 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit 10ad3a0ca7cd23ad1e0940844147e1d1b3d069f0"
artbio
parents: 7
diff changeset
50 Sys.timezone(location = TRUE)
67213c4eefa6 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit 10ad3a0ca7cd23ad1e0940844147e1d1b3d069f0"
artbio
parents: 7
diff changeset
51
67213c4eefa6 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit 10ad3a0ca7cd23ad1e0940844147e1d1b3d069f0"
artbio
parents: 7
diff changeset
52
0
0e54da14f831 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit fd049d0796cbfaa6c41a7d80e84d3a734b30acc8"
artbio
parents:
diff changeset
53 segfile <- sequenza.extract(data_file,
8
67213c4eefa6 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit 10ad3a0ca7cd23ad1e0940844147e1d1b3d069f0"
artbio
parents: 7
diff changeset
54 verbose = FALSE,
2
9265faa93098 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit fd049d0796cbfaa6c41a7d80e84d3a734b30acc8-dirty"
artbio
parents: 0
diff changeset
55 chromosome.list = chrom_list)
0
0e54da14f831 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit fd049d0796cbfaa6c41a7d80e84d3a734b30acc8"
artbio
parents:
diff changeset
56
0e54da14f831 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit fd049d0796cbfaa6c41a7d80e84d3a734b30acc8"
artbio
parents:
diff changeset
57 ## Estimation of cellularity and ploidy
0e54da14f831 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit fd049d0796cbfaa6c41a7d80e84d3a734b30acc8"
artbio
parents:
diff changeset
58
0e54da14f831 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit fd049d0796cbfaa6c41a7d80e84d3a734b30acc8"
artbio
parents:
diff changeset
59 segfile_cp <- sequenza.fit(segfile)
0e54da14f831 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit fd049d0796cbfaa6c41a7d80e84d3a734b30acc8"
artbio
parents:
diff changeset
60 message(sprintf("\nEstimation step for %s\n", data_file))
0e54da14f831 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit fd049d0796cbfaa6c41a7d80e84d3a734b30acc8"
artbio
parents:
diff changeset
61
0e54da14f831 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit fd049d0796cbfaa6c41a7d80e84d3a734b30acc8"
artbio
parents:
diff changeset
62 ## writing files and plots using default parameters
0e54da14f831 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit fd049d0796cbfaa6c41a7d80e84d3a734b30acc8"
artbio
parents:
diff changeset
63 message(sprintf("\nWriting files and plots for %s\n", data_file))
0e54da14f831 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit fd049d0796cbfaa6c41a7d80e84d3a734b30acc8"
artbio
parents:
diff changeset
64
0e54da14f831 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit fd049d0796cbfaa6c41a7d80e84d3a734b30acc8"
artbio
parents:
diff changeset
65 sequenza.results(sequenza.extract = segfile,
0e54da14f831 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit fd049d0796cbfaa6c41a7d80e84d3a734b30acc8"
artbio
parents:
diff changeset
66 cp.table = segfile_cp,
0e54da14f831 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit fd049d0796cbfaa6c41a7d80e84d3a734b30acc8"
artbio
parents:
diff changeset
67 sample.id = sample_name,
0e54da14f831 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit fd049d0796cbfaa6c41a7d80e84d3a734b30acc8"
artbio
parents:
diff changeset
68 out.dir = output_dir)
0e54da14f831 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/snvtocnv commit fd049d0796cbfaa6c41a7d80e84d3a734b30acc8"
artbio
parents:
diff changeset
69 message(sprintf("\nOutput written to %s\n", output_dir))