annotate lib.r @ 31:f248fd3b89d6 draft

planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 49203f8a5271fa5e6bb889e907df71ebf7757309
author lecorguille
date Thu, 08 Mar 2018 05:53:40 -0500
parents cc3a32791781
children 68282292acc4
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
29
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
1 #@authors ABiMS TEAM, Y. Guitton
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
2 # lib.r for Galaxy Workflow4Metabolomics xcms tools
4
fef3d1b8e7f4 planemo upload commit a3229faad6949bbca965d1d7e138cb3c0550780e
lecorguille
parents:
diff changeset
3
29
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
4 #@author G. Le Corguille
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
5 # solve an issue with batch if arguments are logical TRUE/FALSE
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
6 parseCommandArgs <- function(...) {
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
7 args <- batch::parseCommandArgs(...)
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
8 for (key in names(args)) {
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
9 if (args[key] %in% c("TRUE","FALSE"))
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
10 args[key] = as.logical(args[key])
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
11 }
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
12 return(args)
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
13 }
4
fef3d1b8e7f4 planemo upload commit a3229faad6949bbca965d1d7e138cb3c0550780e
lecorguille
parents:
diff changeset
14
13
206e5a968dc5 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 08e7f269a5c59687a7768be8db5fcb4e4d736093
lecorguille
parents: 12
diff changeset
15 #@author G. Le Corguille
29
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
16 # This function will
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
17 # - load the packages
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
18 # - display the sessionInfo
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
19 loadAndDisplayPackages <- function(pkgs) {
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
20 for(pkg in pkgs) suppressPackageStartupMessages( stopifnot( library(pkg, quietly=TRUE, logical.return=TRUE, character.only=TRUE)))
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
21
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
22 sessioninfo = sessionInfo()
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
23 cat(sessioninfo$R.version$version.string,"\n")
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
24 cat("Main packages:\n")
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
25 for (pkg in names(sessioninfo$otherPkgs)) { cat(paste(pkg,packageVersion(pkg)),"\t") }; cat("\n")
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
26 cat("Other loaded packages:\n")
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
27 for (pkg in names(sessioninfo$loadedOnly)) { cat(paste(pkg,packageVersion(pkg)),"\t") }; cat("\n")
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
28 }
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
29
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
30 #@author G. Le Corguille
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
31 # This function convert if it is required the Retention Time in minutes
13
206e5a968dc5 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 08e7f269a5c59687a7768be8db5fcb4e4d736093
lecorguille
parents: 12
diff changeset
32 RTSecondToMinute <- function(variableMetadata, convertRTMinute) {
206e5a968dc5 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 08e7f269a5c59687a7768be8db5fcb4e4d736093
lecorguille
parents: 12
diff changeset
33 if (convertRTMinute){
206e5a968dc5 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 08e7f269a5c59687a7768be8db5fcb4e4d736093
lecorguille
parents: 12
diff changeset
34 #converting the retention times (seconds) into minutes
206e5a968dc5 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 08e7f269a5c59687a7768be8db5fcb4e4d736093
lecorguille
parents: 12
diff changeset
35 print("converting the retention times into minutes in the variableMetadata")
29
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
36 variableMetadata[,"rt"] <- variableMetadata[,"rt"]/60
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
37 variableMetadata[,"rtmin"] <- variableMetadata[,"rtmin"]/60
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
38 variableMetadata[,"rtmax"] <- variableMetadata[,"rtmax"]/60
13
206e5a968dc5 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 08e7f269a5c59687a7768be8db5fcb4e4d736093
lecorguille
parents: 12
diff changeset
39 }
206e5a968dc5 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 08e7f269a5c59687a7768be8db5fcb4e4d736093
lecorguille
parents: 12
diff changeset
40 return (variableMetadata)
206e5a968dc5 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 08e7f269a5c59687a7768be8db5fcb4e4d736093
lecorguille
parents: 12
diff changeset
41 }
4
fef3d1b8e7f4 planemo upload commit a3229faad6949bbca965d1d7e138cb3c0550780e
lecorguille
parents:
diff changeset
42
13
206e5a968dc5 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 08e7f269a5c59687a7768be8db5fcb4e4d736093
lecorguille
parents: 12
diff changeset
43 #@author G. Le Corguille
29
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
44 # This function format ions identifiers
17
a28473761624 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 481448087f0e09c131b24f7d552db69f3552d371-dirty
lecorguille
parents: 16
diff changeset
45 formatIonIdentifiers <- function(variableMetadata, numDigitsRT=0, numDigitsMZ=0) {
29
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
46 splitDeco <- strsplit(as.character(variableMetadata$name),"_")
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
47 idsDeco <- sapply(splitDeco, function(x) { deco=unlist(x)[2]; if (is.na(deco)) return ("") else return(paste0("_",deco)) })
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
48 namecustom <- make.unique(paste0("M",round(variableMetadata[,"mz"],numDigitsMZ),"T",round(variableMetadata[,"rt"],numDigitsRT),idsDeco))
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
49 variableMetadata <- cbind(name=variableMetadata$name, namecustom=namecustom, variableMetadata[,!(colnames(variableMetadata) %in% c("name"))])
17
a28473761624 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 481448087f0e09c131b24f7d552db69f3552d371-dirty
lecorguille
parents: 16
diff changeset
50 return(variableMetadata)
13
206e5a968dc5 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 08e7f269a5c59687a7768be8db5fcb4e4d736093
lecorguille
parents: 12
diff changeset
51 }
206e5a968dc5 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 08e7f269a5c59687a7768be8db5fcb4e4d736093
lecorguille
parents: 12
diff changeset
52
206e5a968dc5 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 08e7f269a5c59687a7768be8db5fcb4e4d736093
lecorguille
parents: 12
diff changeset
53 #@author G. Le Corguille
29
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
54 # Draw the plotChromPeakDensity 3 per page in a pdf file
30
cc3a32791781 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 7b226c3ba91a3cf654ec1c14b3ef85090968bb0f
lecorguille
parents: 29
diff changeset
55 getPlotChromPeakDensity <- function(xdata, mzdigit=4) {
29
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
56 pdf(file="plotChromPeakDensity.pdf", width=16, height=12)
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
57
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
58 par(mfrow = c(3, 1), mar = c(4, 4, 1, 0.5))
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
59
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
60 group_colors <- brewer.pal(3, "Set1")[1:length(unique(xdata$sample_group))]
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
61 names(group_colors) <- unique(xdata$sample_group)
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
62
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
63 xlim <- c(min(featureDefinitions(xdata)$rtmin), max(featureDefinitions(xdata)$rtmax))
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
64 for (i in 1:nrow(featureDefinitions(xdata))) {
30
cc3a32791781 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 7b226c3ba91a3cf654ec1c14b3ef85090968bb0f
lecorguille
parents: 29
diff changeset
65 mzmin = featureDefinitions(xdata)[i,]$mzmin
cc3a32791781 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 7b226c3ba91a3cf654ec1c14b3ef85090968bb0f
lecorguille
parents: 29
diff changeset
66 mzmax = featureDefinitions(xdata)[i,]$mzmax
cc3a32791781 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 7b226c3ba91a3cf654ec1c14b3ef85090968bb0f
lecorguille
parents: 29
diff changeset
67 plotChromPeakDensity(xdata, mz=c(mzmin,mzmax), col=group_colors, pch=16, xlim=xlim, main=paste(round(mzmin,mzdigit),round(mzmax,mzdigit)))
29
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
68 legend("topright", legend=names(group_colors), col=group_colors, cex=0.8, lty=1)
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
69 }
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
70
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
71 dev.off()
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
72 }
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
73
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
74 #@author G. Le Corguille
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
75 # Draw the plotChromPeakDensity 3 per page in a pdf file
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
76 getPlotAdjustedRtime <- function(xdata) {
31
f248fd3b89d6 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 49203f8a5271fa5e6bb889e907df71ebf7757309
lecorguille
parents: 30
diff changeset
77
29
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
78 pdf(file="raw_vs_adjusted_rt.pdf", width=16, height=12)
31
f248fd3b89d6 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 49203f8a5271fa5e6bb889e907df71ebf7757309
lecorguille
parents: 30
diff changeset
79
29
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
80 # Color by group
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
81 group_colors <- brewer.pal(3, "Set1")[1:length(unique(xdata$sample_group))]
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
82 names(group_colors) <- unique(xdata$sample_group)
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
83 plotAdjustedRtime(xdata, col = group_colors[xdata$sample_group])
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
84 legend("topright", legend=names(group_colors), col=group_colors, cex=0.8, lty=1)
31
f248fd3b89d6 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 49203f8a5271fa5e6bb889e907df71ebf7757309
lecorguille
parents: 30
diff changeset
85
29
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
86 # Color by sample
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
87 plotAdjustedRtime(xdata, col = rainbow(length(xdata@phenoData@data$sample_name)))
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
88 legend("topright", legend=xdata@phenoData@data$sample_name, col=rainbow(length(xdata@phenoData@data$sample_name)), cex=0.8, lty=1)
31
f248fd3b89d6 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 49203f8a5271fa5e6bb889e907df71ebf7757309
lecorguille
parents: 30
diff changeset
89
29
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
90 dev.off()
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
91 }
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
92
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
93 #@author G. Le Corguille
13
206e5a968dc5 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 08e7f269a5c59687a7768be8db5fcb4e4d736093
lecorguille
parents: 12
diff changeset
94 # value: intensity values to be used into, maxo or intb
29
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
95 getPeaklistW4M <- function(xdata, intval="into", convertRTMinute=F, numDigitsMZ=4, numDigitsRT=0, variableMetadataOutput, dataMatrixOutput) {
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
96 dataMatrix <- featureValues(xdata, method="medret", value=intval)
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
97 colnames(dataMatrix) <- tools::file_path_sans_ext(colnames(dataMatrix))
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
98 dataMatrix = cbind(name=groupnamesW4M(xdata), dataMatrix)
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
99 variableMetadata <- featureDefinitions(xdata)
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
100 colnames(variableMetadata)[1] = "mz"; colnames(variableMetadata)[4] = "rt"
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
101 variableMetadata = data.frame(name=groupnamesW4M(xdata), variableMetadata)
14
f4dc089f9d19 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 22c4e92909198328fc7439ff47e4546a273eb907
lecorguille
parents: 13
diff changeset
102
29
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
103 variableMetadata <- RTSecondToMinute(variableMetadata, convertRTMinute)
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
104 variableMetadata <- formatIonIdentifiers(variableMetadata, numDigitsRT=numDigitsRT, numDigitsMZ=numDigitsMZ)
13
206e5a968dc5 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 08e7f269a5c59687a7768be8db5fcb4e4d736093
lecorguille
parents: 12
diff changeset
105
17
a28473761624 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 481448087f0e09c131b24f7d552db69f3552d371-dirty
lecorguille
parents: 16
diff changeset
106 write.table(variableMetadata, file=variableMetadataOutput,sep="\t",quote=F,row.names=F)
a28473761624 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 481448087f0e09c131b24f7d552db69f3552d371-dirty
lecorguille
parents: 16
diff changeset
107 write.table(dataMatrix, file=dataMatrixOutput,sep="\t",quote=F,row.names=F)
29
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
108
13
206e5a968dc5 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 08e7f269a5c59687a7768be8db5fcb4e4d736093
lecorguille
parents: 12
diff changeset
109 }
4
fef3d1b8e7f4 planemo upload commit a3229faad6949bbca965d1d7e138cb3c0550780e
lecorguille
parents:
diff changeset
110
31
f248fd3b89d6 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 49203f8a5271fa5e6bb889e907df71ebf7757309
lecorguille
parents: 30
diff changeset
111 #@author G. Le Corguille
f248fd3b89d6 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 49203f8a5271fa5e6bb889e907df71ebf7757309
lecorguille
parents: 30
diff changeset
112 getPlotChromatogram <- function(xdata, pdfname="Chromatogram.pdf", aggregationFun = "max") {
f248fd3b89d6 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 49203f8a5271fa5e6bb889e907df71ebf7757309
lecorguille
parents: 30
diff changeset
113
f248fd3b89d6 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 49203f8a5271fa5e6bb889e907df71ebf7757309
lecorguille
parents: 30
diff changeset
114 chrom <- chromatogram(xdata, aggregationFun = aggregationFun)
f248fd3b89d6 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 49203f8a5271fa5e6bb889e907df71ebf7757309
lecorguille
parents: 30
diff changeset
115 if (aggregationFun == "sum")
f248fd3b89d6 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 49203f8a5271fa5e6bb889e907df71ebf7757309
lecorguille
parents: 30
diff changeset
116 type="Total Ion Chromatograms"
f248fd3b89d6 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 49203f8a5271fa5e6bb889e907df71ebf7757309
lecorguille
parents: 30
diff changeset
117 else
f248fd3b89d6 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 49203f8a5271fa5e6bb889e907df71ebf7757309
lecorguille
parents: 30
diff changeset
118 type="Base Peak Intensity Chromatograms"
f248fd3b89d6 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 49203f8a5271fa5e6bb889e907df71ebf7757309
lecorguille
parents: 30
diff changeset
119
f248fd3b89d6 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 49203f8a5271fa5e6bb889e907df71ebf7757309
lecorguille
parents: 30
diff changeset
120 adjusted="Raw"
f248fd3b89d6 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 49203f8a5271fa5e6bb889e907df71ebf7757309
lecorguille
parents: 30
diff changeset
121 if (hasAdjustedRtime(xdata))
f248fd3b89d6 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 49203f8a5271fa5e6bb889e907df71ebf7757309
lecorguille
parents: 30
diff changeset
122 adjusted="Adjusted"
f248fd3b89d6 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 49203f8a5271fa5e6bb889e907df71ebf7757309
lecorguille
parents: 30
diff changeset
123
f248fd3b89d6 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 49203f8a5271fa5e6bb889e907df71ebf7757309
lecorguille
parents: 30
diff changeset
124 main <- paste(type,":",adjusted,"data")
f248fd3b89d6 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 49203f8a5271fa5e6bb889e907df71ebf7757309
lecorguille
parents: 30
diff changeset
125
f248fd3b89d6 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 49203f8a5271fa5e6bb889e907df71ebf7757309
lecorguille
parents: 30
diff changeset
126 pdf(pdfname, width=16, height=10)
f248fd3b89d6 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 49203f8a5271fa5e6bb889e907df71ebf7757309
lecorguille
parents: 30
diff changeset
127
f248fd3b89d6 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 49203f8a5271fa5e6bb889e907df71ebf7757309
lecorguille
parents: 30
diff changeset
128 # Color by group
f248fd3b89d6 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 49203f8a5271fa5e6bb889e907df71ebf7757309
lecorguille
parents: 30
diff changeset
129 group_colors <- brewer.pal(3, "Set1")[1:length(unique(xdata$sample_group))]
f248fd3b89d6 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 49203f8a5271fa5e6bb889e907df71ebf7757309
lecorguille
parents: 30
diff changeset
130 names(group_colors) <- unique(xdata$sample_group)
f248fd3b89d6 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 49203f8a5271fa5e6bb889e907df71ebf7757309
lecorguille
parents: 30
diff changeset
131 plot(chrom, col = group_colors[chrom$sample_group], main=main)
f248fd3b89d6 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 49203f8a5271fa5e6bb889e907df71ebf7757309
lecorguille
parents: 30
diff changeset
132 legend("topright", legend=names(group_colors), col=group_colors, cex=0.8, lty=1)
f248fd3b89d6 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 49203f8a5271fa5e6bb889e907df71ebf7757309
lecorguille
parents: 30
diff changeset
133
f248fd3b89d6 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 49203f8a5271fa5e6bb889e907df71ebf7757309
lecorguille
parents: 30
diff changeset
134 # Color by sample
f248fd3b89d6 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 49203f8a5271fa5e6bb889e907df71ebf7757309
lecorguille
parents: 30
diff changeset
135 plot(chrom, col = rainbow(length(xdata@phenoData@data$sample_name)), main=main)
f248fd3b89d6 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 49203f8a5271fa5e6bb889e907df71ebf7757309
lecorguille
parents: 30
diff changeset
136 legend("topright", legend=xdata@phenoData@data$sample_name, col=rainbow(length(xdata@phenoData@data$sample_name)), cex=0.8, lty=1)
f248fd3b89d6 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 49203f8a5271fa5e6bb889e907df71ebf7757309
lecorguille
parents: 30
diff changeset
137
f248fd3b89d6 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 49203f8a5271fa5e6bb889e907df71ebf7757309
lecorguille
parents: 30
diff changeset
138 dev.off()
4
fef3d1b8e7f4 planemo upload commit a3229faad6949bbca965d1d7e138cb3c0550780e
lecorguille
parents:
diff changeset
139 }
fef3d1b8e7f4 planemo upload commit a3229faad6949bbca965d1d7e138cb3c0550780e
lecorguille
parents:
diff changeset
140
31
f248fd3b89d6 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 49203f8a5271fa5e6bb889e907df71ebf7757309
lecorguille
parents: 30
diff changeset
141 #@author G. Le Corguille
f248fd3b89d6 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 49203f8a5271fa5e6bb889e907df71ebf7757309
lecorguille
parents: 30
diff changeset
142 getPlotTICs <- function(xdata, pdfname="TICs.pdf") {
f248fd3b89d6 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 49203f8a5271fa5e6bb889e907df71ebf7757309
lecorguille
parents: 30
diff changeset
143 getPlotChromatogram(xdata, pdfname, aggregationFun = "sum")
4
fef3d1b8e7f4 planemo upload commit a3229faad6949bbca965d1d7e138cb3c0550780e
lecorguille
parents:
diff changeset
144 }
fef3d1b8e7f4 planemo upload commit a3229faad6949bbca965d1d7e138cb3c0550780e
lecorguille
parents:
diff changeset
145
31
f248fd3b89d6 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 49203f8a5271fa5e6bb889e907df71ebf7757309
lecorguille
parents: 30
diff changeset
146 #@author G. Le Corguille
f248fd3b89d6 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 49203f8a5271fa5e6bb889e907df71ebf7757309
lecorguille
parents: 30
diff changeset
147 getPlotBPIs <- function(xdata, pdfname="BPIs.pdf") {
f248fd3b89d6 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 49203f8a5271fa5e6bb889e907df71ebf7757309
lecorguille
parents: 30
diff changeset
148 getPlotChromatogram(xdata, pdfname, aggregationFun = "max")
4
fef3d1b8e7f4 planemo upload commit a3229faad6949bbca965d1d7e138cb3c0550780e
lecorguille
parents:
diff changeset
149 }
fef3d1b8e7f4 planemo upload commit a3229faad6949bbca965d1d7e138cb3c0550780e
lecorguille
parents:
diff changeset
150
fef3d1b8e7f4 planemo upload commit a3229faad6949bbca965d1d7e138cb3c0550780e
lecorguille
parents:
diff changeset
151
29
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
152 # Get the polarities from all the samples of a condition
4
fef3d1b8e7f4 planemo upload commit a3229faad6949bbca965d1d7e138cb3c0550780e
lecorguille
parents:
diff changeset
153 #@author Misharl Monsoor misharl.monsoor@sb-roscoff.fr ABiMS TEAM
fef3d1b8e7f4 planemo upload commit a3229faad6949bbca965d1d7e138cb3c0550780e
lecorguille
parents:
diff changeset
154 #@author Gildas Le Corguille lecorguille@sb-roscoff.fr ABiMS TEAM
29
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
155 getSampleMetadata <- function(xdata=NULL, sampleMetadataOutput="sampleMetadata.tsv") {
14
f4dc089f9d19 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 22c4e92909198328fc7439ff47e4546a273eb907
lecorguille
parents: 13
diff changeset
156 cat("Creating the sampleMetadata file...\n")
13
206e5a968dc5 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 08e7f269a5c59687a7768be8db5fcb4e4d736093
lecorguille
parents: 12
diff changeset
157
14
f4dc089f9d19 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 22c4e92909198328fc7439ff47e4546a273eb907
lecorguille
parents: 13
diff changeset
158 #Create the sampleMetada dataframe
29
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
159 sampleMetadata <- xdata@phenoData@data
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
160 rownames(sampleMetadata) <- NULL
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
161 colnames(sampleMetadata) <- c("sampleMetadata", "class")
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
162
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
163 sampleNamesOrigin <- sampleMetadata$sampleMetadata
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
164 sampleNamesMakeNames <- make.names(sampleNamesOrigin)
4
fef3d1b8e7f4 planemo upload commit a3229faad6949bbca965d1d7e138cb3c0550780e
lecorguille
parents:
diff changeset
165
14
f4dc089f9d19 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 22c4e92909198328fc7439ff47e4546a273eb907
lecorguille
parents: 13
diff changeset
166 if (any(duplicated(sampleNamesMakeNames))) {
f4dc089f9d19 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 22c4e92909198328fc7439ff47e4546a273eb907
lecorguille
parents: 13
diff changeset
167 write("\n\nERROR: Usually, R has trouble to deal with special characters in its column names, so it rename them using make.names().\nIn your case, at least two columns after the renaming obtain the same name, thus XCMS will collapse those columns per name.", stderr())
f4dc089f9d19 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 22c4e92909198328fc7439ff47e4546a273eb907
lecorguille
parents: 13
diff changeset
168 for (sampleName in sampleNamesOrigin) {
f4dc089f9d19 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 22c4e92909198328fc7439ff47e4546a273eb907
lecorguille
parents: 13
diff changeset
169 write(paste(sampleName,"\t->\t",make.names(sampleName)),stderr())
f4dc089f9d19 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 22c4e92909198328fc7439ff47e4546a273eb907
lecorguille
parents: 13
diff changeset
170 }
f4dc089f9d19 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 22c4e92909198328fc7439ff47e4546a273eb907
lecorguille
parents: 13
diff changeset
171 stop("\n\nERROR: One or more of your files will not be import by xcmsSet. It may due to bad characters in their filenames.")
f4dc089f9d19 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 22c4e92909198328fc7439ff47e4546a273eb907
lecorguille
parents: 13
diff changeset
172 }
4
fef3d1b8e7f4 planemo upload commit a3229faad6949bbca965d1d7e138cb3c0550780e
lecorguille
parents:
diff changeset
173
14
f4dc089f9d19 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 22c4e92909198328fc7439ff47e4546a273eb907
lecorguille
parents: 13
diff changeset
174 if (!all(sampleNamesOrigin == sampleNamesMakeNames)) {
f4dc089f9d19 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 22c4e92909198328fc7439ff47e4546a273eb907
lecorguille
parents: 13
diff changeset
175 cat("\n\nWARNING: Usually, R has trouble to deal with special characters in its column names, so it rename them using make.names()\nIn your case, one or more sample names will be renamed in the sampleMetadata and dataMatrix files:\n")
f4dc089f9d19 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 22c4e92909198328fc7439ff47e4546a273eb907
lecorguille
parents: 13
diff changeset
176 for (sampleName in sampleNamesOrigin) {
f4dc089f9d19 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 22c4e92909198328fc7439ff47e4546a273eb907
lecorguille
parents: 13
diff changeset
177 cat(paste(sampleName,"\t->\t",make.names(sampleName),"\n"))
f4dc089f9d19 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 22c4e92909198328fc7439ff47e4546a273eb907
lecorguille
parents: 13
diff changeset
178 }
4
fef3d1b8e7f4 planemo upload commit a3229faad6949bbca965d1d7e138cb3c0550780e
lecorguille
parents:
diff changeset
179 }
fef3d1b8e7f4 planemo upload commit a3229faad6949bbca965d1d7e138cb3c0550780e
lecorguille
parents:
diff changeset
180
29
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
181 sampleMetadata$sampleMetadata <- sampleNamesMakeNames
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
182
14
f4dc089f9d19 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 22c4e92909198328fc7439ff47e4546a273eb907
lecorguille
parents: 13
diff changeset
183
f4dc089f9d19 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 22c4e92909198328fc7439ff47e4546a273eb907
lecorguille
parents: 13
diff changeset
184 #For each sample file, the following actions are done
29
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
185 for (fileIdx in 1:length(fileNames(xdata))) {
14
f4dc089f9d19 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 22c4e92909198328fc7439ff47e4546a273eb907
lecorguille
parents: 13
diff changeset
186 #Check if the file is in the CDF format
29
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
187 if (!mzR:::netCDFIsFile(fileNames(xdata))) {
14
f4dc089f9d19 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 22c4e92909198328fc7439ff47e4546a273eb907
lecorguille
parents: 13
diff changeset
188
f4dc089f9d19 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 22c4e92909198328fc7439ff47e4546a273eb907
lecorguille
parents: 13
diff changeset
189 # If the column isn't exist, with add one filled with NA
29
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
190 if (is.null(sampleMetadata$polarity)) sampleMetadata$polarity <- NA
4
fef3d1b8e7f4 planemo upload commit a3229faad6949bbca965d1d7e138cb3c0550780e
lecorguille
parents:
diff changeset
191
14
f4dc089f9d19 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 22c4e92909198328fc7439ff47e4546a273eb907
lecorguille
parents: 13
diff changeset
192 #Extract the polarity (a list of polarities)
29
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
193 polarity <- fData(xdata)[fData(xdata)$fileIdx == fileIdx,"polarity"]
14
f4dc089f9d19 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 22c4e92909198328fc7439ff47e4546a273eb907
lecorguille
parents: 13
diff changeset
194 #Verify if all the scans have the same polarity
29
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
195 uniq_list <- unique(polarity)
14
f4dc089f9d19 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 22c4e92909198328fc7439ff47e4546a273eb907
lecorguille
parents: 13
diff changeset
196 if (length(uniq_list)>1){
29
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
197 polarity <- "mixed"
14
f4dc089f9d19 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 22c4e92909198328fc7439ff47e4546a273eb907
lecorguille
parents: 13
diff changeset
198 } else {
29
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
199 polarity <- as.character(uniq_list)
14
f4dc089f9d19 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 22c4e92909198328fc7439ff47e4546a273eb907
lecorguille
parents: 13
diff changeset
200 }
4
fef3d1b8e7f4 planemo upload commit a3229faad6949bbca965d1d7e138cb3c0550780e
lecorguille
parents:
diff changeset
201
14
f4dc089f9d19 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 22c4e92909198328fc7439ff47e4546a273eb907
lecorguille
parents: 13
diff changeset
202 #Set the polarity attribute
29
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
203 sampleMetadata$polarity[fileIdx] <- polarity
14
f4dc089f9d19 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 22c4e92909198328fc7439ff47e4546a273eb907
lecorguille
parents: 13
diff changeset
204 }
f4dc089f9d19 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 22c4e92909198328fc7439ff47e4546a273eb907
lecorguille
parents: 13
diff changeset
205
f4dc089f9d19 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 22c4e92909198328fc7439ff47e4546a273eb907
lecorguille
parents: 13
diff changeset
206 }
f4dc089f9d19 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 22c4e92909198328fc7439ff47e4546a273eb907
lecorguille
parents: 13
diff changeset
207
f4dc089f9d19 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 22c4e92909198328fc7439ff47e4546a273eb907
lecorguille
parents: 13
diff changeset
208 write.table(sampleMetadata, sep="\t", quote=FALSE, row.names=FALSE, file=sampleMetadataOutput)
f4dc089f9d19 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 22c4e92909198328fc7439ff47e4546a273eb907
lecorguille
parents: 13
diff changeset
209
29
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
210 return(list("sampleNamesOrigin"=sampleNamesOrigin, "sampleNamesMakeNames"=sampleNamesMakeNames))
4
fef3d1b8e7f4 planemo upload commit a3229faad6949bbca965d1d7e138cb3c0550780e
lecorguille
parents:
diff changeset
211
fef3d1b8e7f4 planemo upload commit a3229faad6949bbca965d1d7e138cb3c0550780e
lecorguille
parents:
diff changeset
212 }
fef3d1b8e7f4 planemo upload commit a3229faad6949bbca965d1d7e138cb3c0550780e
lecorguille
parents:
diff changeset
213
fef3d1b8e7f4 planemo upload commit a3229faad6949bbca965d1d7e138cb3c0550780e
lecorguille
parents:
diff changeset
214
29
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
215 # This function check if xcms will found all the files
4
fef3d1b8e7f4 planemo upload commit a3229faad6949bbca965d1d7e138cb3c0550780e
lecorguille
parents:
diff changeset
216 #@author Gildas Le Corguille lecorguille@sb-roscoff.fr ABiMS TEAM
fef3d1b8e7f4 planemo upload commit a3229faad6949bbca965d1d7e138cb3c0550780e
lecorguille
parents:
diff changeset
217 checkFilesCompatibilityWithXcms <- function(directory) {
14
f4dc089f9d19 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 22c4e92909198328fc7439ff47e4546a273eb907
lecorguille
parents: 13
diff changeset
218 cat("Checking files filenames compatibilities with xmcs...\n")
f4dc089f9d19 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 22c4e92909198328fc7439ff47e4546a273eb907
lecorguille
parents: 13
diff changeset
219 # WHAT XCMS WILL FIND
f4dc089f9d19 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 22c4e92909198328fc7439ff47e4546a273eb907
lecorguille
parents: 13
diff changeset
220 filepattern <- c("[Cc][Dd][Ff]", "[Nn][Cc]", "([Mm][Zz])?[Xx][Mm][Ll]","[Mm][Zz][Dd][Aa][Tt][Aa]", "[Mm][Zz][Mm][Ll]")
29
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
221 filepattern <- paste(paste("\\.", filepattern, "$", sep=""),collapse="|")
14
f4dc089f9d19 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 22c4e92909198328fc7439ff47e4546a273eb907
lecorguille
parents: 13
diff changeset
222 info <- file.info(directory)
29
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
223 listed <- list.files(directory[info$isdir], pattern=filepattern, recursive=TRUE, full.names=TRUE)
14
f4dc089f9d19 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 22c4e92909198328fc7439ff47e4546a273eb907
lecorguille
parents: 13
diff changeset
224 files <- c(directory[!info$isdir], listed)
f4dc089f9d19 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 22c4e92909198328fc7439ff47e4546a273eb907
lecorguille
parents: 13
diff changeset
225 files_abs <- file.path(getwd(), files)
f4dc089f9d19 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 22c4e92909198328fc7439ff47e4546a273eb907
lecorguille
parents: 13
diff changeset
226 exists <- file.exists(files_abs)
f4dc089f9d19 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 22c4e92909198328fc7439ff47e4546a273eb907
lecorguille
parents: 13
diff changeset
227 files[exists] <- files_abs[exists]
f4dc089f9d19 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 22c4e92909198328fc7439ff47e4546a273eb907
lecorguille
parents: 13
diff changeset
228 files[exists] <- sub("//","/",files[exists])
4
fef3d1b8e7f4 planemo upload commit a3229faad6949bbca965d1d7e138cb3c0550780e
lecorguille
parents:
diff changeset
229
14
f4dc089f9d19 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 22c4e92909198328fc7439ff47e4546a273eb907
lecorguille
parents: 13
diff changeset
230 # WHAT IS ON THE FILESYSTEM
30
cc3a32791781 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 7b226c3ba91a3cf654ec1c14b3ef85090968bb0f
lecorguille
parents: 29
diff changeset
231 filesystem_filepaths <- system(paste0("find \"$PWD/",directory,"\" -not -name '\\.*' -not -path '*conda-env*' -type f -name \"*\""), intern=T)
29
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
232 filesystem_filepaths <- filesystem_filepaths[grep(filepattern, filesystem_filepaths, perl=T)]
4
fef3d1b8e7f4 planemo upload commit a3229faad6949bbca965d1d7e138cb3c0550780e
lecorguille
parents:
diff changeset
233
14
f4dc089f9d19 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 22c4e92909198328fc7439ff47e4546a273eb907
lecorguille
parents: 13
diff changeset
234 # COMPARISON
f4dc089f9d19 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 22c4e92909198328fc7439ff47e4546a273eb907
lecorguille
parents: 13
diff changeset
235 if (!is.na(table(filesystem_filepaths %in% files)["FALSE"])) {
f4dc089f9d19 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 22c4e92909198328fc7439ff47e4546a273eb907
lecorguille
parents: 13
diff changeset
236 write("\n\nERROR: List of the files which will not be imported by xcmsSet",stderr())
f4dc089f9d19 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 22c4e92909198328fc7439ff47e4546a273eb907
lecorguille
parents: 13
diff changeset
237 write(filesystem_filepaths[!(filesystem_filepaths %in% files)],stderr())
f4dc089f9d19 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 22c4e92909198328fc7439ff47e4546a273eb907
lecorguille
parents: 13
diff changeset
238 stop("\n\nERROR: One or more of your files will not be import by xcmsSet. It may due to bad characters in their filenames.")
f4dc089f9d19 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 22c4e92909198328fc7439ff47e4546a273eb907
lecorguille
parents: 13
diff changeset
239 }
4
fef3d1b8e7f4 planemo upload commit a3229faad6949bbca965d1d7e138cb3c0550780e
lecorguille
parents:
diff changeset
240 }
fef3d1b8e7f4 planemo upload commit a3229faad6949bbca965d1d7e138cb3c0550780e
lecorguille
parents:
diff changeset
241
fef3d1b8e7f4 planemo upload commit a3229faad6949bbca965d1d7e138cb3c0550780e
lecorguille
parents:
diff changeset
242
29
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
243 #This function list the compatible files within the directory as xcms did
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
244 #@author Gildas Le Corguille lecorguille@sb-roscoff.fr ABiMS TEAM
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
245 getMSFiles <- function (directory) {
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
246 filepattern <- c("[Cc][Dd][Ff]", "[Nn][Cc]", "([Mm][Zz])?[Xx][Mm][Ll]","[Mm][Zz][Dd][Aa][Tt][Aa]", "[Mm][Zz][Mm][Ll]")
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
247 filepattern <- paste(paste("\\.", filepattern, "$", sep=""),collapse="|")
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
248 info <- file.info(directory)
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
249 listed <- list.files(directory[info$isdir], pattern=filepattern,recursive=TRUE, full.names=TRUE)
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
250 files <- c(directory[!info$isdir], listed)
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
251 exists <- file.exists(files)
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
252 files <- files[exists]
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
253 return(files)
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
254 }
4
fef3d1b8e7f4 planemo upload commit a3229faad6949bbca965d1d7e138cb3c0550780e
lecorguille
parents:
diff changeset
255
29
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
256 # This function check if XML contains special caracters. It also checks integrity and completness.
4
fef3d1b8e7f4 planemo upload commit a3229faad6949bbca965d1d7e138cb3c0550780e
lecorguille
parents:
diff changeset
257 #@author Misharl Monsoor misharl.monsoor@sb-roscoff.fr ABiMS TEAM
fef3d1b8e7f4 planemo upload commit a3229faad6949bbca965d1d7e138cb3c0550780e
lecorguille
parents:
diff changeset
258 checkXmlStructure <- function (directory) {
14
f4dc089f9d19 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 22c4e92909198328fc7439ff47e4546a273eb907
lecorguille
parents: 13
diff changeset
259 cat("Checking XML structure...\n")
4
fef3d1b8e7f4 planemo upload commit a3229faad6949bbca965d1d7e138cb3c0550780e
lecorguille
parents:
diff changeset
260
30
cc3a32791781 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 7b226c3ba91a3cf654ec1c14b3ef85090968bb0f
lecorguille
parents: 29
diff changeset
261 cmd <- paste0("IFS=$'\n'; for xml in $(find '",directory,"' -not -name '\\.*' -not -path '*conda-env*' -type f -iname '*.*ml*'); do if [ $(xmllint --nonet --noout \"$xml\" 2> /dev/null; echo $?) -gt 0 ]; then echo $xml;fi; done;")
29
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
262 capture <- system(cmd, intern=TRUE)
4
fef3d1b8e7f4 planemo upload commit a3229faad6949bbca965d1d7e138cb3c0550780e
lecorguille
parents:
diff changeset
263
14
f4dc089f9d19 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 22c4e92909198328fc7439ff47e4546a273eb907
lecorguille
parents: 13
diff changeset
264 if (length(capture)>0){
f4dc089f9d19 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 22c4e92909198328fc7439ff47e4546a273eb907
lecorguille
parents: 13
diff changeset
265 #message=paste("The following mzXML or mzML file is incorrect, please check these files first:",capture)
f4dc089f9d19 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 22c4e92909198328fc7439ff47e4546a273eb907
lecorguille
parents: 13
diff changeset
266 write("\n\nERROR: The following mzXML or mzML file(s) are incorrect, please check these files first:", stderr())
f4dc089f9d19 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 22c4e92909198328fc7439ff47e4546a273eb907
lecorguille
parents: 13
diff changeset
267 write(capture, stderr())
f4dc089f9d19 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 22c4e92909198328fc7439ff47e4546a273eb907
lecorguille
parents: 13
diff changeset
268 stop("ERROR: xcmsSet cannot continue with incorrect mzXML or mzML files")
f4dc089f9d19 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 22c4e92909198328fc7439ff47e4546a273eb907
lecorguille
parents: 13
diff changeset
269 }
13
206e5a968dc5 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 08e7f269a5c59687a7768be8db5fcb4e4d736093
lecorguille
parents: 12
diff changeset
270
4
fef3d1b8e7f4 planemo upload commit a3229faad6949bbca965d1d7e138cb3c0550780e
lecorguille
parents:
diff changeset
271 }
fef3d1b8e7f4 planemo upload commit a3229faad6949bbca965d1d7e138cb3c0550780e
lecorguille
parents:
diff changeset
272
fef3d1b8e7f4 planemo upload commit a3229faad6949bbca965d1d7e138cb3c0550780e
lecorguille
parents:
diff changeset
273
29
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
274 # This function check if XML contain special characters
4
fef3d1b8e7f4 planemo upload commit a3229faad6949bbca965d1d7e138cb3c0550780e
lecorguille
parents:
diff changeset
275 #@author Misharl Monsoor misharl.monsoor@sb-roscoff.fr ABiMS TEAM
fef3d1b8e7f4 planemo upload commit a3229faad6949bbca965d1d7e138cb3c0550780e
lecorguille
parents:
diff changeset
276 deleteXmlBadCharacters<- function (directory) {
14
f4dc089f9d19 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 22c4e92909198328fc7439ff47e4546a273eb907
lecorguille
parents: 13
diff changeset
277 cat("Checking Non ASCII characters in the XML...\n")
4
fef3d1b8e7f4 planemo upload commit a3229faad6949bbca965d1d7e138cb3c0550780e
lecorguille
parents:
diff changeset
278
29
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
279 processed <- F
30
cc3a32791781 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 7b226c3ba91a3cf654ec1c14b3ef85090968bb0f
lecorguille
parents: 29
diff changeset
280 l <- system( paste0("find '",directory, "' -not -name '\\.*' -not -path '*conda-env*' -type f -iname '*.*ml*'"), intern=TRUE)
14
f4dc089f9d19 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 22c4e92909198328fc7439ff47e4546a273eb907
lecorguille
parents: 13
diff changeset
281 for (i in l){
29
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
282 cmd <- paste("LC_ALL=C grep '[^ -~]' \"", i, "\"", sep="")
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
283 capture <- suppressWarnings(system(cmd, intern=TRUE))
14
f4dc089f9d19 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 22c4e92909198328fc7439ff47e4546a273eb907
lecorguille
parents: 13
diff changeset
284 if (length(capture)>0){
29
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
285 cmd <- paste("perl -i -pe 's/[^[:ascii:]]//g;'",i)
14
f4dc089f9d19 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 22c4e92909198328fc7439ff47e4546a273eb907
lecorguille
parents: 13
diff changeset
286 print( paste("WARNING: Non ASCII characters have been removed from the ",i,"file") )
29
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
287 c <- system(cmd, intern=TRUE)
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
288 capture <- ""
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
289 processed <- T
14
f4dc089f9d19 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 22c4e92909198328fc7439ff47e4546a273eb907
lecorguille
parents: 13
diff changeset
290 }
4
fef3d1b8e7f4 planemo upload commit a3229faad6949bbca965d1d7e138cb3c0550780e
lecorguille
parents:
diff changeset
291 }
14
f4dc089f9d19 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 22c4e92909198328fc7439ff47e4546a273eb907
lecorguille
parents: 13
diff changeset
292 if (processed) cat("\n\n")
f4dc089f9d19 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 22c4e92909198328fc7439ff47e4546a273eb907
lecorguille
parents: 13
diff changeset
293 return(processed)
4
fef3d1b8e7f4 planemo upload commit a3229faad6949bbca965d1d7e138cb3c0550780e
lecorguille
parents:
diff changeset
294 }
fef3d1b8e7f4 planemo upload commit a3229faad6949bbca965d1d7e138cb3c0550780e
lecorguille
parents:
diff changeset
295
fef3d1b8e7f4 planemo upload commit a3229faad6949bbca965d1d7e138cb3c0550780e
lecorguille
parents:
diff changeset
296
29
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
297 # This function will compute MD5 checksum to check the data integrity
4
fef3d1b8e7f4 planemo upload commit a3229faad6949bbca965d1d7e138cb3c0550780e
lecorguille
parents:
diff changeset
298 #@author Gildas Le Corguille lecorguille@sb-roscoff.fr
fef3d1b8e7f4 planemo upload commit a3229faad6949bbca965d1d7e138cb3c0550780e
lecorguille
parents:
diff changeset
299 getMd5sum <- function (directory) {
14
f4dc089f9d19 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 22c4e92909198328fc7439ff47e4546a273eb907
lecorguille
parents: 13
diff changeset
300 cat("Compute md5 checksum...\n")
f4dc089f9d19 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 22c4e92909198328fc7439ff47e4546a273eb907
lecorguille
parents: 13
diff changeset
301 # WHAT XCMS WILL FIND
f4dc089f9d19 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 22c4e92909198328fc7439ff47e4546a273eb907
lecorguille
parents: 13
diff changeset
302 filepattern <- c("[Cc][Dd][Ff]", "[Nn][Cc]", "([Mm][Zz])?[Xx][Mm][Ll]","[Mm][Zz][Dd][Aa][Tt][Aa]", "[Mm][Zz][Mm][Ll]")
29
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
303 filepattern <- paste(paste("\\.", filepattern, "$", sep=""),collapse="|")
14
f4dc089f9d19 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 22c4e92909198328fc7439ff47e4546a273eb907
lecorguille
parents: 13
diff changeset
304 info <- file.info(directory)
29
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
305 listed <- list.files(directory[info$isdir], pattern=filepattern, recursive=TRUE, full.names=TRUE)
14
f4dc089f9d19 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 22c4e92909198328fc7439ff47e4546a273eb907
lecorguille
parents: 13
diff changeset
306 files <- c(directory[!info$isdir], listed)
f4dc089f9d19 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 22c4e92909198328fc7439ff47e4546a273eb907
lecorguille
parents: 13
diff changeset
307 exists <- file.exists(files)
f4dc089f9d19 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 22c4e92909198328fc7439ff47e4546a273eb907
lecorguille
parents: 13
diff changeset
308 files <- files[exists]
4
fef3d1b8e7f4 planemo upload commit a3229faad6949bbca965d1d7e138cb3c0550780e
lecorguille
parents:
diff changeset
309
14
f4dc089f9d19 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 22c4e92909198328fc7439ff47e4546a273eb907
lecorguille
parents: 13
diff changeset
310 library(tools)
4
fef3d1b8e7f4 planemo upload commit a3229faad6949bbca965d1d7e138cb3c0550780e
lecorguille
parents:
diff changeset
311
14
f4dc089f9d19 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 22c4e92909198328fc7439ff47e4546a273eb907
lecorguille
parents: 13
diff changeset
312 #cat("\n\n")
4
fef3d1b8e7f4 planemo upload commit a3229faad6949bbca965d1d7e138cb3c0550780e
lecorguille
parents:
diff changeset
313
14
f4dc089f9d19 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 22c4e92909198328fc7439ff47e4546a273eb907
lecorguille
parents: 13
diff changeset
314 return(as.matrix(md5sum(files)))
4
fef3d1b8e7f4 planemo upload commit a3229faad6949bbca965d1d7e138cb3c0550780e
lecorguille
parents:
diff changeset
315 }
20
a79d839d625f planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 87dc789d7cd70a3733a1ad0b5a427f4d5905795d
lecorguille
parents: 17
diff changeset
316
a79d839d625f planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 87dc789d7cd70a3733a1ad0b5a427f4d5905795d
lecorguille
parents: 17
diff changeset
317
a79d839d625f planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 87dc789d7cd70a3733a1ad0b5a427f4d5905795d
lecorguille
parents: 17
diff changeset
318 # This function get the raw file path from the arguments
29
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
319 #@author Gildas Le Corguille lecorguille@sb-roscoff.fr
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
320 getRawfilePathFromArguments <- function(singlefile, zipfile, args) {
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
321 if (!is.null(args$zipfile)) zipfile <- args$zipfile
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
322 if (!is.null(args$zipfilePositive)) zipfile <- args$zipfilePositive
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
323 if (!is.null(args$zipfileNegative)) zipfile <- args$zipfileNegative
20
a79d839d625f planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 87dc789d7cd70a3733a1ad0b5a427f4d5905795d
lecorguille
parents: 17
diff changeset
324
29
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
325 if (!is.null(args$singlefile_galaxyPath)) {
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
326 singlefile_galaxyPaths <- args$singlefile_galaxyPath;
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
327 singlefile_sampleNames <- args$singlefile_sampleName
20
a79d839d625f planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 87dc789d7cd70a3733a1ad0b5a427f4d5905795d
lecorguille
parents: 17
diff changeset
328 }
29
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
329 if (!is.null(args$singlefile_galaxyPathPositive)) {
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
330 singlefile_galaxyPaths <- args$singlefile_galaxyPathPositive;
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
331 singlefile_sampleNames <- args$singlefile_sampleNamePositive
20
a79d839d625f planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 87dc789d7cd70a3733a1ad0b5a427f4d5905795d
lecorguille
parents: 17
diff changeset
332 }
29
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
333 if (!is.null(args$singlefile_galaxyPathNegative)) {
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
334 singlefile_galaxyPaths <- args$singlefile_galaxyPathNegative;
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
335 singlefile_sampleNames <- args$singlefile_sampleNameNegative
20
a79d839d625f planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 87dc789d7cd70a3733a1ad0b5a427f4d5905795d
lecorguille
parents: 17
diff changeset
336 }
a79d839d625f planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 87dc789d7cd70a3733a1ad0b5a427f4d5905795d
lecorguille
parents: 17
diff changeset
337 if (exists("singlefile_galaxyPaths")){
30
cc3a32791781 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 7b226c3ba91a3cf654ec1c14b3ef85090968bb0f
lecorguille
parents: 29
diff changeset
338 singlefile_galaxyPaths <- unlist(strsplit(singlefile_galaxyPaths,"\\|"))
cc3a32791781 planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 7b226c3ba91a3cf654ec1c14b3ef85090968bb0f
lecorguille
parents: 29
diff changeset
339 singlefile_sampleNames <- unlist(strsplit(singlefile_sampleNames,"\\|"))
20
a79d839d625f planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 87dc789d7cd70a3733a1ad0b5a427f4d5905795d
lecorguille
parents: 17
diff changeset
340
29
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
341 singlefile <- NULL
20
a79d839d625f planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 87dc789d7cd70a3733a1ad0b5a427f4d5905795d
lecorguille
parents: 17
diff changeset
342 for (singlefile_galaxyPath_i in seq(1:length(singlefile_galaxyPaths))) {
29
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
343 singlefile_galaxyPath <- singlefile_galaxyPaths[singlefile_galaxyPath_i]
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
344 singlefile_sampleName <- singlefile_sampleNames[singlefile_galaxyPath_i]
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
345 singlefile[[singlefile_sampleName]] <- singlefile_galaxyPath
20
a79d839d625f planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 87dc789d7cd70a3733a1ad0b5a427f4d5905795d
lecorguille
parents: 17
diff changeset
346 }
a79d839d625f planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 87dc789d7cd70a3733a1ad0b5a427f4d5905795d
lecorguille
parents: 17
diff changeset
347 }
a79d839d625f planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 87dc789d7cd70a3733a1ad0b5a427f4d5905795d
lecorguille
parents: 17
diff changeset
348 for (argument in c("zipfile","zipfilePositive","zipfileNegative","singlefile_galaxyPath","singlefile_sampleName","singlefile_galaxyPathPositive","singlefile_sampleNamePositive","singlefile_galaxyPathNegative","singlefile_sampleNameNegative")) {
29
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
349 args[[argument]] <- NULL
20
a79d839d625f planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 87dc789d7cd70a3733a1ad0b5a427f4d5905795d
lecorguille
parents: 17
diff changeset
350 }
29
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
351 return(list(zipfile=zipfile, singlefile=singlefile, args=args))
20
a79d839d625f planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 87dc789d7cd70a3733a1ad0b5a427f4d5905795d
lecorguille
parents: 17
diff changeset
352 }
a79d839d625f planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 87dc789d7cd70a3733a1ad0b5a427f4d5905795d
lecorguille
parents: 17
diff changeset
353
a79d839d625f planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 87dc789d7cd70a3733a1ad0b5a427f4d5905795d
lecorguille
parents: 17
diff changeset
354
a79d839d625f planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 87dc789d7cd70a3733a1ad0b5a427f4d5905795d
lecorguille
parents: 17
diff changeset
355 # This function retrieve the raw file in the working directory
a79d839d625f planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 87dc789d7cd70a3733a1ad0b5a427f4d5905795d
lecorguille
parents: 17
diff changeset
356 # - if zipfile: unzip the file with its directory tree
a79d839d625f planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 87dc789d7cd70a3733a1ad0b5a427f4d5905795d
lecorguille
parents: 17
diff changeset
357 # - if singlefiles: set symlink with the good filename
29
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
358 #@author Gildas Le Corguille lecorguille@sb-roscoff.fr
20
a79d839d625f planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 87dc789d7cd70a3733a1ad0b5a427f4d5905795d
lecorguille
parents: 17
diff changeset
359 retrieveRawfileInTheWorkingDirectory <- function(singlefile, zipfile) {
a79d839d625f planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 87dc789d7cd70a3733a1ad0b5a427f4d5905795d
lecorguille
parents: 17
diff changeset
360 if(!is.null(singlefile) && (length("singlefile")>0)) {
a79d839d625f planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 87dc789d7cd70a3733a1ad0b5a427f4d5905795d
lecorguille
parents: 17
diff changeset
361 for (singlefile_sampleName in names(singlefile)) {
29
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
362 singlefile_galaxyPath <- singlefile[[singlefile_sampleName]]
20
a79d839d625f planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 87dc789d7cd70a3733a1ad0b5a427f4d5905795d
lecorguille
parents: 17
diff changeset
363 if(!file.exists(singlefile_galaxyPath)){
29
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
364 error_message <- paste("Cannot access the sample:",singlefile_sampleName,"located:",singlefile_galaxyPath,". Please, contact your administrator ... if you have one!")
20
a79d839d625f planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 87dc789d7cd70a3733a1ad0b5a427f4d5905795d
lecorguille
parents: 17
diff changeset
365 print(error_message); stop(error_message)
a79d839d625f planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 87dc789d7cd70a3733a1ad0b5a427f4d5905795d
lecorguille
parents: 17
diff changeset
366 }
a79d839d625f planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 87dc789d7cd70a3733a1ad0b5a427f4d5905795d
lecorguille
parents: 17
diff changeset
367
29
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
368 if (!suppressWarnings( try (file.link(singlefile_galaxyPath, singlefile_sampleName), silent=T)))
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
369 file.copy(singlefile_galaxyPath, singlefile_sampleName)
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
370
20
a79d839d625f planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 87dc789d7cd70a3733a1ad0b5a427f4d5905795d
lecorguille
parents: 17
diff changeset
371 }
29
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
372 directory <- "."
20
a79d839d625f planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 87dc789d7cd70a3733a1ad0b5a427f4d5905795d
lecorguille
parents: 17
diff changeset
373
a79d839d625f planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 87dc789d7cd70a3733a1ad0b5a427f4d5905795d
lecorguille
parents: 17
diff changeset
374 }
29
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
375 if(!is.null(zipfile) && (zipfile != "")) {
20
a79d839d625f planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 87dc789d7cd70a3733a1ad0b5a427f4d5905795d
lecorguille
parents: 17
diff changeset
376 if(!file.exists(zipfile)){
29
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
377 error_message <- paste("Cannot access the Zip file:",zipfile,". Please, contact your administrator ... if you have one!")
20
a79d839d625f planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 87dc789d7cd70a3733a1ad0b5a427f4d5905795d
lecorguille
parents: 17
diff changeset
378 print(error_message)
a79d839d625f planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 87dc789d7cd70a3733a1ad0b5a427f4d5905795d
lecorguille
parents: 17
diff changeset
379 stop(error_message)
a79d839d625f planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 87dc789d7cd70a3733a1ad0b5a427f4d5905795d
lecorguille
parents: 17
diff changeset
380 }
a79d839d625f planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 87dc789d7cd70a3733a1ad0b5a427f4d5905795d
lecorguille
parents: 17
diff changeset
381
a79d839d625f planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 87dc789d7cd70a3733a1ad0b5a427f4d5905795d
lecorguille
parents: 17
diff changeset
382 #list all file in the zip file
29
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
383 #zip_files <- unzip(zipfile,list=T)[,"Name"]
20
a79d839d625f planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 87dc789d7cd70a3733a1ad0b5a427f4d5905795d
lecorguille
parents: 17
diff changeset
384
a79d839d625f planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 87dc789d7cd70a3733a1ad0b5a427f4d5905795d
lecorguille
parents: 17
diff changeset
385 #unzip
a79d839d625f planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 87dc789d7cd70a3733a1ad0b5a427f4d5905795d
lecorguille
parents: 17
diff changeset
386 suppressWarnings(unzip(zipfile, unzip="unzip"))
a79d839d625f planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 87dc789d7cd70a3733a1ad0b5a427f4d5905795d
lecorguille
parents: 17
diff changeset
387
a79d839d625f planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 87dc789d7cd70a3733a1ad0b5a427f4d5905795d
lecorguille
parents: 17
diff changeset
388 #get the directory name
29
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
389 suppressWarnings(filesInZip <- unzip(zipfile, list=T))
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
390 directories <- unique(unlist(lapply(strsplit(filesInZip$Name,"/"), function(x) x[1])))
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
391 directories <- directories[!(directories %in% c("__MACOSX")) & file.info(directories)$isdir]
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
392 directory <- "."
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
393 if (length(directories) == 1) directory <- directories
20
a79d839d625f planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 87dc789d7cd70a3733a1ad0b5a427f4d5905795d
lecorguille
parents: 17
diff changeset
394
a79d839d625f planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 87dc789d7cd70a3733a1ad0b5a427f4d5905795d
lecorguille
parents: 17
diff changeset
395 cat("files_root_directory\t",directory,"\n")
a79d839d625f planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 87dc789d7cd70a3733a1ad0b5a427f4d5905795d
lecorguille
parents: 17
diff changeset
396
a79d839d625f planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 87dc789d7cd70a3733a1ad0b5a427f4d5905795d
lecorguille
parents: 17
diff changeset
397 }
a79d839d625f planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 87dc789d7cd70a3733a1ad0b5a427f4d5905795d
lecorguille
parents: 17
diff changeset
398 return (directory)
a79d839d625f planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 87dc789d7cd70a3733a1ad0b5a427f4d5905795d
lecorguille
parents: 17
diff changeset
399 }
29
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
400
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
401
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
402 # This function retrieve a xset like object
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
403 #@author Gildas Le Corguille lecorguille@sb-roscoff.fr
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
404 getxcmsSetObject <- function(xobject) {
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
405 # XCMS 1.x
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
406 if (class(xobject) == "xcmsSet")
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
407 return (xobject)
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
408 # XCMS 3.x
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
409 if (class(xobject) == "XCMSnExp") {
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
410 # Get the legacy xcmsSet object
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
411 suppressWarnings(xset <- as(xobject, 'xcmsSet'))
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
412 sampclass(xset) <- xset@phenoData$sample_group
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
413 return (xset)
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
414 }
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
415 }
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
416
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
417
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
418 #@TODO: remove this function as soon as we can use xcms 3.x.x from Bioconductor 3.7
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
419 # https://github.com/sneumann/xcms/issues/250
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
420 groupnamesW4M <- function(xdata, mzdec = 0, rtdec = 0) {
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
421 mzfmt <- paste("%.", mzdec, "f", sep = "")
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
422 rtfmt <- paste("%.", rtdec, "f", sep = "")
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
423
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
424 gnames <- paste("M", sprintf(mzfmt, featureDefinitions(xdata)[,"mzmed"]), "T",
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
425 sprintf(rtfmt, featureDefinitions(xdata)[,"rtmed"]), sep = "")
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
426
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
427 if (any(dup <- duplicated(gnames)))
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
428 for (dupname in unique(gnames[dup])) {
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
429 dupidx <- which(gnames == dupname)
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
430 gnames[dupidx] <- paste(gnames[dupidx], seq(along = dupidx), sep = "_")
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
431 }
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
432
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
433 return (gnames)
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
434 }
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
435
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
436 #@TODO: remove this function as soon as we can use xcms 3.x.x from Bioconductor 3.7
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
437 # https://github.com/sneumann/xcms/issues/247
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
438 .concatenate_XCMSnExp <- function(...) {
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
439 x <- list(...)
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
440 if (length(x) == 0)
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
441 return(NULL)
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
442 if (length(x) == 1)
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
443 return(x[[1]])
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
444 ## Check that all are XCMSnExp objects.
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
445 if (!all(unlist(lapply(x, function(z) is(z, "XCMSnExp")))))
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
446 stop("All passed objects should be 'XCMSnExp' objects")
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
447 new_x <- as(.concatenate_OnDiskMSnExp(...), "XCMSnExp")
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
448 ## If any of the XCMSnExp has alignment results or detected features drop
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
449 ## them!
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
450 x <- lapply(x, function(z) {
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
451 if (hasAdjustedRtime(z)) {
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
452 z <- dropAdjustedRtime(z)
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
453 warning("Adjusted retention times found, had to drop them.")
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
454 }
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
455 if (hasFeatures(z)) {
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
456 z <- dropFeatureDefinitions(z)
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
457 warning("Feature definitions found, had to drop them.")
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
458 }
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
459 z
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
460 })
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
461 ## Combine peaks
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
462 fls <- lapply(x, fileNames)
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
463 startidx <- cumsum(lengths(fls))
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
464 pks <- lapply(x, chromPeaks)
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
465 procH <- lapply(x, processHistory)
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
466 for (i in 2:length(fls)) {
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
467 pks[[i]][, "sample"] <- pks[[i]][, "sample"] + startidx[i - 1]
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
468 procH[[i]] <- lapply(procH[[i]], function(z) {
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
469 z@fileIndex <- as.integer(z@fileIndex + startidx[i - 1])
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
470 z
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
471 })
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
472 }
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
473 pks <- do.call(rbind, pks)
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
474 new_x@.processHistory <- unlist(procH)
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
475 chromPeaks(new_x) <- pks
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
476 if (validObject(new_x))
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
477 new_x
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
478 }
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
479
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
480 #@TODO: remove this function as soon as we can use xcms 3.x.x from Bioconductor 3.7
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
481 # https://github.com/sneumann/xcms/issues/247
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
482 .concatenate_OnDiskMSnExp <- function(...) {
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
483 x <- list(...)
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
484 if (length(x) == 0)
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
485 return(NULL)
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
486 if (length(x) == 1)
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
487 return(x[[1]])
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
488 ## Check that all are XCMSnExp objects.
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
489 if (!all(unlist(lapply(x, function(z) is(z, "OnDiskMSnExp")))))
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
490 stop("All passed objects should be 'OnDiskMSnExp' objects")
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
491 ## Check processingQueue
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
492 procQ <- lapply(x, function(z) z@spectraProcessingQueue)
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
493 new_procQ <- procQ[[1]]
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
494 is_ok <- unlist(lapply(procQ, function(z)
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
495 !is.character(all.equal(new_procQ, z))
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
496 ))
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
497 if (any(!is_ok)) {
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
498 warning("Processing queues from the submitted objects differ! ",
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
499 "Dropping the processing queue.")
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
500 new_procQ <- list()
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
501 }
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
502 ## processingData
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
503 fls <- lapply(x, function(z) z@processingData@files)
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
504 startidx <- cumsum(lengths(fls))
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
505 ## featureData
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
506 featd <- lapply(x, fData)
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
507 ## Have to update the file index and the spectrum names.
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
508 for (i in 2:length(featd)) {
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
509 featd[[i]]$fileIdx <- featd[[i]]$fileIdx + startidx[i - 1]
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
510 rownames(featd[[i]]) <- MSnbase:::formatFileSpectrumNames(
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
511 fileIds = featd[[i]]$fileIdx,
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
512 spectrumIds = featd[[i]]$spIdx,
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
513 nSpectra = nrow(featd[[i]]),
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
514 nFiles = length(unlist(fls))
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
515 )
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
516 }
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
517 featd <- do.call(rbind, featd)
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
518 featd$spectrum <- 1:nrow(featd)
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
519 ## experimentData
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
520 expdata <- lapply(x, function(z) {
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
521 ed <- z@experimentData
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
522 data.frame(instrumentManufacturer = ed@instrumentManufacturer,
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
523 instrumentModel = ed@instrumentModel,
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
524 ionSource = ed@ionSource,
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
525 analyser = ed@analyser,
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
526 detectorType = ed@detectorType,
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
527 stringsAsFactors = FALSE)
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
528 })
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
529 expdata <- do.call(rbind, expdata)
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
530 expdata <- new("MIAPE",
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
531 instrumentManufacturer = expdata$instrumentManufacturer,
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
532 instrumentModel = expdata$instrumentModel,
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
533 ionSource = expdata$ionSource,
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
534 analyser = expdata$analyser,
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
535 detectorType = expdata$detectorType)
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
536
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
537 ## protocolData
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
538 protodata <- lapply(x, function(z) z@protocolData)
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
539 if (any(unlist(lapply(protodata, nrow)) > 0))
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
540 warning("Found non-empty protocol data, but merging protocol data is",
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
541 " currently not supported. Skipped.")
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
542 ## phenoData
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
543 pdata <- do.call(rbind, lapply(x, pData))
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
544 res <- new(
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
545 "OnDiskMSnExp",
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
546 phenoData = new("NAnnotatedDataFrame", data = pdata),
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
547 featureData = new("AnnotatedDataFrame", featd),
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
548 processingData = new("MSnProcess",
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
549 processing = paste0("Concatenated [", date(), "]"),
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
550 files = unlist(fls), smoothed = NA),
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
551 experimentData = expdata,
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
552 spectraProcessingQueue = new_procQ)
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
553 if (validObject(res))
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
554 res
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
555 }
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
556
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
557 #@TODO: remove this function as soon as we can use xcms 3.x.x from Bioconductor 3.7
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
558 # https://github.com/sneumann/xcms/issues/247
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
559 c.XCMSnExp <- function(...) {
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
560 .concatenate_XCMSnExp(...)
020d065edd9e planemo upload for repository https://github.com/workflow4metabolomics/xcms commit e384d6dd5f410799ec211f73bca0b5d5d7bc651e
lecorguille
parents: 28
diff changeset
561 }