@@ -81,8 +84,6 @@ #if $peaklist.peaklistBool - variableMetadataOutput '$variableMetadata' - dataMatrixOutput '$dataMatrix' convertRTMinute $peaklist.convertRTMinute numDigitsMZ $peaklist.numDigitsMZ numDigitsRT $peaklist.numDigitsRT @@ -108,10 +109,10 @@ - + (peaklist['peaklistBool']) - + (peaklist['peaklistBool']) @@ -131,6 +132,39 @@ + + +For details and explanations for all the parameters and the workflow of the xcms_ package, see its manual_ and this example_ + +.. _xcms: https://bioconductor.org/packages/release/bioc/html/xcms.html +.. _manual: http://www.bioconductor.org/packages/release/bioc/manuals/xcms/man/xcms.pdf +.. _example: https://bioconductor.org/packages/release/bioc/vignettes/xcms/inst/doc/xcms.html + + + + + +Get a Peak List +--------------- + +If 'true', the module generates two additional files corresponding to the peak list: +- the variable metadata file (corresponding to information about extracted ions such as mass or retention time) +- the data matrix (corresponding to related intensities) + +**decimal places for [mass or retention time] values in identifiers** + + | Ions' identifiers are constructed as MxxxTyyy where 'xxx' is the ion median mass and 'yyy' the ion median retention time. + | Two parameters are used to adjust the number of decimal places wanted in identifiers for mass and retention time respectively. + | These parameters do not affect decimal places in columns other than the identifier one. 
+ +**Reported intensity values** + + | This parameter determines which values should be reported as intensities in the dataMatrix table; it corresponds to the xcms 'intval' parameter: + | - into: integrated area of original (raw) peak + | - maxo: maximum intensity of original (raw) peak + | - intb: baseline corrected integrated peak area (only available if peak detection was done by ‘findPeaks.centWave’) + + diff -r 8ad83969888b -r 3d4339594010 test-data/faahKO-single.xset.merged.group.retcor.group.fillpeaks.RData Binary file test-data/faahKO-single.xset.merged.group.retcor.group.fillpeaks.RData has changed diff -r 8ad83969888b -r 3d4339594010 test-data/faahKO-single.xset.merged.group.retcor.group.fillpeaks.summary.html --- a/test-data/faahKO-single.xset.merged.group.retcor.group.fillpeaks.summary.html Tue Feb 13 04:45:13 2018 -0500 +++ b/test-data/faahKO-single.xset.merged.group.retcor.group.fillpeaks.summary.html Thu Mar 01 04:17:50 2018 -0500 @@ -17,79 +17,126 @@

Samples used:

- +

sample	filename	md5sum^*
ko15	./ko15.CDF	4698c36c0b3af007faf70975c04ccf2a
ko16	./ko16.CDF	afaeed94ced3140bc042d5ab6aeb16c1
wt15	./wt15.CDF	d58a27fad7c04ddddb0359ddc2b7ba68
wt16	./wt16.CDF	29654e9f8ad48c1fbe2a41b9ba578f6e
ko15	ko15.CDF	4698c36c0b3af007faf70975c04ccf2a
ko16	ko16.CDF	afaeed94ced3140bc042d5ab6aeb16c1
wt15	wt15.CDF	d58a27fad7c04ddddb0359ddc2b7ba68
wt16	wt16.CDF	29654e9f8ad48c1fbe2a41b9ba578f6e

^*The program md5sum is designed to verify data integrity. So you can check if the data were uploaded correctly or if the data were changed during the process.

Function launched:

- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - + + + + +

timestamp^***	function	argument	value
170203-11:04:42	xcmsSet	nSlaves	1
		method	centWave
		ppm	25
		peakwidth	2050
170203-11:05:21	xcmsSet	nSlaves	1
		method	centWave
		ppm	25
		peakwidth	2050
170203-11:06:21	xcmsSet	nSlaves	1
		method	centWave
		ppm	25
		peakwidth	2050
170203-11:06:59	xcmsSet	nSlaves	1
		method	centWave
		ppm	25
		peakwidth	2050
170203-14:38:53	group	method	density
		sleep	0.001
		minfrac	0.3
		bw	5
		mzwid	0.01
		max	50
170203-14:51:16	retcor	method	peakgroups
		smooth	loess
		extra	1
		missing	1
		span	0.2
		family	gaussian
		plottype	deviation
170203-15:27:58	group	method	density
		sleep	0.001
		minfrac	0.3
		bw	5
		mzwid	0.01
		max	50
170203-15:44:50	fillPeaks	method	chrom
		convertRTMinute	FALSE
		numDigitsMZ	4
		numDigitsRT	1
		intval	into
Wed Feb 7 11:15:25 2018	Peak detection	+Object of class: CentWaveParam +Parameters: + ppm: 25 + peakwidth: 20, 50 + snthresh: 10 + prefilter: 3, 100 + mzCenterFun: wMean + integrate: 1 + mzdiff: -0.001 + fitgauss: FALSE + noise: 0 + verboseColumns: FALSE + roiList length: 0 + firstBaselineCheck TRUE + roiScales length: 0 +
Mon Feb 12 15:31:11 2018	Peak grouping	+Object of class: PeakDensityParam +Parameters: + sampleGroups: character of length 4 + bw: 30 + minFraction: 0.8 + minSamples: 1 + binSize: 0.25 + maxFeatures: 50 +
Mon Feb 12 15:31:19 2018	Retention time correction	+Object of class: PeakGroupsParam +Parameters: + minFraction: 0.85 + extraPeaks: 1 + smooth: loess + span: 0.2 + family: gaussian + number of peak groups: 125 +
Mon Feb 12 15:31:27 2018	Peak grouping	+Object of class: PeakDensityParam +Parameters: + sampleGroups: character of length 4 + bw: 20 + minFraction: 0.4 + minSamples: 1 + binSize: 0.25 + maxFeatures: 50 +
Wed Feb 14 09:55:13 2018	Missing peak filling	+Object of class: FillChromPeaksParam +Parameters: + expandMz: 0 + expandRt: 0 + ppm: 0 +

-
^***timestamp format: yymmdd-hh:mm:ss +
^***timestamp format: DD MM dd hh:mm:ss YYYY or yymmdd-hh:mm:ss

Informations about the XCMSnExp object:

+MSn experiment data ("XCMSnExp")
+Object size in memory: 1.36 Mb
+- - - Spectra data - - -
+ MS level(s): 1 
+ Number of spectra: 5112 
+ MSn retention times: 41:33 - 75:0 minutes
+- - - Processing information - - -
+Concatenated [Thu Feb  8 15:36:09 2018] 
+ MSnbase version: 2.4.2 
+- - - Meta data  - - -
+phenoData
+  rowNames: ./ko15.CDF ./ko16.CDF ./wt15.CDF ./wt16.CDF
+  varLabels: sample_name sample_group
+  varMetadata: labelDescription
+Loaded from:
+  [1] ko15.CDF...  [4] wt16.CDF
+  Use 'fileNames(.)' to see all files.
+protocolData: none
+featureData
+  featureNames: F1.S0001 F1.S0002 ... F4.S1278 (5112 total)
+  fvarLabels: fileIdx spIdx ... spectrum (27 total)
+  fvarMetadata: labelDescription
+experimentData: use 'experimentData(object)'
+- - - xcms preprocessing - - -
+Chromatographic peak detection:
+ method: centWave 
+ 15230 peaks identified in 4 samples.
+ On average 3808 chromatographic peaks per sample.
+Alignment/retention time adjustment:
+ method: peak groups 
+Correspondence:
+ method: chromatographic peak density 
+ 6332 features identified.
+ Median mz range of features: 0
+ Median rt range of features: 0
+ 5979 filled peaks (on average 1494.75 per sample).
+

Informations about the xcmsSet object:

 An "xcmsSet" object with 4 samples
 
-Time range: 2506-4484 seconds (41.8-74.7 minutes)
+Time range: 2499.4-4473.6 seconds (41.7-74.6 minutes)
 Mass range: 200.1-600 m/z
-Peaks: 32720 (about 8180 per sample)
-Peak Groups: 8157 
+Peaks: 15230 (about 3808 per sample)
+Peak Groups: 6332 
 Sample classes: KO, WT 
 
-Peak picking was performed on MS1.
+Feature detection:
+ o Peak picking performed on MS1.
+ o Scan range limited to  1 - 1278 
 Profile settings: method = bin
                   step = 0.1
 
-Memory usage: 4.25 MB
+Memory usage: 2.98 MB

Citations:

Samples used:

- +

sample	filename	md5sum^*
ko15	faahKO_reduce/KO/ko15.CDF	4698c36c0b3af007faf70975c04ccf2a
ko16	faahKO_reduce/KO/ko16.CDF	afaeed94ced3140bc042d5ab6aeb16c1
wt15	faahKO_reduce/WT/wt15.CDF	d58a27fad7c04ddddb0359ddc2b7ba68
wt16	faahKO_reduce/WT/wt16.CDF	29654e9f8ad48c1fbe2a41b9ba578f6e
ko15	faahKO_reduce/KO/ko15.CDF	4698c36c0b3af007faf70975c04ccf2a
ko16	faahKO_reduce/KO/ko16.CDF	afaeed94ced3140bc042d5ab6aeb16c1
wt15	faahKO_reduce/WT/wt15.CDF	d58a27fad7c04ddddb0359ddc2b7ba68
wt16	faahKO_reduce/WT/wt16.CDF	29654e9f8ad48c1fbe2a41b9ba578f6e

^*The program md5sum is designed to verify data integrity. So you can check if the data were uploaded correctly or if the data were changed during the process.

^***

Informations about the xcmsSet object:

@@ -66,6 +66,7 @@
 Peak Groups: 8157 
 Sample classes: KO, WT 
 
+Feature detection:
 Profile settings: method = bin
                   step = 0.1
 
diff -r 8ad83969888b -r 3d4339594010 xcms_summary.r
--- a/xcms_summary.r	Tue Feb 13 04:45:13 2018 -0500
+++ b/xcms_summary.r	Thu Mar 01 04:17:50 2018 -0500
@@ -1,51 +1,81 @@
 #!/usr/bin/env Rscript
-# version="1.0.0"
-#@author Gildas Le Corguille lecorguille@sb-roscoff.fr ABIMS TEAM
 
 
 
 # ----- ARGUMENTS BLACKLIST -----
 #xcms.r
-argBlacklist=c("zipfile","singlefile_galaxyPath","singlefile_sampleName","xfunction","xsetRdataOutput","sampleMetadataOutput","ticspdf","bicspdf","rplotspdf")
+argBlacklist <- c("zipfile", "singlefile_galaxyPath", "singlefile_sampleName", "xfunction", "xsetRdataOutput", "sampleMetadataOutput", "ticspdf", "bicspdf", "rplotspdf")
 #CAMERA.r
-argBlacklist=c(argBlacklist,"dataMatrixOutput","variableMetadataOutput","new_file_path")
+argBlacklist <- c(argBlacklist, "dataMatrixOutput", "variableMetadataOutput", "new_file_path")
+
 
 # ----- PACKAGE -----
+cat("\tSESSION INFO\n")
 
-pkgs=c("parallel","BiocGenerics", "Biobase", "Rcpp", "mzR", "igraph", "xcms","CAMERA","batch")
-for(pkg in pkgs) {
-    cat(pkg,"\n")
-    suppressPackageStartupMessages( stopifnot( library(pkg, quietly=TRUE, logical.return=TRUE, character.only=TRUE)))
-}
+#Import the different functions
+source_local <- function(fname){ argv <- commandArgs(trailingOnly=FALSE); base_dir <- dirname(substring(argv[grep("--file=", argv)], 8)); source(paste(base_dir, fname, sep="/")) }
+source_local("lib.r")
+
+pkgs <- c("CAMERA","batch")
+loadAndDisplayPackages(pkgs)
+cat("\n\n");
 
 
 # ----- FUNCTION -----
-writehtml = function(...) { cat(...,"\n", file=htmlOutput,append = TRUE,sep="") }
+writehtml <- function(...) { cat(...,"\n", file=htmlOutput,append = TRUE,sep="") }
+# Write the printed form of `object` to the file `htmlOutput` (appending by default; `open` is passed to file()).
+# stdout is diverted only while print() runs; the sink is removed and the connection closed even if print() fails.
+writeraw <- function(htmlOutput, object, open="at") {
+    log_file <- file(htmlOutput, open = open)
+    sink(log_file, type = "output")
+    tryCatch(print(object), finally = { sink(); close(log_file) })
+    invisible(NULL)
+}
+# Sample names of an xcms object: sampnames() for an xcmsSet, the phenoData sample_name column for an XCMSnExp, NULL otherwise.
+getSampleNames <- function(xobject) {
+    if (inherits(xobject, "xcmsSet")) return(sampnames(xobject))
+    if (inherits(xobject, "XCMSnExp")) return(xobject@phenoData@data$sample_name)
+    invisible(NULL)  # unsupported class: same silent NULL as before
+}
+# Raw data file paths of an xcms object: the filepaths slot for an xcmsSet, fileNames() for an XCMSnExp, NULL otherwise.
+getFilePaths <- function(xobject) {
+    if (inherits(xobject, "xcmsSet")) return(xobject@filepaths)
+    if (inherits(xobject, "XCMSnExp")) return(fileNames(xobject))
+    invisible(NULL)  # unsupported class: same silent NULL as before
+}
+# TRUE when the two objects print identically, FALSE otherwise (always a single unnamed logical, never NA).
+equalParams <- function(param1, param2) {
+    # Compare the captured print() output directly: no scratch files are left in the working directory
+    identical(utils::capture.output(print(param1)), utils::capture.output(print(param2)))
+}
 
 
 # ----- ARGUMENTS -----
 
-listArguments = parseCommandArgs(evaluate=FALSE) #interpretation of arguments given in command line as an R list of objects
+args <- parseCommandArgs(evaluate=FALSE) #interpretation of arguments given in command line as an R list of objects
 
 
 # ----- ARGUMENTS PROCESSING -----
 
 #image is an .RData file necessary to use xset variable given by previous tools
-load(listArguments[["image"]]);
+load(args$image);
 
-htmlOutput = "summary.html"
-if (!is.null(listArguments[["htmlOutput"]])) htmlOutput = listArguments[["htmlOutput"]];
+htmlOutput <- "summary.html"
+if (!is.null(args$htmlOutput)) htmlOutput = args$htmlOutput;
 
-user_email = NULL
-if (!is.null(listArguments[["user_email"]])) user_email = listArguments[["user_email"]];
+user_email <- NULL
+if (!is.null(args$user_email)) user_email = args$user_email;
 
-# if the RData come from CAMERA
-if (!exists("xset") & exists("xa")) xset=xa@xcmsSet
-
+# if the RData come from XCMS 1.x
+if (exists("xset")) xobject <- xset
+# if the RData come from CAMERA
+if (exists("xa")) xobject <- xa@xcmsSet
+# if the RData come from XCMS 3.x
+if (exists("xdata")) xobject <- xdata
+if (!exists("xobject")) stop("You need at least a xdata, a xset or a xa object.")
 # retrocompatability
-if (!exists("sampleNamesList")) sampleNamesList=list("sampleNamesMakeNames"=make.names(sampnames(xset)))
+if (!exists("sampleNamesList")) sampleNamesList <- list("sampleNamesMakeNames"=make.names(getSampleNames(xobject)))  # runs last: it needs the resolved xobject, whatever its class
 
-if (!exists("xset")) stop("You need at least a xset or a xa object.")
 
 
 
@@ -71,37 +101,37 @@
     writehtml("___ XCMS analysis summary using Workflow4Metabolomics ___")
     # to pass the planemo shed_test
     if (user_email != "test@bx.psu.edu") {
-        if (!is.null(user_email)) writehtml("By: ",user_email," - ")
-        writehtml("Date: ",format(Sys.time(), "%y%m%d-%H:%M:%S"))
+        if (!is.null(user_email)) writehtml("By: ", user_email," - ")
+        writehtml("Date: ", format(Sys.time(), "%y%m%d-%H:%M:%S"))
     }
     writehtml("")
 
     writehtml("Samples used:")
     writehtml("")
-        if (all(sampnames(xset) == sampleNamesList$sampleNamesMakeNames)) {
-            sampleNameHeaderHtml = paste("")
-            sampleNameHtml = paste("")
+        if (all(getSampleNames(xobject) == sampleNamesList$sampleNamesMakeNames)) {
+            sampleNameHeaderHtml <- paste0("")
+            sampleNameHtml <- paste0("")
         } else {
-            sampleNameHeaderHtml = paste("")
-            sampleNameHtml = paste("")
+            sampleNameHeaderHtml <- paste0("")
+            sampleNameHtml <- paste0("")
         }
 
         if (!exists("md5sumList")) {
-            md5sumHeaderHtml = ""
-            md5sumHtml = ""
-            md5sumLegend=""
+            md5sumHeaderHtml <- ""
+            md5sumHtml <- ""
+            md5sumLegend <- ""
         } else if (is.null(md5sumList$removalBadCharacters)) {
-            md5sumHeaderHtml = paste("")
-            md5sumHtml = paste("")
-            md5sumLegend = "
^*The program md5sum is designed to verify data integrity. So you can check if the data were uploaded correctly or if the data were changed during the process."
+            md5sumHeaderHtml <- paste0("")
+            md5sumHtml <- paste0("")
+            md5sumLegend <- "
^*The program md5sum is designed to verify data integrity. So you can check if the data were uploaded correctly or if the data were changed during the process."
         } else {
-            md5sumHeaderHtml = paste("")
-            md5sumHtml = paste("")
-            md5sumLegend = "
^*The program md5sum is designed to verify data integrity. So you can check if the data were uploaded correctly or if the data were changed during the process.
^**Because some bad characters (eg: accent) were removed from your original file, the checksum have changed too.
"
+            md5sumHeaderHtml <- paste0("")
+            md5sumHtml <- paste0("")
+            md5sumLegend <- "
^*The program md5sum is designed to verify data integrity. So you can check if the data were uploaded correctly or if the data were changed during the process.
^**Because some bad characters (eg: accent) were removed from your original file, the checksum have changed too.
"
         }
 
         writehtml("",sampleNameHeaderHtml,"",md5sumHeaderHtml,"")
-        writehtml(paste("",sampleNameHtml,"",md5sumHtml,""))
+        writehtml(paste0("",sampleNameHtml,"",md5sumHtml,""))
 
     writehtml("sample ",sampnames(xset)," sample ",getSampleNames(xobject)," sample sample renamed ",sampnames(xset)," ",sampleNamesList$sampleNamesMakeNames," sample sample renamed ",getSampleNames(xobject)," ",sampleNamesList$sampleNamesMakeNames," md5sum^* ",md5sumList$origin," md5sum^* ",md5sumList$origin," md5sum^* md5sum^** after bad characters removal ",md5sumList$origin," ",md5sumList$removalBadCharacters," md5sum^* md5sum^** after bad characters removal ",md5sumList$origin," ",md5sumList$removalBadCharacters,"
filename
",xset@filepaths,"
",getFilePaths(xobject),"")
     writehtml(md5sumLegend)
@@ -110,32 +140,57 @@
     writehtml("Function launched:")
     writehtml("")
         writehtml("")
-        for(tool in names(listOFlistArguments)) {
-            listOFlistArgumentsDisplay=listOFlistArguments[[tool]][!(names(listOFlistArguments[[tool]]) %in% argBlacklist)]
+        # XCMS 3.x
+        if (class(xobject) == "XCMSnExp") {
+            xcmsFunction <- NULL
+            params <- NULL
+            for (processHistoryItem in processHistory(xobject)) {
+                if ((xcmsFunction == processType(processHistoryItem)) && equalParams(params, processParam(processHistoryItem)))
+                    next
+                timestamp <- processDate(processHistoryItem)
+                xcmsFunction <- processType(processHistoryItem)
+                params <- processParam(processHistoryItem)
+                writehtml("")
+            }
+        }
+        # CAMERA and retrocompatability XCMS 1.x
+        if (exists("listOFlistArguments")) {
+            for(tool in names(listOFlistArguments)) {
+                listOFlistArgumentsDisplay <- listOFlistArguments[[tool]][!(names(listOFlistArguments[[tool]]) %in% argBlacklist)]
 
-            timestamp = strsplit(tool,"_")[[1]][1]
-            xcmsFunction = strsplit(tool,"_")[[1]][2]
-            writehtml("")
-            line_begin=""
-            for (arg in names(listOFlistArgumentsDisplay)) {
-                writehtml(line_begin,"")
-                line_begin=""
+                timestamp <- strsplit(tool,"_")[[1]][1]
+                xcmsFunction <- strsplit(tool,"_")[[1]][2]
+                writehtml("")
+                line_begin <- ""
+                for (arg in names(listOFlistArgumentsDisplay)) {
+                    writehtml(line_begin,"")
+                    line_begin <- ""
+                }
             }
         }
     writehtml("timestamp^*** function argument value
",timestamp," ",xcmsFunction," ")
+                writeraw(htmlOutput, params)
+                writehtml("
",timestamp," ",xcmsFunction," ",arg," ",unlist(listOFlistArgumentsDisplay[arg][1]),"
",timestamp," ",xcmsFunction," ",arg," ",unlist(listOFlistArgumentsDisplay[arg][1]),"
")
-    writehtml("
^***timestamp format: yymmdd-hh:mm:ss")
+    writehtml("
^***timestamp format: DD MM dd hh:mm:ss YYYY or yymmdd-hh:mm:ss")
     writehtml("")
 
+    if (class(xobject) == "XCMSnExp") {
+        writehtml("Informations about the XCMSnExp object:")
+
+        writehtml("")
+            writeraw(htmlOutput, xobject)
+        writehtml("")
+    }
+
     writehtml("Informations about the xcmsSet object:")
 
     writehtml("")
-        log_file=file(htmlOutput, open = "at")
-        sink(log_file)
-        sink(log_file, type = "output")
-            xset
-        sink()
+        # Get the legacy xcmsSet object
+        xset <- getxcmsSetObject(xobject)
+        writeraw(htmlOutput, xset)
     writehtml("")
 
+    # CAMERA
     if (exists("xa")) {
         writehtml("Informations about the CAMERA object:")

filename
sample	",sampnames(xset),"	sample	",getSampleNames(xobject),"	sample	sample renamed	",sampnames(xset),"	",sampleNamesList$sampleNamesMakeNames,"	sample	sample renamed	",getSampleNames(xobject),"	",sampleNamesList$sampleNamesMakeNames,"	md5sum^*	",md5sumList$origin,"	md5sum^*	",md5sumList$origin,"	md5sum^*	md5sum^** after bad characters removal	",md5sumList$origin,"	",md5sumList$removalBadCharacters,"	md5sum^*	md5sum^** after bad characters removal	",md5sumList$origin,"	",md5sumList$removalBadCharacters,"
",xset@filepaths,"
",getFilePaths(xobject),"

timestamp^***	function	argument	value
",timestamp,"	",xcmsFunction,"	") + writeraw(htmlOutput, params) + writehtml("
",timestamp,"	",xcmsFunction,"	",arg,"	",unlist(listOFlistArgumentsDisplay[arg][1]),"
",timestamp,"	",xcmsFunction,"	",arg,"	",unlist(listOFlistArgumentsDisplay[arg][1]),"