annotate QDNAseq.sh @ 26:069289631381 draft

Deleted selected files
author stef
date Mon, 06 Jul 2015 05:38:44 -0400
parents 034fedc6043f
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
1
034fedc6043f Uploaded
stef
parents:
diff changeset
1 #!/bin/sh
034fedc6043f Uploaded
stef
parents:
diff changeset
2
034fedc6043f Uploaded
stef
parents:
diff changeset
3 ## This script creates a config file for use with the QDNAseq R wrapper
034fedc6043f Uploaded
stef
parents:
diff changeset
4 ## For use outside Galaxy
034fedc6043f Uploaded
stef
parents:
diff changeset
5
034fedc6043f Uploaded
stef
parents:
diff changeset
6 QDNASEQ_R_SCRIPT='/ccagc/home/stef/code/QDNASEQ/QDNAseq.R'
034fedc6043f Uploaded
stef
parents:
diff changeset
7 R_LOCATION='/ccagc/lib/R/R-3.1.0/bin/'
034fedc6043f Uploaded
stef
parents:
diff changeset
8 OUTPUT_DIR='QDNASEQ'
034fedc6043f Uploaded
stef
parents:
diff changeset
9 SCRIPT_DIR=$(dirname $0)
034fedc6043f Uploaded
stef
parents:
diff changeset
10 SCRIPT_NAME=$(basename $0)
034fedc6043f Uploaded
stef
parents:
diff changeset
11
034fedc6043f Uploaded
stef
parents:
diff changeset
12 binSizesString='1000,100,15'
034fedc6043f Uploaded
stef
parents:
diff changeset
13 outputName=`basename $PWD`
034fedc6043f Uploaded
stef
parents:
diff changeset
14 doSegment='TRUE'
034fedc6043f Uploaded
stef
parents:
diff changeset
15 debug='FALSE'
034fedc6043f Uploaded
stef
parents:
diff changeset
16
034fedc6043f Uploaded
stef
parents:
diff changeset
17 usage()
034fedc6043f Uploaded
stef
parents:
diff changeset
18 {
034fedc6043f Uploaded
stef
parents:
diff changeset
19 cat<<EOF
034fedc6043f Uploaded
stef
parents:
diff changeset
20 This script creates a QDNAseq wrapper config.
034fedc6043f Uploaded
stef
parents:
diff changeset
21
034fedc6043f Uploaded
stef
parents:
diff changeset
22 Experiment name and/or output dir are optional
034fedc6043f Uploaded
stef
parents:
diff changeset
23 $SCRIPT_NAME [-n myExperiment] [-o outputDir] *.bam
034fedc6043f Uploaded
stef
parents:
diff changeset
24
034fedc6043f Uploaded
stef
parents:
diff changeset
25 Debug mode for working with build in LGG150 data
034fedc6043f Uploaded
stef
parents:
diff changeset
26 $SCRIPT_NAME -d
034fedc6043f Uploaded
stef
parents:
diff changeset
27
034fedc6043f Uploaded
stef
parents:
diff changeset
28 OPTIONS:
034fedc6043f Uploaded
stef
parents:
diff changeset
29 -n [s] provide analysis name [$outputName]
034fedc6043f Uploaded
stef
parents:
diff changeset
30 -o [s] output dir [$OUTPUT_DIR]
034fedc6043f Uploaded
stef
parents:
diff changeset
31 -d debug mode (only create config)
034fedc6043f Uploaded
stef
parents:
diff changeset
32
034fedc6043f Uploaded
stef
parents:
diff changeset
33 EOF
034fedc6043f Uploaded
stef
parents:
diff changeset
34 }
034fedc6043f Uploaded
stef
parents:
diff changeset
35
034fedc6043f Uploaded
stef
parents:
diff changeset
36 PARAM_COUNT=0
034fedc6043f Uploaded
stef
parents:
diff changeset
37 if [ $# -eq 0 ] || [ "$1" == "-h" ]
034fedc6043f Uploaded
stef
parents:
diff changeset
38 then
034fedc6043f Uploaded
stef
parents:
diff changeset
39 usage
034fedc6043f Uploaded
stef
parents:
diff changeset
40 exit 1
034fedc6043f Uploaded
stef
parents:
diff changeset
41 else
034fedc6043f Uploaded
stef
parents:
diff changeset
42 while getopts "n:o:d" opt; do
034fedc6043f Uploaded
stef
parents:
diff changeset
43 case $opt in
034fedc6043f Uploaded
stef
parents:
diff changeset
44 n)
034fedc6043f Uploaded
stef
parents:
diff changeset
45 #echo "$opt was triggered, Parameter: $OPTARG" >&2
034fedc6043f Uploaded
stef
parents:
diff changeset
46 outputName=$OPTARG
034fedc6043f Uploaded
stef
parents:
diff changeset
47 PARAM_COUNT=`bc <<< $PARAM_COUNT+2`
034fedc6043f Uploaded
stef
parents:
diff changeset
48 ;;
034fedc6043f Uploaded
stef
parents:
diff changeset
49 o)
034fedc6043f Uploaded
stef
parents:
diff changeset
50 OUTPUT_DIR=$OPTARG
034fedc6043f Uploaded
stef
parents:
diff changeset
51 PARAM_COUNT=`bc <<< $PARAM_COUNT+2`
034fedc6043f Uploaded
stef
parents:
diff changeset
52 ;;
034fedc6043f Uploaded
stef
parents:
diff changeset
53 d)
034fedc6043f Uploaded
stef
parents:
diff changeset
54 debug='TRUE'
034fedc6043f Uploaded
stef
parents:
diff changeset
55 PARAM_COUNT=`bc <<< $PARAM_COUNT+1`
034fedc6043f Uploaded
stef
parents:
diff changeset
56 ;;
034fedc6043f Uploaded
stef
parents:
diff changeset
57 \?)
034fedc6043f Uploaded
stef
parents:
diff changeset
58 echo "Invalid option: -$OPTARG" >&2
034fedc6043f Uploaded
stef
parents:
diff changeset
59 exit 1
034fedc6043f Uploaded
stef
parents:
diff changeset
60 ;;
034fedc6043f Uploaded
stef
parents:
diff changeset
61 :)
034fedc6043f Uploaded
stef
parents:
diff changeset
62 echo "Option -$OPTARG requires an argument." >&2
034fedc6043f Uploaded
stef
parents:
diff changeset
63 exit 1
034fedc6043f Uploaded
stef
parents:
diff changeset
64 ;;
034fedc6043f Uploaded
stef
parents:
diff changeset
65 esac
034fedc6043f Uploaded
stef
parents:
diff changeset
66 done
034fedc6043f Uploaded
stef
parents:
diff changeset
67 fi
034fedc6043f Uploaded
stef
parents:
diff changeset
68
034fedc6043f Uploaded
stef
parents:
diff changeset
69 ## set param dependent variables
034fedc6043f Uploaded
stef
parents:
diff changeset
70 printf '%s\n' "[INFO] --- QDNAseq wrapper config creator ---"
034fedc6043f Uploaded
stef
parents:
diff changeset
71 CONFIG_FILE=$OUTPUT_DIR'/qdnaseqConfig.R'
034fedc6043f Uploaded
stef
parents:
diff changeset
72
034fedc6043f Uploaded
stef
parents:
diff changeset
73 ## remove the params from input string leaving only the BAMs
034fedc6043f Uploaded
stef
parents:
diff changeset
74 shift $PARAM_COUNT
034fedc6043f Uploaded
stef
parents:
diff changeset
75
034fedc6043f Uploaded
stef
parents:
diff changeset
76 ## sanity checks
034fedc6043f Uploaded
stef
parents:
diff changeset
77 if [ -e $CONFIG_FILE ]; then
034fedc6043f Uploaded
stef
parents:
diff changeset
78 echo "[ERR] Config file ($CONFIG_FILE) already exists, exit..";
034fedc6043f Uploaded
stef
parents:
diff changeset
79 exit 0
034fedc6043f Uploaded
stef
parents:
diff changeset
80 fi
034fedc6043f Uploaded
stef
parents:
diff changeset
81 if [ -d $OUTPUT_DIR ]; then
034fedc6043f Uploaded
stef
parents:
diff changeset
82 echo "[ERR] Output dir ($OUTPUT_DIR) already exists, exit..";
034fedc6043f Uploaded
stef
parents:
diff changeset
83 exit 0
034fedc6043f Uploaded
stef
parents:
diff changeset
84 else
034fedc6043f Uploaded
stef
parents:
diff changeset
85 mkdir $OUTPUT_DIR
034fedc6043f Uploaded
stef
parents:
diff changeset
86 fi
034fedc6043f Uploaded
stef
parents:
diff changeset
87
034fedc6043f Uploaded
stef
parents:
diff changeset
88 ## variables setup
034fedc6043f Uploaded
stef
parents:
diff changeset
89 CONFIG_TXT="## ==========
034fedc6043f Uploaded
stef
parents:
diff changeset
90 ## QDNAseq pipeline config file
034fedc6043f Uploaded
stef
parents:
diff changeset
91 ## ==========
034fedc6043f Uploaded
stef
parents:
diff changeset
92
034fedc6043f Uploaded
stef
parents:
diff changeset
93 ## ----------
034fedc6043f Uploaded
stef
parents:
diff changeset
94 inGalaxy <- FALSE
034fedc6043f Uploaded
stef
parents:
diff changeset
95 binSizesString <- '$binSizesString'
034fedc6043f Uploaded
stef
parents:
diff changeset
96 experimentType <- 'SR50'
034fedc6043f Uploaded
stef
parents:
diff changeset
97 outputName <- '$outputName'
034fedc6043f Uploaded
stef
parents:
diff changeset
98
034fedc6043f Uploaded
stef
parents:
diff changeset
99 ## ----------
034fedc6043f Uploaded
stef
parents:
diff changeset
100 outputHtml <- 'galaxyIndex.html'
034fedc6043f Uploaded
stef
parents:
diff changeset
101 outputId <- NA
034fedc6043f Uploaded
stef
parents:
diff changeset
102 newFilePath <- '$OUTPUT_DIR'
034fedc6043f Uploaded
stef
parents:
diff changeset
103 outputPath <- '$OUTPUT_DIR'
034fedc6043f Uploaded
stef
parents:
diff changeset
104 doSegment <- as.logical( $doSegment )
034fedc6043f Uploaded
stef
parents:
diff changeset
105 debug <- as.logical( $debug )
034fedc6043f Uploaded
stef
parents:
diff changeset
106 undoSD <- as.double( 1.0 )
034fedc6043f Uploaded
stef
parents:
diff changeset
107 binAnnotations <- ''
034fedc6043f Uploaded
stef
parents:
diff changeset
108
034fedc6043f Uploaded
stef
parents:
diff changeset
109 ## ----------
034fedc6043f Uploaded
stef
parents:
diff changeset
110 filterBlacklistedBins <- as.logical( 'TRUE' )
034fedc6043f Uploaded
stef
parents:
diff changeset
111 mappabilityCutoff <- as.integer( 0 )
034fedc6043f Uploaded
stef
parents:
diff changeset
112 undoSplits <- 'sdundo'
034fedc6043f Uploaded
stef
parents:
diff changeset
113 doOutputCopynumbersIgv <- FALSE
034fedc6043f Uploaded
stef
parents:
diff changeset
114
034fedc6043f Uploaded
stef
parents:
diff changeset
115 ## ----------
034fedc6043f Uploaded
stef
parents:
diff changeset
116 PLOT_WIDTH <- as.integer( 1440 )
034fedc6043f Uploaded
stef
parents:
diff changeset
117 PLOT_HEIGHT <- as.integer( 720 )
034fedc6043f Uploaded
stef
parents:
diff changeset
118 excludeChrsString <- 'X,Y'
034fedc6043f Uploaded
stef
parents:
diff changeset
119
034fedc6043f Uploaded
stef
parents:
diff changeset
120 ## ----------
034fedc6043f Uploaded
stef
parents:
diff changeset
121 bamsPaths <- c()
034fedc6043f Uploaded
stef
parents:
diff changeset
122 bamsNames <- c()
034fedc6043f Uploaded
stef
parents:
diff changeset
123 "
034fedc6043f Uploaded
stef
parents:
diff changeset
124
034fedc6043f Uploaded
stef
parents:
diff changeset
125 ## create config file
034fedc6043f Uploaded
stef
parents:
diff changeset
126 printf '%s\n' "$CONFIG_TXT" > $CONFIG_FILE
034fedc6043f Uploaded
stef
parents:
diff changeset
127
034fedc6043f Uploaded
stef
parents:
diff changeset
128 ## add bam files to config file
034fedc6043f Uploaded
stef
parents:
diff changeset
129 BAMS=$@
034fedc6043f Uploaded
stef
parents:
diff changeset
130 for bam_path in $BAMS; do
034fedc6043f Uploaded
stef
parents:
diff changeset
131
034fedc6043f Uploaded
stef
parents:
diff changeset
132 if [ ! -e $bam_path ]; then
034fedc6043f Uploaded
stef
parents:
diff changeset
133 echo "[ERR] Bam file does not exist ($bam_path), exit..";
034fedc6043f Uploaded
stef
parents:
diff changeset
134 exit 0
034fedc6043f Uploaded
stef
parents:
diff changeset
135 fi
034fedc6043f Uploaded
stef
parents:
diff changeset
136
034fedc6043f Uploaded
stef
parents:
diff changeset
137 bam_name=`basename "$bam_path"`
034fedc6043f Uploaded
stef
parents:
diff changeset
138 printf '%s\n' "bamsPaths <- c( bamsPaths, \"$bam_path\" )" >> $CONFIG_FILE
034fedc6043f Uploaded
stef
parents:
diff changeset
139 printf '%s\n' "bamsNames <- c( bamsNames, \"$bam_name\" )" >> $CONFIG_FILE
034fedc6043f Uploaded
stef
parents:
diff changeset
140 printf '%s\n' "[INFO] BAM: $bam_name"
034fedc6043f Uploaded
stef
parents:
diff changeset
141 done
034fedc6043f Uploaded
stef
parents:
diff changeset
142
034fedc6043f Uploaded
stef
parents:
diff changeset
143 ## done
034fedc6043f Uploaded
stef
parents:
diff changeset
144 printf '%s\n' "[INFO] OUTPUT DIR: $OUTPUT_DIR"
034fedc6043f Uploaded
stef
parents:
diff changeset
145 printf '%s\n' "[INFO] OUTPUT NAME: $outputName"
034fedc6043f Uploaded
stef
parents:
diff changeset
146 printf '%s\n' "[INFO] CONFIG FILE can be found in $CONFIG_FILE"
034fedc6043f Uploaded
stef
parents:
diff changeset
147 printf '%s\n' "[INFO] Run with: $R_LOCATION/Rscript $QDNASEQ_R_SCRIPT $CONFIG_FILE"
034fedc6043f Uploaded
stef
parents:
diff changeset
148 printf '%s\n' "[INFO] Done"