# HG changeset patch # User mingchen0919 # Date 1520143199 18000 # Node ID 75a55316ff323d652b52bdd38f4fba2925cc2fa8 # Parent b5a576fc2a7c9ac495b321201b8cb25d2661b391 add samtools diff -r b5a576fc2a7c -r 75a55316ff32 star.Rmd --- a/star.Rmd Sat Mar 03 12:21:18 2018 -0500 +++ b/star.Rmd Sun Mar 04 00:59:59 2018 -0500 @@ -41,3 +41,45 @@ tags$code(tags$pre(readChar(index_genome_sh, file.info(index_genome_sh)$size ))) ``` +# Running mapping jobs + +```{bash} +cd ${X_d} + +cat >temp.sh < /dev/null 2>&1 +EOF + +grep -v None temp.sh > mapping.sh + +# run mapping +sh mapping.sh +``` + + +```{r} +# display skewer job script +mapping_sh = paste0(opt$X_d, '/mapping.sh') +tags$code(tags$pre(readChar(mapping_sh, file.info(mapping_sh)$size ))) +``` + + +# SAM to sorted BAM + +```{bash} +cd ${X_d} +samtools view \ + -b Aligned.out.sam \ + -h \ + -o Aligned.out.bam + +samtools sort \ + -o Aligned.out.sorted.bam \ + Aligned.out.bam +``` + diff -r b5a576fc2a7c -r 75a55316ff32 star.sh --- a/star.sh Sat Mar 03 12:21:18 2018 -0500 +++ b/star.sh Sun Mar 04 00:59:59 2018 -0500 @@ -8,4 +8,7 @@ -A '$genomeFastaFiles' -B '$sjdbGTFfile' - -C '$sjdbOverhang' \ No newline at end of file + -C '$sjdbOverhang' + -F '$first_reads' + -R '$second_reads' + -S '$sorted_bam' \ No newline at end of file diff -r b5a576fc2a7c -r 75a55316ff32 star.xml --- a/star.xml Sat Mar 03 12:21:18 2018 -0500 +++ b/star.xml Sun Mar 04 00:59:59 2018 -0500 @@ -6,6 +6,7 @@ r-getopt r-rmarkdown star + samtools + -C '$sjdbOverhang' + -F '$first_reads' + -R '$second_reads' + -S '$sorted_bam']]> @@ -33,10 +37,13 @@ + + - + + diff -r b5a576fc2a7c -r 75a55316ff32 star_render.R --- a/star_render.R Sat Mar 03 12:21:18 2018 -0500 +++ b/star_render.R Sun Mar 04 00:59:59 2018 -0500 @@ -23,12 +23,12 @@ spec_matrix = as.matrix( data.frame(stringsAsFactors=FALSE, long_flags = c("X_e", "X_o", "X_d", "X_s", "X_t", "X_A", "X_B", - "X_C"), - short_flags = c("e", "o", "d", "s", "t", "A", "B", "C"), - argument_mask_flags = c(1L, 1L, 1L, 1L, 1L, 1L, 1L, 1L), + "X_C", "X_F", "X_R", "X_S"), + short_flags = c("e", "o", "d", "s", "t", "A", "B", "C", "F", "R", "S"), + argument_mask_flags = c(1L, 1L, 1L, 1L, 1L, 1L, 1L, 1L, 1L, 1L, 1L), data_type_flags = c("character", "character", "character", "character", "character", "character", "character", - "character") + "character", "character", "character", "character") ) ) opt = getopt(spec_matrix)