# HG changeset patch # User rnateam # Date 1446639486 18000 # Node ID 1bfc5a5de843118a737d9fad4d69a63ecc93b593 # Parent e841de88235ce1c22524868db28cedbbdbddb0b8 Uploaded diff -r e841de88235c -r 1bfc5a5de843 convert_bc_to_binary_RY.xml --- a/convert_bc_to_binary_RY.xml Fri Oct 23 07:28:06 2015 -0400 +++ b/convert_bc_to_binary_RY.xml Wed Nov 04 07:18:06 2015 -0500 @@ -1,5 +1,5 @@ - - Convert to binary barcodes. + + from regular barcodes. macros.xml @@ -25,15 +25,21 @@ diff -r e841de88235c -r 1bfc5a5de843 coords2clnt.xml --- a/coords2clnt.xml Fri Oct 23 07:28:06 2015 -0400 +++ b/coords2clnt.xml Wed Nov 04 07:18:06 2015 -0500 @@ -1,5 +1,5 @@ - - Extract crosslinked nucleotide. + + from full alignments macros.xml @@ -32,6 +32,7 @@ Crosslinked nts are assumed to be one nt upstream of the 5'-end of the read. Input: + * bed6 file containing coordinates of aligned reads * bed6 file containing coordinates of crosslinking events diff -r e841de88235c -r 1bfc5a5de843 extract_aln_ends.xml --- a/extract_aln_ends.xml Fri Oct 23 07:28:06 2015 -0400 +++ b/extract_aln_ends.xml Wed Nov 04 07:18:06 2015 -0500 @@ -1,5 +1,5 @@ - - Extract alignment ends from sam file. + + from a sam file macros.xml @@ -37,9 +37,11 @@ ("forward-reverse") direction. Input: + * sam file containing alignments (paired-end sequencing) Output: + * bed6 file containing outer coordinates (sorted by read id) Author: Daniel Maticzka diff -r e841de88235c -r 1bfc5a5de843 extract_bcs.xml --- a/extract_bcs.xml Fri Oct 23 07:28:06 2015 -0400 +++ b/extract_bcs.xml Wed Nov 04 07:18:06 2015 -0500 @@ -1,5 +1,5 @@ - - Extract barcodes using pattern. + + using pattern. macros.xml diff -r e841de88235c -r 1bfc5a5de843 merge_pcr_duplicates.xml --- a/merge_pcr_duplicates.xml Fri Oct 23 07:28:06 2015 -0400 +++ b/merge_pcr_duplicates.xml Wed Nov 04 07:18:06 2015 -0500 @@ -1,5 +1,5 @@ - - Merge PCR duplicates according to random barcode library. + + according to random barcode library. macros.xml @@ -35,11 +35,13 @@ Barcodes containing uncalled base 'N' are removed. -Input: +Input:: + * bed6 file containing alignments with fastq read-id in name field * fasta library with fastq read-id as sequence ids -Output: +Output:: + * bed6 file with random barcode in name field and number of PCR duplicates as score, sorted by fields chrom, start, stop, strand, name Author: Daniel Maticzka diff -r e841de88235c -r 1bfc5a5de843 remove_tail.xml --- a/remove_tail.xml Fri Oct 23 07:28:06 2015 -0400 +++ b/remove_tail.xml Wed Nov 04 07:18:06 2015 -0500 @@ -1,5 +1,5 @@ - - Remove nts from 3'-end. + + from FASTQ macros.xml diff -r e841de88235c -r 1bfc5a5de843 rm_spurious_events.xml --- a/rm_spurious_events.xml Fri Oct 23 07:28:06 2015 -0400 +++ b/rm_spurious_events.xml Wed Nov 04 07:18:06 2015 -0500 @@ -1,5 +1,5 @@ - - Remove spurious events. + + crosslinking events macros.xml @@ -32,17 +32,17 @@