# HG changeset patch # User jbrayet # Date 1453985026 18000 # Node ID 8f3347849abf54b3e573da78e320dfa3bbecab1d # Parent f8c76a03d758be3d81a88b76dd42c0ec7f3be09c Uploaded diff -r f8c76a03d758 -r 8f3347849abf ncPRO-PROFILING.xml --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/ncPRO-PROFILING.xml Thu Jan 28 07:43:46 2016 -0500 @@ -0,0 +1,592 @@ + + of mapped reads + + institutcuriengsintegration/ncproseqgalaxy:1.6.5 + + ncPRO-PROFILING.sh + -i $input + -g $genome + -t $cond.datatype + -e $cond['database']$cond['borne']$cond['N1']"_"$cond['N2'] + -l $outlog + #if str($cond.datatype) == "matmir": + -o $out_mirna_ab + -p $out_mirna_dis + #elif str($cond.datatype) == 'trna': + -o $out_trna_ab + -p $out_trna_dis + #elif str($cond.datatype) == 'premir': + -o $out_premirna_ab + -p $out_premirna_dis + #elif str($cond.datatype) == 'rfam': + -o $out_rfam_ab + -p $out_rfam_dis + #elif str($cond.datatype) == 'rmsk': + -o $out_rmsk_ab + -p $out_rmsk_dis + #end if + -r ${__root_dir__} + -n $projectName + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + Fill this field with +/- value + + + Fill this field with +/- value + + + + + + + + + + + + + + + + + + Fill this field with +/- value + + + Fill this field with +/- value + + + + + + + + + + + + + + + + Fill this field with +/- value + + + Fill this field with +/- value + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + Fill this field with +/- value + + + Fill this field with +/- value + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + Fill this field with +/- value + + + Fill this field with +/- value + + + + + + + + + + + (str(cond['datatype']) == "matmir") + + + (str(cond['datatype']) == "matmir") + + + + (str(cond['datatype']) == "premir") + + + (str(cond['datatype']) == "premir") + + + + (str(cond['datatype']) == "trna") + + + (str(cond['datatype']) == "trna") + + + + (str(cond['datatype']) == "rfam") + + + (str(cond['datatype']) == "rfam") + + + + (str(cond['datatype']) == "rmsk") + + + (str(cond['datatype']) == "rmsk") + + + + + + + +**What ncPRO-seq does ?** + +------ + +ncPRO-seq is a tool for annotation and profiling of ncRNAs from smallRNA sequencing data. It aims to interrogate and perform detailed analysis on small RNAs derived from annotated non-coding regions in miRBase, Rfam and repeatMasker, and regions defined by users. A command line version and an online version are available at http://ncpro.curie.fr. +If you use the ncPRO-seq tool for your analysis, please cite the following paper : +Chen C., Servant N., Toedling J., Sarazin A., Marchais A., Duvernois-Berthet E., Cognat V., Colot V., Voinnet O., Heard E., Ciaudo C. and Barillot E. (2012) ncPRO-seq: a tool for annotation and profiling analysis of ncRNAs from small RNA-seq.Bioinformatics.28(23):3147-9. + +# Copyleft ↄ⃝ 2012 Institut Curie +# Author(s): Jocelyn Brayet, Laurene Syx, Chongjian Chen, Nicolas Servant(Institut Curie) 2012 - 2015 +# Contact: bioinfo.ncproseq@curie.fr +# This software is distributed without any guarantee under the terms of the GNU General +# Public License, either Version 2, June 1991 or Version 3, June 2007. + +------ + +**Input Formats** + +Aligned file (BAM) is allowed. See ncPRO-seq Alignment and quality control for more details. + +------ + +**Profiling** + +Read profiling refers to the analysis of read profiles, which are represented by the distribution of positional read coverage and the read length distribution in annotation families. For a given annotation family, ncPRO-seq will compute and plot two types of read profiles by using abundant and distinct reads. (Note that distinct reads are read groups that only count once for reads with he same sequence, whereas abudant reads are all sequenced reads.) + +-Reads with multiple mapping sites +A major challenging problem using NGS sequencing data is the annotation of reads aligned at multiple +locations. Most of the available frameworks resolve this situation by discarding these reads or by +providing random annotations. Here, we propose to keep all the reads aligned to the genome, and to +weight them by the number of mapping sites. Suppose a read can be aligned 5 times to the genome, +for each mapping site, the read would be counted as 0.2, i.e. 1/5. + +-Annotation +There are four types of extended items which can be used to modify coordinates. +1- shorten [+-]N1 bp at 5' end, [+-]N2 bp at 3' end +2- extend [+-]N1 bp at 5' end, [+-]N2 bp at 3' end +3- get coordinates for sub-region from position N1 to N2 indexed from 5' end +4- get coordinates for sub-region from position N1 to N2 indexed from 3' end + +For instance, due to the inaccurate processing of precursor miRNAs by Dicer or downstream miRNA remodelling, mature miRNAs often have end heterogeneities comparing to their annotations in miRBase. Thus, when analyzing mature miRNAs, it is necessary to extend miRNA annotation several bases (e.g. 2 bases) in both upstream and downstream region. + + +