# HG changeset patch # User galaxyp # Date 1524162628 14400 # Node ID 4f8cf8fbef57e0df0e33e689204323693007a894 # Parent f2dc9805107ac7015716c882b0cab9260b39f988 planemo upload for repository https://github.com/galaxyproteomics/tools-galaxyp/tree/master/tools/mzsqlite_psm_align commit b0c57cac4e558d974a16b14d4498cf8d4ba9e0c7 diff -r f2dc9805107a -r 4f8cf8fbef57 mzsqlite_psm_align.xml --- a/mzsqlite_psm_align.xml Mon Apr 16 18:00:53 2018 -0400 +++ b/mzsqlite_psm_align.xml Thu Apr 19 14:30:28 2018 -0400 @@ -1,5 +1,5 @@ - - from mz.sqlite aand genomic mapping + + from mz.sqlite and genomic mapping biopython twobitreader @@ -41,10 +41,13 @@ '$mzsqlitedb' '$genomicdb' ]]> - - + + - + @@ -57,11 +60,14 @@ - - - + + + - + @@ -79,13 +85,18 @@ select * from feature_cds_map WHERE name like 'ENSMUSP00000000001%'; + name chrom start end strand cds_start cds_end ENSMUSP00000000001 chr3 108145887 108146005 - 0 118 ENSMUSP00000000001 chr3 108123794 108123837 - 118 161 ENSMUSP00000000001 chr3 108123541 108123683 - 161 303 @@ -107,7 +123,23 @@ ENSMUSP00000000001 chr3 108111934 108112088 - 720 874 ENSMUSP00000000001 chr3 108109421 108109612 - 874 1065 +Each row represents an exon in the search protein. +The locations: start,end, cds_start, and cds_end are **zero-based** like BED format. + +The **name** field must match the **accession** name used in the mz.sqlite database +and thus the mzIdentML search results file. + +The protein positions are described in CDS base offsets rather than Animo Acids offsets +to allow for codons being split across exons. + This schema can describe structural variants as well as canonical transcripts. +.. _proBAM: http://www.psidev.info/probam +.. _proBED: http://www.psidev.info/probed +.. _mz_to_sqlite: https://toolshed.g2.bx.psu.edu/view/galaxyp/mz_to_sqlite/e34bdac5b157 + ]]> + + 10.1186/s13059-017-1377-x +