Mercurial > repos > charles_s_test > seqsero2
comparison libs/sratoolkit.2.8.0-centos_linux64/schema/ncbi/seq-graph.vschema @ 3:38ad1130d077 draft
planemo upload commit a4fb57231f274270afbfebd47f67df05babffa4a-dirty
| author | charles_s_test |
|---|---|
| date | Mon, 27 Nov 2017 11:21:07 -0500 |
| parents | |
| children |
comparison
equal
deleted
inserted
replaced
| 2:0d65b71ff8df | 3:38ad1130d077 |
|---|---|
| 1 /*=========================================================================== | |
| 2 * | |
| 3 * PUBLIC DOMAIN NOTICE | |
| 4 * National Center for Biotechnology Information | |
| 5 * | |
| 6 * This software/database is a "United States Government Work" under the | |
| 7 * terms of the United States Copyright Act. It was written as part of | |
| 8 * the author's official duties as a United States Government employee and | |
| 9 * thus cannot be copyrighted. This software/database is freely available | |
| 10 * to the public for use. The National Library of Medicine and the U.S. | |
| 11 * Government have not placed any restriction on its use or reproduction. | |
| 12 * | |
| 13 * Although all reasonable efforts have been taken to ensure the accuracy | |
| 14 * and reliability of the software and data, the NLM and the U.S. | |
| 15 * Government do not and cannot warrant the performance or results that | |
| 16 * may be obtained by using this software or data. The NLM and the U.S. | |
| 17 * Government disclaim all warranties, express or implied, including | |
| 18 * warranties of performance, merchantability or fitness for any particular | |
| 19 * purpose. | |
| 20 * | |
| 21 * Please cite the author in any work or product based on this material. | |
| 22 * | |
| 23 * =========================================================================== | |
| 24 * | |
| 25 */ | |
| 26 | |
| 27 /*========================================================================== | |
| 28 * seq-graph style named annotations | |
| 29 */ | |
| 30 version 1; | |
| 31 | |
| 32 include 'vdb/vdb.vschema'; | |
| 33 | |
| 34 | |
| 35 /*-------------------------------------------------------------------------- | |
| 36 * types | |
| 37 * constants | |
| 38 */ | |
| 39 | |
| 40 // data types used by the columns of the seqgraph table below: | |
| 41 typedef utf8 NCBI:SeqGraph:sid; | |
| 42 typedef utf8 NCBI:SeqGraph:name; | |
| 43 typedef U32 NCBI:SeqGraph:len; | |
| 44 typedef U32 NCBI:SeqGraph:scale; | |
| 45 typedef I64 NCBI:SeqGraph:value; | |
| 46 typedef NCBI:SeqGraph:value NCBI:SeqGraph:start; | |
| 47 typedef NCBI:SeqGraph:value NCBI:SeqGraph:gr_q0; // min | |
| 48 typedef NCBI:SeqGraph:value NCBI:SeqGraph:gr_q10; // 10th quantile | |
| 49 typedef NCBI:SeqGraph:value NCBI:SeqGraph:gr_q50; // median | |
| 50 typedef NCBI:SeqGraph:value NCBI:SeqGraph:gr_q90; // 90th quantile | |
| 51 typedef NCBI:SeqGraph:value NCBI:SeqGraph:gr_q100; // max | |
| 52 typedef NCBI:SeqGraph:value NCBI:SeqGraph:gr_zoom_q0; // min zoomed to 100bp segment | |
| 53 typedef NCBI:SeqGraph:value NCBI:SeqGraph:gr_zoom_q10; // 10th quantile zoomed to 100bp segment | |
| 54 typedef NCBI:SeqGraph:value NCBI:SeqGraph:gr_zoom_q50; // median zoomed to 100bp segment | |
| 55 typedef NCBI:SeqGraph:value NCBI:SeqGraph:gr_zoom_q90; // 90th quantile zoomed to 100bp segment | |
| 56 typedef NCBI:SeqGraph:value NCBI:SeqGraph:gr_zoom_q100; // max zoomed to 100bp segment | |
| 57 typedef NCBI:SeqGraph:value NCBI:SeqGraph:gr_num_switches; // number of value switches in graph | |
| 58 | |
| 59 | |
| 60 /*-------------------------------------------------------------------------- | |
| 61 * tables | |
| 62 */ | |
| 63 table NCBI:SeqGraph:tbl:seqgraph #1.0 | |
| 64 { | |
| 65 /* SID | |
| 66 * Sequence id (Accession.version). | |
| 67 * Indexed: uses the 'sid' text index (idx:text:insert / idx:text:project). | |
| 68 */ | |
| 69 extern column NCBI:SeqGraph:sid SID | |
| 70 = ( NCBI:SeqGraph:sid ) idx:text:project #1.0 < 'sid' > ( .SID ); | |
| 71 physical column < NCBI:SeqGraph:sid > zip_encoding .SID | |
| 72 = ( NCBI:SeqGraph:sid ) idx:text:insert #1.0 < 'sid' > ( SID ); | |
| 73 | |
| 74 /* NAME | |
| 75 * Sequence name (which resolves into SID using assembly information). | |
| 76 * Indexed: uses the 'name' text index (idx:text:insert / idx:text:project). | |
| 77 */ | |
| 78 extern column NCBI:SeqGraph:name NAME | |
| 79 = ( NCBI:SeqGraph:name ) idx:text:project #1.0 < 'name' > ( .NAME ); | |
| 80 physical column < NCBI:SeqGraph:name > zip_encoding .NAME | |
| 81 = ( NCBI:SeqGraph:name ) idx:text:insert #1.0 < 'name' > ( NAME ); | |
| 82 | |
| 83 /* START | |
| 84 * Sequence offset for the segment saved in this row. | |
| 85 * In most cases this can be calculated from row id and LEN below. | |
| 86 */ | |
| 87 extern column < NCBI:SeqGraph:start > izip_encoding START; | |
| 88 | |
| 89 /* LEN | |
| 90 * Naming: MAX_SEQ_LEN is used in our refseq schema; | |
| 91 * CHUNK_SIZE might be preferred. | |
| 92 * Value: mostly a constant ( = 5000), except for the last row of each sequence. | |
| 93 */ | |
| 94 extern column < NCBI:SeqGraph:len > izip_encoding LEN; | |
| 95 | |
| 96 /* SCALE | |
| 97 * Scaling factor for graph values. | |
| 98 * Mostly needed in order to store values as integers when actual values | |
| 99 * are real with a certain precision. | |
| 100 */ | |
| 101 extern column < NCBI:SeqGraph:scale > izip_encoding SCALE; | |
| 102 | |
| 103 /* GRAPH | |
| 104 * Intensity values. | |
| 105 */ | |
| 106 extern column < NCBI:SeqGraph:value > izip_encoding GRAPH; | |
| 107 | |
| 108 | |
| 109 /* GR_Q0 | |
| 110 * Minimal value for the row | |
| 111 */ | |
| 112 extern column < NCBI:SeqGraph:gr_q0 > izip_encoding GR_Q0; | |
| 113 | |
| 114 | |
| 115 /* GR_Q10 | |
| 116 * 10th quantile value for the row | |
| 117 */ | |
| 118 extern column < NCBI:SeqGraph:gr_q10 > izip_encoding GR_Q10; | |
| 119 | |
| 120 | |
| 121 /* GR_Q50 | |
| 122 * Median value for the row | |
| 123 */ | |
| 124 extern column < NCBI:SeqGraph:gr_q50 > izip_encoding GR_Q50; | |
| 125 | |
| 126 | |
| 127 /* GR_Q90 | |
| 128 * 90th quantile value for the row | |
| 129 */ | |
| 130 extern column < NCBI:SeqGraph:gr_q90 > izip_encoding GR_Q90; | |
| 131 | |
| 132 | |
| 133 /* GR_Q100 | |
| 134 * Maximal value for the row | |
| 135 */ | |
| 136 extern column < NCBI:SeqGraph:gr_q100 > izip_encoding GR_Q100; | |
| 137 | |
| 138 /* GR_ZOOM_Q0 | |
| 139 * Minimal values for 100bp segments of the graph chunk | |
| 140 */ | |
| 141 extern column < NCBI:SeqGraph:gr_zoom_q0 > izip_encoding GR_ZOOM_Q0; | |
| 142 | |
| 143 | |
| 144 /* GR_ZOOM_Q10 | |
| 145 * 10th quantile values for 100bp segments of the graph chunk | |
| 146 */ | |
| 147 extern column < NCBI:SeqGraph:gr_zoom_q10 > izip_encoding GR_ZOOM_Q10; | |
| 148 | |
| 149 | |
| 150 /* GR_ZOOM_Q50 | |
| 151 * Median values for 100bp segments of the graph chunk | |
| 152 */ | |
| 153 extern column < NCBI:SeqGraph:gr_zoom_q50 > izip_encoding GR_ZOOM_Q50; | |
| 154 | |
| 155 | |
| 156 /* GR_ZOOM_Q90 | |
| 157 * 90th quantile values for 100bp segments of the graph chunk | |
| 158 */ | |
| 159 extern column < NCBI:SeqGraph:gr_zoom_q90 > izip_encoding GR_ZOOM_Q90; | |
| 160 | |
| 161 | |
| 162 /* GR_ZOOM_Q100 | |
| 163 * Maximal values for 100bp segments of the graph chunk | |
| 164 */ | |
| 165 extern column < NCBI:SeqGraph:gr_zoom_q100 > izip_encoding GR_ZOOM_Q100; | |
| 166 | |
| 167 /* NUM_SWITCHES | |
| 168 * Number of value switches within the graph. Helps the client decide how best to | |
| 169 * represent the graph in ASN.1 (Seq-graph or Seq-table). | |
| 170 */ | |
| 171 extern column < NCBI:SeqGraph:gr_num_switches > izip_encoding NUM_SWITCHES; | |
| 172 }; | |
| 173 | |
| 174 | |
| 175 database NCBI:SeqGraph:database:kmergraph #1.0 | |
| 176 { /* three member tables (LEFT, RIGHT, SUM), all using the seqgraph #1.0 table schema */ | |
| 177 table NCBI:SeqGraph:tbl:seqgraph #1.0 LEFT; | |
| 178 table NCBI:SeqGraph:tbl:seqgraph #1.0 RIGHT; | |
| 179 table NCBI:SeqGraph:tbl:seqgraph #1.0 SUM; | |
| 180 } |
