Mercurial > repos > charles_s_test > seqsero2
comparison libs/sratoolkit.2.8.0-centos_linux64/schema/sra/generic-fastq.vschema @ 3:38ad1130d077 draft
planemo upload commit a4fb57231f274270afbfebd47f67df05babffa4a-dirty
| author | charles_s_test |
|---|---|
| date | Mon, 27 Nov 2017 11:21:07 -0500 |
| parents | |
| children | |
comparison
equal
deleted
inserted
replaced
| 2:0d65b71ff8df | 3:38ad1130d077 |
|---|---|
| 1 /*=========================================================================== | |
| 2 * | |
| 3 * PUBLIC DOMAIN NOTICE | |
| 4 * National Center for Biotechnology Information | |
| 5 * | |
| 6 * This software/database is a "United States Government Work" under the | |
| 7 * terms of the United States Copyright Act. It was written as part of | |
| 8 * the author's official duties as a United States Government employee and | |
| 9 * thus cannot be copyrighted. This software/database is freely available | |
| 10 * to the public for use. The National Library of Medicine and the U.S. | |
| 11 * Government have not placed any restriction on its use or reproduction. | |
| 12 * | |
| 13 * Although all reasonable efforts have been taken to ensure the accuracy | |
| 14 * and reliability of the software and data, the NLM and the U.S. | |
| 15 * Government do not and cannot warrant the performance or results that | |
| 16 * may be obtained by using this software or data. The NLM and the U.S. | |
| 17 * Government disclaim all warranties, express or implied, including | |
| 18 * warranties of performance, merchantability or fitness for any particular | |
| 19 * purpose. | |
| 20 * | |
| 21 * Please cite the author in any work or product based on this material. | |
| 22 * | |
| 23 * =========================================================================== | |
| 24 * | |
| 25 */ | |
| 26 | |
| 27 /*========================================================================== | |
| 28 * NCBI Generic Fastq Sequence Read Archive schema | |
| 29 */ | |
| 30 version 1; | |
| 31 | |
| 32 include 'insdc/sra.vschema'; | |
| 33 include 'ncbi/sra.vschema'; | |
| 34 include 'ncbi/clip.vschema'; | |
| 35 include 'ncbi/spotname.vschema'; | |
| 36 | |
| 37 /* tokenize_spot_name - currently supports ASCII spot names only */ | |
| 38 | |
| 39 extern function NCBI:SRA:spot_name_token | |
| 40 NCBI:SRA:GenericFastq:tokenize_spot_name #1 ( ascii name ); | |
| 41 | |
| 42 /*-------------------------------------------------------------------------- | |
| 43 * NCBI:SRA:GenericFastq:sequence | |
| 44 * Generic Fastq SRA Platform | |
| 45 */ | |
| 46 table NCBI:SRA:GenericFastq:sequence #1 | |
| 47 = NCBI:SRA:tbl:sra #2.1.3 | |
| 48 , NCBI:tbl:base_space #2.0.3 | |
| 49 , NCBI:tbl:phred_quality #2.0.4 | |
| 50 , NCBI:SRA:tbl:clip #1.0.2 | |
| 51 { | |
| 52 ascii platform_name | |
| 53 = < ascii > echo < "UNDEFINED" > (); | |
| 54 | |
| 55 INSDC:SRA:platform_id out_platform | |
| 56 = < INSDC:SRA:platform_id > echo < SRA_PLATFORM_UNDEFINED > (); | |
| 57 | |
| 58 /* ascii only spot name tokenizer */ | |
| 59 | |
| 60 NCBI:SRA:spot_name_token out_spot_name_tok | |
| 61 = NCBI:SRA:GenericFastq:tokenize_spot_name ( _out_name ); | |
| 62 | |
| 63 NCBI:SRA:spot_name_token in_spot_name_tok | |
| 64 = NCBI:SRA:GenericFastq:tokenize_spot_name ( NAME ); | |
| 65 | |
| 66 /* clips */ | |
| 67 | |
| 68 physical column < INSDC:coord:one > izip_encoding | |
| 69 .CLIP_ADAPTER_LEFT = CLIP_ADAPTER_LEFT; | |
| 70 physical column < INSDC:coord:one > izip_encoding | |
| 71 .CLIP_ADAPTER_RIGHT = CLIP_ADAPTER_RIGHT; | |
| 72 physical column < INSDC:coord:one > izip_encoding | |
| 73 .CLIP_QUALITY_LEFT = CLIP_QUALITY_LEFT; | |
| 74 physical column < INSDC:coord:one > izip_encoding | |
| 75 .CLIP_QUALITY_RIGHT = CLIP_QUALITY_RIGHT; | |
| 76 } | |
| 77 | |
| 78 database NCBI:SRA:GenericFastq:db #1 | |
| 79 { | |
| 80 table NCBI:SRA:GenericFastq:sequence #1.0 SEQUENCE; | |
| 81 }; | |
| 82 | |
| 83 /*-------------------------------------------------------------------------- | |
| 84 * NCBI:SRA:GenericFastq:sequence_no_name | |
| 85 * Generic Fastq SRA Platform (without name) | |
| 86 */ | |
| 87 table NCBI:SRA:GenericFastq:sequence_no_name #1 | |
| 88 = NCBI:SRA:tbl:sra #2.1.3 | |
| 89 , NCBI:tbl:base_space #2.0.3 | |
| 90 , NCBI:tbl:phred_quality #2.0.4 | |
| 91 , NCBI:SRA:tbl:clip #1.0.2 | |
| 92 { | |
| 93 ascii platform_name | |
| 94 = < ascii > echo < "UNDEFINED" > (); | |
| 95 | |
| 96 INSDC:SRA:platform_id out_platform | |
| 97 = < INSDC:SRA:platform_id > echo < SRA_PLATFORM_UNDEFINED > (); | |
| 98 | |
| 99 /* clips */ | |
| 100 | |
| 101 physical column < INSDC:coord:one > izip_encoding | |
| 102 .CLIP_ADAPTER_LEFT = CLIP_ADAPTER_LEFT; | |
| 103 physical column < INSDC:coord:one > izip_encoding | |
| 104 .CLIP_ADAPTER_RIGHT = CLIP_ADAPTER_RIGHT; | |
| 105 physical column < INSDC:coord:one > izip_encoding | |
| 106 .CLIP_QUALITY_LEFT = CLIP_QUALITY_LEFT; | |
| 107 physical column < INSDC:coord:one > izip_encoding | |
| 108 .CLIP_QUALITY_RIGHT = CLIP_QUALITY_RIGHT; | |
| 109 } | |
| 110 | |
| 111 database NCBI:SRA:GenericFastqNoNames:db #1 | |
| 112 { | |
| 113 table NCBI:SRA:GenericFastq:sequence_no_name #1.0 SEQUENCE; | |
| 114 }; | |
| 115 | |
| 116 /*-------------------------------------------------------------------------- | |
| 117 * NCBI:SRA:GenericFastq:sequence_log_odds | |
| 118 * Generic Fastq SRA Platform (for log_odds) | |
| 119 */ | |
| 120 table NCBI:SRA:GenericFastq:sequence_log_odds #1 | |
| 121 = NCBI:SRA:tbl:sra #2.1.3 | |
| 122 , NCBI:tbl:base_space #2.0.3 | |
| 123 , NCBI:tbl:log_odds_quality #2.1.0 | |
| 124 , NCBI:SRA:tbl:clip #1.0.2 | |
| 125 { | |
| 126 ascii platform_name | |
| 127 = < ascii > echo < "UNDEFINED" > (); | |
| 128 | |
| 129 INSDC:SRA:platform_id out_platform | |
| 130 = < INSDC:SRA:platform_id > echo < SRA_PLATFORM_UNDEFINED > (); | |
| 131 | |
| 132 /* ascii only spot name tokenizer */ | |
| 133 | |
| 134 NCBI:SRA:spot_name_token out_spot_name_tok | |
| 135 = NCBI:SRA:GenericFastq:tokenize_spot_name ( _out_name ); | |
| 136 | |
| 137 NCBI:SRA:spot_name_token in_spot_name_tok | |
| 138 = NCBI:SRA:GenericFastq:tokenize_spot_name ( NAME ); | |
| 139 | |
| 140 /* clips */ | |
| 141 | |
| 142 physical column < INSDC:coord:one > izip_encoding | |
| 143 .CLIP_ADAPTER_LEFT = CLIP_ADAPTER_LEFT; | |
| 144 physical column < INSDC:coord:one > izip_encoding | |
| 145 .CLIP_ADAPTER_RIGHT = CLIP_ADAPTER_RIGHT; | |
| 146 physical column < INSDC:coord:one > izip_encoding | |
| 147 .CLIP_QUALITY_LEFT = CLIP_QUALITY_LEFT; | |
| 148 physical column < INSDC:coord:one > izip_encoding | |
| 149 .CLIP_QUALITY_RIGHT = CLIP_QUALITY_RIGHT; | |
| 150 } | |
| 151 | |
| 152 database NCBI:SRA:GenericFastqLogOdds:db #1 | |
| 153 { | |
| 154 table NCBI:SRA:GenericFastq:sequence_log_odds #1.0 SEQUENCE; | |
| 155 }; | |
| 156 | |
| 157 /*-------------------------------------------------------------------------- | |
| 158 * NCBI:SRA:GenericFastq:sequence_nanopore | |
| 159 * Oxford Nanopore SRA Platform | |
| 160 */ | |
| 161 table NCBI:SRA:GenericFastq:sequence_nanopore #1 | |
| 162 = NCBI:SRA:tbl:sra #2.1.3 | |
| 163 , NCBI:tbl:base_space #2.0.3 | |
| 164 , NCBI:tbl:phred_quality #2.0.4 | |
| 165 { | |
| 166 ascii platform_name | |
| 167 = < ascii > echo < "OXFORD_NANOPORE" > (); | |
| 168 | |
| 169 INSDC:SRA:platform_id out_platform | |
| 170 = < INSDC:SRA:platform_id > echo < SRA_PLATFORM_OXFORD_NANOPORE > (); | |
| 171 | |
| 172 /* ascii only spot name tokenizer */ | |
| 173 | |
| 174 NCBI:SRA:spot_name_token out_spot_name_tok | |
| 175 = NCBI:SRA:GenericFastq:tokenize_spot_name ( _out_name ); | |
| 176 | |
| 177 NCBI:SRA:spot_name_token in_spot_name_tok | |
| 178 = NCBI:SRA:GenericFastq:tokenize_spot_name ( NAME ); | |
| 179 | |
| 180 /* channel and read number columns */ | |
| 181 | |
| 182 extern column < U32 > izip_encoding #1 CHANNEL; | |
| 183 extern column < U32 > izip_encoding #1 READ_NUMBER; | |
| 184 } | |
| 185 | |
| 186 /*-------------------------------------------------------------------------- | |
| 187 * NCBI:SRA:GenericFastq:consensus_nanopore | |
| 187 * Oxford Nanopore SRA Platform (consensus) | |
| 189 */ | |
| 190 table NCBI:SRA:GenericFastq:consensus_nanopore #1 | |
| 191 = NCBI:SRA:tbl:sra #2.1.3 | |
| 192 , NCBI:tbl:base_space #2.0.3 | |
| 193 , NCBI:tbl:phred_quality #2.0.4 | |
| 194 { | |
| 195 ascii platform_name | |
| 196 = < ascii > echo < "OXFORD_NANOPORE" > (); | |
| 197 | |
| 198 INSDC:SRA:platform_id out_platform | |
| 199 = < INSDC:SRA:platform_id > echo < SRA_PLATFORM_OXFORD_NANOPORE > (); | |
| 200 | |
| 201 /* ascii only spot name tokenizer */ | |
| 202 | |
| 203 NCBI:SRA:spot_name_token out_spot_name_tok | |
| 204 = NCBI:SRA:GenericFastq:tokenize_spot_name ( _out_name ); | |
| 205 | |
| 206 NCBI:SRA:spot_name_token in_spot_name_tok | |
| 207 = NCBI:SRA:GenericFastq:tokenize_spot_name ( NAME ); | |
| 208 | |
| 209 /* channel and read number columns */ | |
| 210 | |
| 211 extern column < U32 > izip_encoding #1 CHANNEL; | |
| 212 extern column < U32 > izip_encoding #1 READ_NUMBER; | |
| 213 } | |
| 214 | |
| 215 database NCBI:SRA:GenericFastqNanopore:db #1 | |
| 216 { | |
| 217 table NCBI:SRA:GenericFastq:sequence_nanopore #1.0 SEQUENCE; | |
| 218 table NCBI:SRA:GenericFastq:consensus_nanopore #1.0 CONSENSUS; | |
| 219 }; | |
| 220 | |
| 221 database NCBI:SRA:GenericFastqNanoporeConsensusOnly:db #1 | |
| 222 { | |
| 223 table NCBI:SRA:GenericFastq:consensus_nanopore #1.0 CONSENSUS; | |
| 224 }; | |
| 225 | |
| 226 /*-------------------------------------------------------------------------- | |
| 227 * NCBI:SRA:GenericFastq:absolid | |
| 228 * Generic Fastq for AB SOLiD platform | |
| 229 */ | |
| 230 table NCBI:SRA:GenericFastq:absolid #1 | |
| 231 = NCBI:SRA:tbl:sra #2.1.3 | |
| 232 , NCBI:tbl:color_space #2.1.0 | |
| 233 , NCBI:tbl:phred_quality #2.0.4 | |
| 234 , NCBI:SRA:tbl:clip #1.0.2 | |
| 235 { | |
| 236 ascii platform_name | |
| 237 = < ascii > echo < "UNDEFINED" > (); | |
| 238 | |
| 239 INSDC:SRA:platform_id out_platform | |
| 240 = < INSDC:SRA:platform_id > echo < SRA_PLATFORM_UNDEFINED > (); | |
| 241 | |
| 242 /* ascii only spot name tokenizer */ | |
| 243 | |
| 244 NCBI:SRA:spot_name_token out_spot_name_tok | |
| 245 = NCBI:SRA:GenericFastq:tokenize_spot_name ( _out_name ); | |
| 246 | |
| 247 NCBI:SRA:spot_name_token in_spot_name_tok | |
| 248 = NCBI:SRA:GenericFastq:tokenize_spot_name ( NAME ); | |
| 249 | |
| 250 /* clips */ | |
| 251 | |
| 252 physical column < INSDC:coord:one > izip_encoding | |
| 253 .CLIP_ADAPTER_LEFT = CLIP_ADAPTER_LEFT; | |
| 254 physical column < INSDC:coord:one > izip_encoding | |
| 255 .CLIP_ADAPTER_RIGHT = CLIP_ADAPTER_RIGHT; | |
| 256 physical column < INSDC:coord:one > izip_encoding | |
| 257 .CLIP_QUALITY_LEFT = CLIP_QUALITY_LEFT; | |
| 258 physical column < INSDC:coord:one > izip_encoding | |
| 259 .CLIP_QUALITY_RIGHT = CLIP_QUALITY_RIGHT; | |
| 260 } | |
| 261 | |
| 262 database NCBI:SRA:GenericFastqAbsolid:db #1 | |
| 263 { | |
| 264 table NCBI:SRA:GenericFastq:absolid #1.0 SEQUENCE; | |
| 265 }; |
