Mercurial > repos > charles_s_test > seqsero2
comparison libs/sratoolkit.2.8.0-centos_linux64/schema/sra/generic-fastq.vschema @ 3:38ad1130d077 draft
planemo upload commit a4fb57231f274270afbfebd47f67df05babffa4a-dirty
author | charles_s_test |
---|---|
date | Mon, 27 Nov 2017 11:21:07 -0500 |
parents | |
children |
comparison
equal
deleted
inserted
replaced
2:0d65b71ff8df | 3:38ad1130d077 |
---|---|
1 /*=========================================================================== | |
2 * | |
3 * PUBLIC DOMAIN NOTICE | |
4 * National Center for Biotechnology Information | |
5 * | |
6 * This software/database is a "United States Government Work" under the | |
7 * terms of the United States Copyright Act. It was written as part of | |
8 * the author's official duties as a United States Government employee and | |
9 * thus cannot be copyrighted. This software/database is freely available | |
10 * to the public for use. The National Library of Medicine and the U.S. | |
11 * Government have not placed any restriction on its use or reproduction. | |
12 * | |
13 * Although all reasonable efforts have been taken to ensure the accuracy | |
14 * and reliability of the software and data, the NLM and the U.S. | |
15 * Government do not and cannot warrant the performance or results that | |
16 * may be obtained by using this software or data. The NLM and the U.S. | |
17 * Government disclaim all warranties, express or implied, including | |
18 * warranties of performance, merchantability or fitness for any particular | |
19 * purpose. | |
20 * | |
21 * Please cite the author in any work or product based on this material. | |
22 * | |
23 * =========================================================================== | |
24 * | |
25 */ | |
26 | |
27 /*========================================================================== | |
28 * NCBI Generic Fastq Sequence Read Archive schema | |
29 */ | |
30 version 1; | |
31 | |
32 include 'insdc/sra.vschema'; | |
33 include 'ncbi/sra.vschema'; | |
34 include 'ncbi/clip.vschema'; | |
35 include 'ncbi/spotname.vschema'; | |
36 | |
37 /* tokenize_spot_name - external function taking an ascii name and returning NCBI:SRA:spot_name_token; currently ascii only capability */ | |
38 | |
39 extern function NCBI:SRA:spot_name_token | |
40 NCBI:SRA:GenericFastq:tokenize_spot_name #1 ( ascii name ); | |
41 | |
42 /*-------------------------------------------------------------------------- | |
43 * NCBI:SRA:GenericFastq:sequence | |
44 * Generic Fastq SRA Platform: inherits the sra, base_space, phred_quality and clip tables; platform is echoed as UNDEFINED | |
45 */ | |
46 table NCBI:SRA:GenericFastq:sequence #1 | |
47 = NCBI:SRA:tbl:sra #2.1.3 | |
48 , NCBI:tbl:base_space #2.0.3 | |
49 , NCBI:tbl:phred_quality #2.0.4 | |
50 , NCBI:SRA:tbl:clip #1.0.2 | |
51 { | |
52 ascii platform_name | |
53 = < ascii > echo < "UNDEFINED" > (); | |
54 | |
55 INSDC:SRA:platform_id out_platform | |
56 = < INSDC:SRA:platform_id > echo < SRA_PLATFORM_UNDEFINED > (); | |
57 | |
58 /* ascii only spot name tokenizer, applied to _out_name (out) and to NAME (in) */ | |
59 | |
60 NCBI:SRA:spot_name_token out_spot_name_tok | |
61 = NCBI:SRA:GenericFastq:tokenize_spot_name ( _out_name ); | |
62 | |
63 NCBI:SRA:spot_name_token in_spot_name_tok | |
64 = NCBI:SRA:GenericFastq:tokenize_spot_name ( NAME ); | |
65 | |
66 /* clips: physical .CLIP_* columns of type INSDC:coord:one using izip_encoding, each assigned from the same-named CLIP_* name */ | |
67 | |
68 physical column < INSDC:coord:one > izip_encoding | |
69 .CLIP_ADAPTER_LEFT = CLIP_ADAPTER_LEFT; | |
70 physical column < INSDC:coord:one > izip_encoding | |
71 .CLIP_ADAPTER_RIGHT = CLIP_ADAPTER_RIGHT; | |
72 physical column < INSDC:coord:one > izip_encoding | |
73 .CLIP_QUALITY_LEFT = CLIP_QUALITY_LEFT; | |
74 physical column < INSDC:coord:one > izip_encoding | |
75 .CLIP_QUALITY_RIGHT = CLIP_QUALITY_RIGHT; | |
76 } | |
77 | |
78 database NCBI:SRA:GenericFastq:db #1 | |
79 { /* single member: the GenericFastq:sequence table under the name SEQUENCE */ | |
80 table NCBI:SRA:GenericFastq:sequence #1.0 SEQUENCE; | |
81 }; | |
82 | |
83 /*-------------------------------------------------------------------------- | |
84 * NCBI:SRA:GenericFastq:sequence_no_name | |
85 * Generic Fastq SRA Platform (without name): same parent tables as GenericFastq:sequence, but defines no spot name tokenizer productions | |
86 */ | |
87 table NCBI:SRA:GenericFastq:sequence_no_name #1 | |
88 = NCBI:SRA:tbl:sra #2.1.3 | |
89 , NCBI:tbl:base_space #2.0.3 | |
90 , NCBI:tbl:phred_quality #2.0.4 | |
91 , NCBI:SRA:tbl:clip #1.0.2 | |
92 { | |
93 ascii platform_name | |
94 = < ascii > echo < "UNDEFINED" > (); | |
95 | |
96 INSDC:SRA:platform_id out_platform | |
97 = < INSDC:SRA:platform_id > echo < SRA_PLATFORM_UNDEFINED > (); | |
98 | |
99 /* clips: physical .CLIP_* columns of type INSDC:coord:one using izip_encoding, each assigned from the same-named CLIP_* name */ | |
100 | |
101 physical column < INSDC:coord:one > izip_encoding | |
102 .CLIP_ADAPTER_LEFT = CLIP_ADAPTER_LEFT; | |
103 physical column < INSDC:coord:one > izip_encoding | |
104 .CLIP_ADAPTER_RIGHT = CLIP_ADAPTER_RIGHT; | |
105 physical column < INSDC:coord:one > izip_encoding | |
106 .CLIP_QUALITY_LEFT = CLIP_QUALITY_LEFT; | |
107 physical column < INSDC:coord:one > izip_encoding | |
108 .CLIP_QUALITY_RIGHT = CLIP_QUALITY_RIGHT; | |
109 } | |
110 | |
111 database NCBI:SRA:GenericFastqNoNames:db #1 | |
112 { /* single member: the GenericFastq:sequence_no_name table under the name SEQUENCE */ | |
113 table NCBI:SRA:GenericFastq:sequence_no_name #1.0 SEQUENCE; | |
114 }; | |
115 | |
116 /*-------------------------------------------------------------------------- | |
117 * NCBI:SRA:GenericFastq:sequence_log_odds | |
118 * Generic Fastq SRA Platform (for log_odds): inherits NCBI:tbl:log_odds_quality where GenericFastq:sequence inherits phred_quality | |
119 */ | |
120 table NCBI:SRA:GenericFastq:sequence_log_odds #1 | |
121 = NCBI:SRA:tbl:sra #2.1.3 | |
122 , NCBI:tbl:base_space #2.0.3 | |
123 , NCBI:tbl:log_odds_quality #2.1.0 | |
124 , NCBI:SRA:tbl:clip #1.0.2 | |
125 { | |
126 ascii platform_name | |
127 = < ascii > echo < "UNDEFINED" > (); | |
128 | |
129 INSDC:SRA:platform_id out_platform | |
130 = < INSDC:SRA:platform_id > echo < SRA_PLATFORM_UNDEFINED > (); | |
131 | |
132 /* ascii only spot name tokenizer, applied to _out_name (out) and to NAME (in) */ | |
133 | |
134 NCBI:SRA:spot_name_token out_spot_name_tok | |
135 = NCBI:SRA:GenericFastq:tokenize_spot_name ( _out_name ); | |
136 | |
137 NCBI:SRA:spot_name_token in_spot_name_tok | |
138 = NCBI:SRA:GenericFastq:tokenize_spot_name ( NAME ); | |
139 | |
140 /* clips: physical .CLIP_* columns of type INSDC:coord:one using izip_encoding, each assigned from the same-named CLIP_* name */ | |
141 | |
142 physical column < INSDC:coord:one > izip_encoding | |
143 .CLIP_ADAPTER_LEFT = CLIP_ADAPTER_LEFT; | |
144 physical column < INSDC:coord:one > izip_encoding | |
145 .CLIP_ADAPTER_RIGHT = CLIP_ADAPTER_RIGHT; | |
146 physical column < INSDC:coord:one > izip_encoding | |
147 .CLIP_QUALITY_LEFT = CLIP_QUALITY_LEFT; | |
148 physical column < INSDC:coord:one > izip_encoding | |
149 .CLIP_QUALITY_RIGHT = CLIP_QUALITY_RIGHT; | |
150 } | |
151 | |
152 database NCBI:SRA:GenericFastqLogOdds:db #1 | |
153 { /* single member: the GenericFastq:sequence_log_odds table under the name SEQUENCE */ | |
154 table NCBI:SRA:GenericFastq:sequence_log_odds #1.0 SEQUENCE; | |
155 }; | |
156 | |
157 /*-------------------------------------------------------------------------- | |
158 * NCBI:SRA:GenericFastq:sequence_nanopore | |
159 * Oxford Nanopore SRA Platform: inherits sra, base_space and phred_quality (no clip table); adds CHANNEL and READ_NUMBER columns | |
160 */ | |
161 table NCBI:SRA:GenericFastq:sequence_nanopore #1 | |
162 = NCBI:SRA:tbl:sra #2.1.3 | |
163 , NCBI:tbl:base_space #2.0.3 | |
164 , NCBI:tbl:phred_quality #2.0.4 | |
165 { | |
166 ascii platform_name | |
167 = < ascii > echo < "OXFORD_NANOPORE" > (); | |
168 | |
169 INSDC:SRA:platform_id out_platform | |
170 = < INSDC:SRA:platform_id > echo < SRA_PLATFORM_OXFORD_NANOPORE > (); | |
171 | |
172 /* ascii only spot name tokenizer, applied to _out_name (out) and to NAME (in) */ | |
173 | |
174 NCBI:SRA:spot_name_token out_spot_name_tok | |
175 = NCBI:SRA:GenericFastq:tokenize_spot_name ( _out_name ); | |
176 | |
177 NCBI:SRA:spot_name_token in_spot_name_tok | |
178 = NCBI:SRA:GenericFastq:tokenize_spot_name ( NAME ); | |
179 | |
180 /* channel and read number columns: both U32, declared extern with izip_encoding #1 */ | |
181 | |
182 extern column < U32 > izip_encoding #1 CHANNEL; | |
183 extern column < U32 > izip_encoding #1 READ_NUMBER; | |
184 } | |
185 | |
186 /*-------------------------------------------------------------------------- | |
187 * NCBI:SRA:GenericFastq:consensus_nanopore | |
188 * Oxford Nanopore SRA Platform (consensus table): same parents and column definitions as GenericFastq:sequence_nanopore, under a separate table name | |
189 */ | |
190 table NCBI:SRA:GenericFastq:consensus_nanopore #1 | |
191 = NCBI:SRA:tbl:sra #2.1.3 | |
192 , NCBI:tbl:base_space #2.0.3 | |
193 , NCBI:tbl:phred_quality #2.0.4 | |
194 { | |
195 ascii platform_name | |
196 = < ascii > echo < "OXFORD_NANOPORE" > (); | |
197 | |
198 INSDC:SRA:platform_id out_platform | |
199 = < INSDC:SRA:platform_id > echo < SRA_PLATFORM_OXFORD_NANOPORE > (); | |
200 | |
201 /* ascii only spot name tokenizer, applied to _out_name (out) and to NAME (in) */ | |
202 | |
203 NCBI:SRA:spot_name_token out_spot_name_tok | |
204 = NCBI:SRA:GenericFastq:tokenize_spot_name ( _out_name ); | |
205 | |
206 NCBI:SRA:spot_name_token in_spot_name_tok | |
207 = NCBI:SRA:GenericFastq:tokenize_spot_name ( NAME ); | |
208 | |
209 /* channel and read number columns: both U32, declared extern with izip_encoding #1 */ | |
210 | |
211 extern column < U32 > izip_encoding #1 CHANNEL; | |
212 extern column < U32 > izip_encoding #1 READ_NUMBER; | |
213 } | |
214 | |
215 database NCBI:SRA:GenericFastqNanopore:db #1 | |
216 { /* two members: sequence_nanopore as SEQUENCE and consensus_nanopore as CONSENSUS */ | |
217 table NCBI:SRA:GenericFastq:sequence_nanopore #1.0 SEQUENCE; | |
218 table NCBI:SRA:GenericFastq:consensus_nanopore #1.0 CONSENSUS; | |
219 }; | |
220 | |
221 database NCBI:SRA:GenericFastqNanoporeConsensusOnly:db #1 | |
222 { /* single member: consensus_nanopore as CONSENSUS; no SEQUENCE table is declared */ | |
223 table NCBI:SRA:GenericFastq:consensus_nanopore #1.0 CONSENSUS; | |
224 }; | |
225 | |
226 /*-------------------------------------------------------------------------- | |
227 * NCBI:SRA:GenericFastq:absolid | |
228 * Generic fastq for AB Solid platform: inherits color_space instead of base_space. NOTE(review): platform_name and out_platform are echoed as UNDEFINED, not an AB Solid specific value - confirm this is intended | |
229 */ | |
230 table NCBI:SRA:GenericFastq:absolid #1 | |
231 = NCBI:SRA:tbl:sra #2.1.3 | |
232 , NCBI:tbl:color_space #2.1.0 | |
233 , NCBI:tbl:phred_quality #2.0.4 | |
234 , NCBI:SRA:tbl:clip #1.0.2 | |
235 { | |
236 ascii platform_name | |
237 = < ascii > echo < "UNDEFINED" > (); | |
238 | |
239 INSDC:SRA:platform_id out_platform | |
240 = < INSDC:SRA:platform_id > echo < SRA_PLATFORM_UNDEFINED > (); | |
241 | |
242 /* ascii only spot name tokenizer, applied to _out_name (out) and to NAME (in) */ | |
243 | |
244 NCBI:SRA:spot_name_token out_spot_name_tok | |
245 = NCBI:SRA:GenericFastq:tokenize_spot_name ( _out_name ); | |
246 | |
247 NCBI:SRA:spot_name_token in_spot_name_tok | |
248 = NCBI:SRA:GenericFastq:tokenize_spot_name ( NAME ); | |
249 | |
250 /* clips: physical .CLIP_* columns of type INSDC:coord:one using izip_encoding, each assigned from the same-named CLIP_* name */ | |
251 | |
252 physical column < INSDC:coord:one > izip_encoding | |
253 .CLIP_ADAPTER_LEFT = CLIP_ADAPTER_LEFT; | |
254 physical column < INSDC:coord:one > izip_encoding | |
255 .CLIP_ADAPTER_RIGHT = CLIP_ADAPTER_RIGHT; | |
256 physical column < INSDC:coord:one > izip_encoding | |
257 .CLIP_QUALITY_LEFT = CLIP_QUALITY_LEFT; | |
258 physical column < INSDC:coord:one > izip_encoding | |
259 .CLIP_QUALITY_RIGHT = CLIP_QUALITY_RIGHT; | |
260 } | |
261 | |
262 database NCBI:SRA:GenericFastqAbsolid:db #1 | |
263 { /* single member: the GenericFastq:absolid table under the name SEQUENCE */ | |
264 table NCBI:SRA:GenericFastq:absolid #1.0 SEQUENCE; | |
265 }; | |