Mercurial > repos > sanbi-uwc > data_manager_fetch_refseq
annotate tool-data/all_fasta.loc.sample @ 2:a4ee45e7237b draft
planemo upload for repository https://github.com/pvanheus/refseq_fasta_data_manager commit a0125981706495e0a8be4fafe2eb1af3f0cfdaa3-dirty
author | sanbi-uwc |
---|---|
date | Fri, 07 Sep 2018 18:08:23 -0400 |
parents | cfe6cd521835 |
children |
rev | line source |
---|---|
0
cfe6cd521835
planemo upload for repository https://github.com/pvanheus/refseq_fasta_data_manager commit cfd2aa18826b938402ccfc6003f1793886001202-dirty
sanbi-uwc
parents:
diff
changeset
|
1 #This file lists the locations and dbkeys of all the fasta files |
cfe6cd521835
planemo upload for repository https://github.com/pvanheus/refseq_fasta_data_manager commit cfd2aa18826b938402ccfc6003f1793886001202-dirty
sanbi-uwc
parents:
diff
changeset
|
2 #under the "genome" directory (a directory that contains a directory |
cfe6cd521835
planemo upload for repository https://github.com/pvanheus/refseq_fasta_data_manager commit cfd2aa18826b938402ccfc6003f1793886001202-dirty
sanbi-uwc
parents:
diff
changeset
|
3 #for each build). The script extract_fasta.py will generate the file |
cfe6cd521835
planemo upload for repository https://github.com/pvanheus/refseq_fasta_data_manager commit cfd2aa18826b938402ccfc6003f1793886001202-dirty
sanbi-uwc
parents:
diff
changeset
|
4 #all_fasta.loc. This file has the format (fields are separated by |
cfe6cd521835
planemo upload for repository https://github.com/pvanheus/refseq_fasta_data_manager commit cfd2aa18826b938402ccfc6003f1793886001202-dirty
sanbi-uwc
parents:
diff
changeset
|
5 #TAB characters): |
cfe6cd521835
planemo upload for repository https://github.com/pvanheus/refseq_fasta_data_manager commit cfd2aa18826b938402ccfc6003f1793886001202-dirty
sanbi-uwc
parents:
diff
changeset
|
6 # |
cfe6cd521835
planemo upload for repository https://github.com/pvanheus/refseq_fasta_data_manager commit cfd2aa18826b938402ccfc6003f1793886001202-dirty
sanbi-uwc
parents:
diff
changeset
|
7 #<unique_build_id>	<dbkey>	<display_name>	<file_path> |
cfe6cd521835
planemo upload for repository https://github.com/pvanheus/refseq_fasta_data_manager commit cfd2aa18826b938402ccfc6003f1793886001202-dirty
sanbi-uwc
parents:
diff
changeset
|
8 # |
cfe6cd521835
planemo upload for repository https://github.com/pvanheus/refseq_fasta_data_manager commit cfd2aa18826b938402ccfc6003f1793886001202-dirty
sanbi-uwc
parents:
diff
changeset
|
9 #So, all_fasta.loc could look something like this: |
cfe6cd521835
planemo upload for repository https://github.com/pvanheus/refseq_fasta_data_manager commit cfd2aa18826b938402ccfc6003f1793886001202-dirty
sanbi-uwc
parents:
diff
changeset
|
10 # |
cfe6cd521835
planemo upload for repository https://github.com/pvanheus/refseq_fasta_data_manager commit cfd2aa18826b938402ccfc6003f1793886001202-dirty
sanbi-uwc
parents:
diff
changeset
|
11 #apiMel3	apiMel3	Honeybee (Apis mellifera): apiMel3	/path/to/genome/apiMel3/apiMel3.fa |
cfe6cd521835
planemo upload for repository https://github.com/pvanheus/refseq_fasta_data_manager commit cfd2aa18826b938402ccfc6003f1793886001202-dirty
sanbi-uwc
parents:
diff
changeset
|
12 #hg19canon	hg19	Human (Homo sapiens): hg19 Canonical	/path/to/genome/hg19/hg19canon.fa |
cfe6cd521835
planemo upload for repository https://github.com/pvanheus/refseq_fasta_data_manager commit cfd2aa18826b938402ccfc6003f1793886001202-dirty
sanbi-uwc
parents:
diff
changeset
|
13 #hg19full	hg19	Human (Homo sapiens): hg19 Full	/path/to/genome/hg19/hg19full.fa |
cfe6cd521835
planemo upload for repository https://github.com/pvanheus/refseq_fasta_data_manager commit cfd2aa18826b938402ccfc6003f1793886001202-dirty
sanbi-uwc
parents:
diff
changeset
|
14 # |
cfe6cd521835
planemo upload for repository https://github.com/pvanheus/refseq_fasta_data_manager commit cfd2aa18826b938402ccfc6003f1793886001202-dirty
sanbi-uwc
parents:
diff
changeset
|
15 #Your all_fasta.loc file should contain an entry for each individual |
cfe6cd521835
planemo upload for repository https://github.com/pvanheus/refseq_fasta_data_manager commit cfd2aa18826b938402ccfc6003f1793886001202-dirty
sanbi-uwc
parents:
diff
changeset
|
16 #fasta file. So there may be multiple fasta files for each build, |
cfe6cd521835
planemo upload for repository https://github.com/pvanheus/refseq_fasta_data_manager commit cfd2aa18826b938402ccfc6003f1793886001202-dirty
sanbi-uwc
parents:
diff
changeset
|
17 #such as with hg19 above. |
cfe6cd521835
planemo upload for repository https://github.com/pvanheus/refseq_fasta_data_manager commit cfd2aa18826b938402ccfc6003f1793886001202-dirty
sanbi-uwc
parents:
diff
changeset
|
18 # |