Mercurial > repos > cpt > cpt_gff_to_gbk
annotate all_fasta.loc.sample @ 5:03384dbb511d draft default tip
planemo upload commit f33bdf952d796c5d7a240b132af3c4cbd102decc
author | cpt |
---|---|
date | Fri, 05 Jan 2024 05:52:51 +0000 |
parents | 35a6c466e270 |
children |
rev | line source |
---|---|
4
35a6c466e270
planemo upload commit 852ac96ca53a2ffa0947e6df5e24671866b642f5
cpt
parents:
diff
changeset
|
1 #This file lists the locations and dbkeys of all the fasta files |
35a6c466e270
planemo upload commit 852ac96ca53a2ffa0947e6df5e24671866b642f5
cpt
parents:
diff
changeset
|
2 #under the "genome" directory (a directory that contains a directory |
35a6c466e270
planemo upload commit 852ac96ca53a2ffa0947e6df5e24671866b642f5
cpt
parents:
diff
changeset
|
3 #for each build). The script extract_fasta.py will generate the file |
35a6c466e270
planemo upload commit 852ac96ca53a2ffa0947e6df5e24671866b642f5
cpt
parents:
diff
changeset
|
4 #all_fasta.loc. This file has the format (whitespace characters are |
35a6c466e270
planemo upload commit 852ac96ca53a2ffa0947e6df5e24671866b642f5
cpt
parents:
diff
changeset
|
5 #TAB characters): |
35a6c466e270
planemo upload commit 852ac96ca53a2ffa0947e6df5e24671866b642f5
cpt
parents:
diff
changeset
|
6 # |
35a6c466e270
planemo upload commit 852ac96ca53a2ffa0947e6df5e24671866b642f5
cpt
parents:
diff
changeset
|
7 #<unique_build_id> <dbkey> <display_name> <file_path> |
35a6c466e270
planemo upload commit 852ac96ca53a2ffa0947e6df5e24671866b642f5
cpt
parents:
diff
changeset
|
8 # |
35a6c466e270
planemo upload commit 852ac96ca53a2ffa0947e6df5e24671866b642f5
cpt
parents:
diff
changeset
|
9 #So, all_fasta.loc could look something like this: |
35a6c466e270
planemo upload commit 852ac96ca53a2ffa0947e6df5e24671866b642f5
cpt
parents:
diff
changeset
|
10 # |
35a6c466e270
planemo upload commit 852ac96ca53a2ffa0947e6df5e24671866b642f5
cpt
parents:
diff
changeset
|
11 #apiMel3 apiMel3 Honeybee (Apis mellifera): apiMel3 /path/to/genome/apiMel3/apiMel3.fa |
35a6c466e270
planemo upload commit 852ac96ca53a2ffa0947e6df5e24671866b642f5
cpt
parents:
diff
changeset
|
12 #hg19canon hg19 Human (Homo sapiens): hg19 Canonical /path/to/genome/hg19/hg19canon.fa |
35a6c466e270
planemo upload commit 852ac96ca53a2ffa0947e6df5e24671866b642f5
cpt
parents:
diff
changeset
|
13 #hg19full hg19 Human (Homo sapiens): hg19 Full /path/to/genome/hg19/hg19full.fa |
35a6c466e270
planemo upload commit 852ac96ca53a2ffa0947e6df5e24671866b642f5
cpt
parents:
diff
changeset
|
14 # |
35a6c466e270
planemo upload commit 852ac96ca53a2ffa0947e6df5e24671866b642f5
cpt
parents:
diff
changeset
|
15 #Your all_fasta.loc file should contain an entry for each individual |
35a6c466e270
planemo upload commit 852ac96ca53a2ffa0947e6df5e24671866b642f5
cpt
parents:
diff
changeset
|
16 #fasta file. So there may be multiple fasta files for each build, |
35a6c466e270
planemo upload commit 852ac96ca53a2ffa0947e6df5e24671866b642f5
cpt
parents:
diff
changeset
|
17 #such as with hg19 above. |
35a6c466e270
planemo upload commit 852ac96ca53a2ffa0947e6df5e24671866b642f5
cpt
parents:
diff
changeset
|
18 # |