Mercurial > repos > cpt > cpt_annotation_table
annotate all_fasta.loc.sample @ 2:6998c2570145 draft
planemo upload commit 852ac96ca53a2ffa0947e6df5e24671866b642f5
author | cpt |
---|---|
date | Sun, 23 Jul 2023 01:42:48 +0000 |
parents | |
children |
rev | line source |
---|---|
2
6998c2570145
planemo upload commit 852ac96ca53a2ffa0947e6df5e24671866b642f5
cpt
parents:
diff
changeset
|
1 #This file lists the locations and dbkeys of all the fasta files |
6998c2570145
planemo upload commit 852ac96ca53a2ffa0947e6df5e24671866b642f5
cpt
parents:
diff
changeset
|
2 #under the "genome" directory (a directory that contains a directory |
6998c2570145
planemo upload commit 852ac96ca53a2ffa0947e6df5e24671866b642f5
cpt
parents:
diff
changeset
|
3 #for each build). The script extract_fasta.py will generate the file |
6998c2570145
planemo upload commit 852ac96ca53a2ffa0947e6df5e24671866b642f5
cpt
parents:
diff
changeset
|
4 #all_fasta.loc. This file has the format (white space between columns is |
6998c2570145
planemo upload commit 852ac96ca53a2ffa0947e6df5e24671866b642f5
cpt
parents:
diff
changeset
|
5 #TAB characters): |
6998c2570145
planemo upload commit 852ac96ca53a2ffa0947e6df5e24671866b642f5
cpt
parents:
diff
changeset
|
6 # |
6998c2570145
planemo upload commit 852ac96ca53a2ffa0947e6df5e24671866b642f5
cpt
parents:
diff
changeset
|
7 #<unique_build_id> <dbkey> <display_name> <file_path> |
6998c2570145
planemo upload commit 852ac96ca53a2ffa0947e6df5e24671866b642f5
cpt
parents:
diff
changeset
|
8 # |
6998c2570145
planemo upload commit 852ac96ca53a2ffa0947e6df5e24671866b642f5
cpt
parents:
diff
changeset
|
9 #So, all_fasta.loc could look something like this: |
6998c2570145
planemo upload commit 852ac96ca53a2ffa0947e6df5e24671866b642f5
cpt
parents:
diff
changeset
|
10 # |
6998c2570145
planemo upload commit 852ac96ca53a2ffa0947e6df5e24671866b642f5
cpt
parents:
diff
changeset
|
11 #apiMel3 apiMel3 Honeybee (Apis mellifera): apiMel3 /path/to/genome/apiMel3/apiMel3.fa |
6998c2570145
planemo upload commit 852ac96ca53a2ffa0947e6df5e24671866b642f5
cpt
parents:
diff
changeset
|
12 #hg19canon hg19 Human (Homo sapiens): hg19 Canonical /path/to/genome/hg19/hg19canon.fa |
6998c2570145
planemo upload commit 852ac96ca53a2ffa0947e6df5e24671866b642f5
cpt
parents:
diff
changeset
|
13 #hg19full hg19 Human (Homo sapiens): hg19 Full /path/to/genome/hg19/hg19full.fa |
6998c2570145
planemo upload commit 852ac96ca53a2ffa0947e6df5e24671866b642f5
cpt
parents:
diff
changeset
|
14 # |
6998c2570145
planemo upload commit 852ac96ca53a2ffa0947e6df5e24671866b642f5
cpt
parents:
diff
changeset
|
15 #Your all_fasta.loc file should contain an entry for each individual |
6998c2570145
planemo upload commit 852ac96ca53a2ffa0947e6df5e24671866b642f5
cpt
parents:
diff
changeset
|
16 #fasta file. So there may be multiple fasta files for a single build, |
6998c2570145
planemo upload commit 852ac96ca53a2ffa0947e6df5e24671866b642f5
cpt
parents:
diff
changeset
|
17 #such as with hg19 above. |
6998c2570145
planemo upload commit 852ac96ca53a2ffa0947e6df5e24671866b642f5
cpt
parents:
diff
changeset
|
18 # |