annotate test-data/README.test_db @ 1:edb671f0661e draft default tip

planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/genomad/ commit dddf8b42771f66318f3325607bbd7aa33a3716b5
author ufz
date Mon, 07 Oct 2024 11:51:02 +0000
parents 955e33326e20
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
1 Creating a smaller reference database: https://github.com/apcamargo/genomad/issues/104#issuecomment-2170949010
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
2
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
3 - Download reference db v1.7
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
4 - store in dir genomad_db in test-data
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
5 - run test and get ids with `awk -v FS="\t" 'NR>1 && $9!="NA" {print $9}' output/sequence_annotate/sequence_genes.tsv | sort -u > markers`
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
6 - join -1 2 -2 1 genomad_db/genomad_db.lookup markers | cut -d" " -f 2 | sort -u -n > sorted_markers
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
7 - cd genomad_db
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
8 - `mmseqs createsubdb ../sorted_markers genomad_db genomad_microdb`
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
9 - mv genomad_microdb.index genomad_db.index
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
10 - mv genomad_microdb.dbtype genomad_db.dbtype
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
11 - mv genomad_microdb genomad_db
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
12 - rm genomad_microdb*
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
13