annotate genomad_end_to_end.xml @ 0:955e33326e20 draft

planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
author ufz
date Tue, 18 Jun 2024 14:28:44 +0000
parents
children edb671f0661e
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
1 <tool id="genomad_end_to_end" name="geNomad" version="@TOOL_VERSION@+galaxy@VERSION_SUFFIX@" profile="23.0" license="MIT">
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
2 <description>identify virus and plasmid genomes from nucleotide sequences</description>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
3 <macros>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
4 <token name="@TOOL_VERSION@">1.8.0</token>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
5 <token name="@VERSION_SUFFIX@">0</token>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
6 <token name="@MIN_DB_VERSION@">1.2</token> <!-- https://portal.nersc.gov/genomad/__data__/releases.txt -->
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
7 <xml name="summary_output_macro" tokens="type">
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
8 <data name="summary_@TYPE@_fna" format="fasta" from_work_dir="output/sequence_summary/sequence_@TYPE@.fna" label="${tool.name} on ${on_string}: @TYPE@ fasta"/>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
9 <data name="summary_@TYPE@_genes" format="tabular" from_work_dir="output/sequence_summary/sequence_@TYPE@_genes.tsv" label="${tool.name} on ${on_string}: @TYPE@ genes">
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
10 <actions>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
11 <action name="column_names" type="metadata" default="gene,start,end,length,strand,gc_content,genetic_code,rbs_motif,marker,evalue,bitscore,uscg,plasmid_hallmark,virus_hallmark,taxid,taxname,annotation_conjscan,annotation_amr,annotation_accessions,annotation_description"/>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
12 </actions>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
13 </data>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
14 <data name="summary_@TYPE@_proteins" format="fasta" from_work_dir="output/sequence_summary/sequence_@TYPE@_proteins.faa" label="${tool.name} on ${on_string}: @TYPE@ proteins fasta"/>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
15 <data name="summary_@TYPE@_summary" format="tabular" from_work_dir="output/sequence_summary/sequence_@TYPE@_summary.tsv" label="${tool.name} on ${on_string}: @TYPE@ summary">
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
16 <actions>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
17 <action name="column_names" type="metadata" default="seq_name,length,topology,coordinates,n_genes,genetic_code,virus_score,fdr,n_hallmarks,marker_enrichment,taxonomy" />
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
18 </actions>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
19 </data>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
20 </xml>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
21 </macros>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
22 <xrefs>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
23 <xref type="bio.tools">genomad</xref>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
24 </xrefs>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
25 <requirements>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
26 <requirement type="package" version="@TOOL_VERSION@">genomad</requirement>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
27 </requirements>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
28 <version_command><![CDATA[genomad end-to-end --version | cut -f 3 -d " "]]></version_command>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
29 <command detect_errors="exit_code"><![CDATA[
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
30 ## symlink sequence (to make output directory names predictable)
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
31 ln -s '$INPUT' sequence.fa &&
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
32 mkdir output/ &&
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
33 genomad end-to-end
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
34 $filter_cond.filtering_preset
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
35 #if $filter_cond.filtering_preset == ''
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
36 --min-score $filter_cond.min_score
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
37 --max-fdr $filter_cond.max_fdr
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
38 --min-plasmid-marker-enrichment $filter_cond.min_plasmid_marker_enrichment
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
39 --min-virus-marker-enrichment $filter_cond.min_virus_marker_enrichment
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
40 --min-plasmid-hallmarks $filter_cond.min_plasmid_hallmarks
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
41 --min-plasmid-hallmarks-short-seqs $filter_cond.min_plasmid_hallmarks_short_seqs
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
42 --min-virus-hallmarks $filter_cond.min_virus_hallmarks
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
43 --min-virus-hallmarks-short-seqs $filter_cond.min_virus_hallmarks_short_seqs
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
44 --max-uscg $filter_cond.max_uscg
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
45 #end if
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
46 --threads \${GALAXY_SLOTS:-4}
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
47 $basic.disable_find_proviruses
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
48 $basic.disable_nn_classification
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
49 $basic.enable_score_calibration
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
50 $annotation.conservative_taxonomy
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
51 --sensitivity $annotation.sensitivity
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
52 --splits $annotation.splits
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
53 $provirus.skip_integrase_identification
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
54 $provirus.skip_trna_identification
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
55 --composition $score.composition
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
56 $score.force_auto
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
57 sequence.fa
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
58 output/
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
59 '$DATABASE.fields.path'
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
60 ]]></command>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
61 <inputs>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
62 <param argument="INPUT" type="data" format="fasta" label="Input sequences" help="geNomad will work for isolate genomes, metagenomes, and metatranscriptomes"/>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
63 <param name="DATABASE" type="select" label="Reference data" help="">
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
64 <options from_data_table="genomad"/>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
65 <!-- TODO needs to be activated with https://github.com/galaxyproject/galaxy/pull/18411
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
66 <validator type="in_range" min="@MIN_DB_VERSION@"/> -->
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
67 </param>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
68 <conditional name="filter_cond">
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
69 <param name="filtering_preset" type="select" label="Filtering presets" help="After classification, sequences are further filtered to remove possible false positives. The --conservative preset makes those filters even more aggressive, resulting in more restricted sets of plasmid and virus, containing only sequences whose classification is strongly supported. The --relaxed preset disables all post-classification filters.">
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
70 <option value="--conservative">Conservative (--conservative)</option>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
71 <option value="--relaxed">Relaxed (--relaxed)</option>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
72 <option value="">Manual</option>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
73 </param>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
74 <when value="--conservative"/>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
75 <when value="--relaxed"/>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
76 <when value="">
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
77 <param argument="--min-score" type="float" min="0" max="1" value="0.7" label="Minimum score to flag a sequence as virus or plasmid" help=""/>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
78 <param argument="--max-fdr" type="float" min="0" max="1" value="0.1" label="Maximum false discovery rate" help="This option will be ignored if the scores were not calibrated"/>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
79 <param argument="--min-plasmid-marker-enrichment" type="float" value="0.1" label="Minimum allowed value for the plasmid marker enrichment score" help="This enrichment score represents the total enrichment of plasmid markers in the sequence. Sequences with multiple plasmid markers will have higher values than the ones that encode few or no markers. This option will be ignored if the annotation module was not executed." />
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
80 <param argument="--min-virus-marker-enrichment" type="float" value="0.0" label="Minimum allowed value for the virus marker enrichment score" help="This enrichment score represents the total enrichment of virus markers in the sequence. Sequences with multiple virus markers will have higher values than the ones that encode few or no markers. This option will be ignored if the annotation module was not executed." />
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
81 <param argument="--min-plasmid-hallmarks" type="integer" min="0" value="0" label="minimum number of plasmid hallmarks in the identified plasmids" help="this option will be ignored if the annotation module was not executed." />
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
82 <param argument="--min-plasmid-hallmarks-short-seqs" type="integer" min="0" value="1" label="minimum number of plasmid hallmarks in plasmids shorter than 2,500 bp" help="this option will be ignored if the annotation module was not executed." />
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
83 <param argument="--min-virus-hallmarks" type="integer" min="0" value="0" label="minimum number of virus hallmarks in the identified viruses" help="this option will be ignored if the annotation module was not executed." />
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
84 <param argument="--min-virus-hallmarks-short-seqs" type="integer" min="0" value="1" label="minimum number of virus hallmarks in viruses shorter than 2,500 bp" help="this option will be ignored if the annotation module was not executed." />
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
85 <param argument="--max-uscg" type="integer" value="4" label="Maximum allowed number of universal single copy genes (USCGs) in a virus or a plasmid." help="Sequences with more than this number of USCGs will not be classified as viruses or plasmids, regardless of their score. This option will be ignored if the annotation module was not executed." />
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
86 </when>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
87 </conditional>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
88 <section name="basic" title="basic options" expanded="true">
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
89 <param argument="--disable-find-proviruses" type="boolean" truevalue="" falsevalue="--disable-find-proviruses" checked="true" label="Execute the find-proviruses module" help="" />
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
90 <param argument="--disable-nn-classification" type="boolean" truevalue="" falsevalue="--disable-nn-classification" checked="true" label="Execute the nn-classification module" help="" />
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
91 <param argument="--enable-score-calibration" type="boolean" truevalue="--enable-score-calibration" falsevalue="" checked="false" label="Execute the score-calibration module" help="" />
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
92 </section>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
93 <section name="annotation" title="annotation options" expanded="true">
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
94 <param argument="--conservative-taxonomy" type="boolean" truevalue="--conservative-taxonomy" falsevalue="" checked="false" label="More conservative virus taxonomic assignment" help="This might reduce the amount of genomes assigned to the family level, but will decrease the rate of family misassignment" />
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
95 <param argument="--sensitivity" type="float" min="0" value="4.2" label="MMseqs2 marker search sensitivity" help="Higher values will annotate more proteins, but the search will be slower and consume more memory" />
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
96 <param argument="--splits" type="integer" min="0" value="0" label="Split the data for the MMseqs2 search." help="Higher values will reduce memory usage, but will make the search slower. If the MMseqs2 search is failing, try to increase the number of splits. Consult your Galaxy admin if more memory may be used" />
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
97 </section>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
98 <section name="provirus" title="find-proviruses options" expanded="true">
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
99 <param argument="--skip-integrase-identification" type="boolean" truevalue="--skip-integrase-identification" falsevalue="" checked="false" label="Disable provirus boundary extension using nearby integrases" />
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
100 <param argument="--skip-trna-identification" type="boolean" truevalue="--skip-trna-identification" falsevalue="" checked="false" label="Disable provirus boundary extension using nearby tRNAs" />
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
101 </section>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
102 <section name="score" title="score-calibration options" expanded="true">
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
103 <param argument="--composition" type="select" label="Method for estimating sample composition" >
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
104 <option value="auto" selected="true">auto</option>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
105 <option value="metagenome">metagenome</option>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
106 <option value="virome">virome</option>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
107 </param>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
108 <param argument="--force-auto" type="boolean" truevalue="--force-auto" falsevalue="" checked="false" label="Force automatic composition estimation" help="regardless of the sample size" />
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
109 </section>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
110 </inputs>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
111 <outputs>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
112 <expand macro="summary_output_macro" type="plasmid"/>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
113 <expand macro="summary_output_macro" type="virus"/>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
114 </outputs>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
115 <tests>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
116 <test>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
117 <param name="INPUT" value="GCF_009025895.1_ASM902589v1_genomic.fna" ftype="fasta"/>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
118 <param name="DATABASE" value="1.2"/>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
119 <section name="annotation">
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
120 <param name="splits" value="8"/><!-- needed for low mem CI-->
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
121 </section>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
122 <output name="summary_plasmid_fna">
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
123 <assert_contents>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
124 <has_line_matching expression="^>.*" n="5"/>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
125 </assert_contents>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
126 </output>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
127 <output name="summary_plasmid_genes">
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
128 <assert_contents>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
129 <has_n_lines n="336"/>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
130 <has_n_columns n="20"/>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
131 </assert_contents>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
132 </output>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
133 <output name="summary_plasmid_proteins">
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
134 <assert_contents>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
135 <has_line_matching expression="^>.*" n="335"/>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
136 </assert_contents>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
137 </output>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
138 <output name="summary_plasmid_summary">
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
139 <assert_contents>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
140 <has_n_lines n="6"/>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
141 <has_n_columns n="11"/>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
142 </assert_contents>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
143 </output>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
144 <output name="summary_virus_fna">
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
145 <assert_contents>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
146 <has_line_matching expression="^>.*" n="1"/>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
147 </assert_contents>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
148 </output>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
149 <output name="summary_virus_genes">
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
150 <assert_contents>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
151 <has_n_lines n="58"/>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
152 <has_n_columns n="20"/>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
153 </assert_contents>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
154 </output>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
155 <output name="summary_virus_proteins">
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
156 <assert_contents>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
157 <has_line_matching expression="^>.*" n="57"/>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
158 </assert_contents>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
159 </output>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
160 <output name="summary_virus_summary">
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
161 <assert_contents>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
162 <has_n_lines n="2"/>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
163 <has_n_columns n="11"/>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
164 </assert_contents>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
165 </output>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
166 </test>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
167 </tests>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
168 <help><![CDATA[
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
169
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
170 geNomad is a tool that identifies virus and plasmid genomes from nucleotide sequences.
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
171 For details on the function refer to the citation or https://portal.nersc.gov/genomad/index.html.
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
172
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
173 This Galaxy tool executes the end-to-end geNomad workflow.
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
174
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
175 Usage
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
176 .....
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
177
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
178
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
179 **Input**
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
180
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
181 Any FASTA file containing nucleotide sequences as input. geNomad will work for isolate genomes, metagenomes, and metatranscriptomes.
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
182 In addition you need to select a reference database that has to be installed by your Galaxy admin.
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
183
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
184
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
185 **Output**
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
186
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
187 plasmid/virus summary with the following columns
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
188
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
189 * seq_name: The identifier of the sequence in the input FASTA file. Proviruses will have the following name scheme: <sequence_identifier>|provirus_<start_coordinate>_<end_coordinate>.
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
190 * length: Length of the sequence (or the provirus, in the case of integrated viruses).
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
191 * topology: Topology of the viral sequence. Possible values are: No terminal repeats, DTR (direct terminal repeats), ITR (inverted terminal repeats), or Provirus (viruses integrated in host genomes).
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
192 * coordinates: 1-indexed coordinates of the provirus region within host sequences. Will be NA for viruses that were not predicted to be integrated.
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
193 * n_genes: Number of genes encoded in the sequence.
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
194 * genetic_code: Predicted genetic code. Possible values are: 11 (standard code for Bacteria and Archaea), 4 (recoded TGA stop codon), or 15 (recoded TAG stop codon).
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
195 * virus_score: A measure of how confident geNomad is that the sequence is a virus. Sequences that have scores close to 1.0 are more likely to be viruses than the ones that have lower scores.
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
196 * fdr: The estimated false discovery rate (FDR) of the classification (that is, the expected proportion of false positives among the sequences up to this row). To estimate FDRs geNomad requires score calibration, which is turned off by default. Therefore, this column will only contain NA values unless score calibration is enabled.
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
197 * n_hallmarks: Number of genes that matched a hallmark geNomad marker. Hallmarks are genes that were previously associated with viral function and their presence is a strong indication that the sequence is indeed a virus.
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
198 * marker_enrichment: A score that represents the total enrichment of viral markers in the sequence. The value goes up as the number of virus markers in the sequence increases, so sequences with multiple markers will have higher scores. Chromosome and plasmid markers will reduce the score.
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
199 * taxonomy: Taxonomic assignment of the virus genome. Lineages follow the taxonomy contained in ICTV's VMR number 19. Viruses can be taxonomically assigned up to the family level, but not to specific genera or species within that family. The taxonomy is presented with a fixed number of fields (corresponding to taxonomic ranks) separated by semicolons, with empty fields left blank.
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
200
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
201 The plasmid-specific summary lacks the coordinates and taxonomy columns and has two additional columns:
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
202
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
203 * conjugation_genes: Genes that might be involved in conjugation. It's important to note that the presence of such genes is not sufficient to tell whether a given plasmid is conjugative or mobilizable. If you are interested in identifying conjugative plasmids, we recommend you to analyze the plasmids you identified using geNomad with CONJscan.
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
204 * amr_genes: Genes annotated with an antimicrobial resistance function. You can check the specific functions associated with each accession on the AMRFinderPlus website.
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
205
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
206
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
207 plasmid/virus genes: During its execution, geNomad annotates the genes encoded by the input sequences using a database of chromosome, plasmid, and virus-specific markers. The <prefix>_virus_genes.tsv file summarizes the annotation of the genes encoded by the identified viruses.
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
208
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
209 * gene: Identifier of the gene (<sequence_name>_<gene_number>). Usually, gene numbers start with 1 (first gene in the sequence). However, genes encoded by prophages integrated in the middle of the host chromosome may start with a different number, depending on its position within the chromosome.
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
210 * start: 1-indexed start coordinate of the gene.
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
211 * end: 1-indexed end coordinate of the gene.
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
212 * length: Length of the gene locus (in base pairs).
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
213 * strand: Strand that encodes the gene. Can be 1 (direct strand) or -1 (reverse strand).
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
214 * gc_content: GC content of the gene locus.
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
215 * genetic_code: Predicted genetic code (see details in the explanation of the summary file).
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
216 * rbs_motif: Detected motif of the ribosome-binding site.
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
217 * marker: Best matching geNomad marker. If this gene doesn't match any markers, the value will be NA.
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
218 * evalue: E-value of the alignment between the protein encoded by the gene and the best matching geNomad marker.
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
219 * bitscore: Bitscore of the alignment between the protein encoded by the gene and the best matching geNomad marker.
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
220 * uscg: Whether the marker assigned to this gene corresponds to a universal single-copy gene (USCG, as defined in BUSCO v5). These genes are expected to be found in chromosomes and are rare in plasmids and viruses. Can be 1 (gene is USCG) or 0 (gene is not USCG).
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
221 * plasmid_hallmark: Whether the marker assigned to this gene represents a plasmid hallmark.
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
222 * virus_hallmark: Whether the marker assigned to this gene represents a virus hallmark.
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
223 * taxid: Taxonomic identifier of the marker assigned to this gene (you can ignore this as it is meant to be used internally by geNomad).
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
224 * taxname: Name of the taxon associated with the assigned geNomad marker. For example, if the annotated proteins of a provirus are all characteristic of Caudoviricetes, the provirus is assigned to this class.
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
225 * annotation_conjscan: If the marker that matched the gene is a conjugation-related gene (as defined in CONJscan) this field will show which CONJscan accession was assigned to the marker.
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
226 * annotation_amr: If the marker that matched the gene was annotated with an antimicrobial resistance (AMR) function (as defined in NCBIfam-AMRFinder), this field will show which NCBIfam accession was assigned to the marker.
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
227 * annotation_accessions: Some of the geNomad markers are functionally annotated. This column tells you which entries in Pfam, TIGRFAM, COG, and KEGG were assigned to the marker.
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
228 * annotation_description: A text describing the function assigned to the marker.
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
229
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
230
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
231 plasmid/virus genes/proteins: gives the nucleotide and amino acid sequences of the annotated genes
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
232
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
233 ]]></help>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
234 <citations>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
235 <citation type="doi">10.1038/s41587-023-01953-y</citation>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
236 </citations>
955e33326e20 planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/longorf/ commit 483ade5362574a59ddc87e3788334bcbff253805
ufz
parents:
diff changeset
237 </tool>