comparison dnadiff.xml @ 0:491b007eec5d draft default tip

Uploaded
author greg
date Mon, 27 Feb 2023 20:02:43 +0000
parents
children
comparison
equal deleted inserted replaced
-1:000000000000 0:491b007eec5d
<tool id="mummer_dnadiff" name="DNAdiff" version="@TOOL_VERSION@+galaxy@VERSION_SUFFIX@" profile="@PROFILE@">
    <description>Evaluate similarities/differences between two sequences</description>
    <!-- Version tokens, requirements, bio.tools reference and citation are all expanded from macros.xml. -->
    <macros>
        <import>macros.xml</import>
    </macros>
    <expand macro="bio_tools"/>
    <expand macro="requirements"/>
    <!--
        Links the selected reference (history dataset, or the path column of the
        chosen all_fasta entry) and the query into the job working directory under
        fixed names, then runs dnadiff on them. The outputs declared below are
        collected from the out.* files in the working directory.
        The report_only parameter is not used here: it only decides which of the
        outputs are collected (see the output filters).
        All dataset paths are single-quoted and every symlink uses -f so the three
        ln calls behave the same way.
    -->
    <command detect_errors="exit_code">
        <![CDATA[
        #if $reference_source.reference_source_selector == 'history':
            ln -f -s '$reference_source.reference_sequence' reference.fa &&
        #else:
            ln -f -s '$reference_source.reference_sequence.fields.path' reference.fa &&
        #end if
        ln -f -s '$query_sequence' query.fa &&
        dnadiff 'reference.fa' 'query.fa'
        ]]>
    </command>
    <inputs>
        <!-- The reference is either an entry of the all_fasta data table or a FASTA dataset from the history. -->
        <conditional name="reference_source">
            <param name="reference_source_selector" type="select" label="Select a reference genome from your history or select a cached reference genome?">
                <option value="cached">Select a cached reference genome</option>
                <option value="history">Select a reference genome from the history</option>
            </param>
            <when value="cached">
                <param name="reference_sequence" type="select" label="Using reference genome" help="Select genome from the list">
                    <options from_data_table="all_fasta">
                        <filter type="sort_by" column="2"/>
                        <validator type="no_options" message="No reference genomes are available"/>
                    </options>
                    <validator type="no_options" message="A cached reference genome is not available for the build associated with the selected input file"/>
                </param>
            </when>
            <when value="history">
                <param name="reference_sequence" type="data" format="fasta" label="Use the following dataset as the reference genome" help="You can upload a FASTA or multi-Fasta file to your history and use it as reference"/>
            </when>
        </conditional>
        <param name="query_sequence" type="data" format="fasta" label="Query Sequence(s)" help="FastA or multi-FastA"/>
        <!-- 'yes' keeps only the report output; 'no' additionally collects the eight filtered outputs below. -->
        <param name="report_only" type="select" label="Output only the general report file?" help="Select no to output all output files">
            <option value="yes">YES</option>
            <option value="no">NO</option>
        </param>
    </inputs>
    <outputs>
        <!-- The report is always produced; every other output is only collected when report_only is 'no'. -->
        <data name="report" format="txt" from_work_dir="out.report" label="${tool.name} on ${on_string}: report"/>
        <data name="delta" format="tabular" from_work_dir="out.delta" label="${tool.name} on ${on_string}: delta">
            <filter>report_only == 'no'</filter>
        </data>
        <data name="delta1" format="tabular" from_work_dir="out.1delta" label="${tool.name} on ${on_string}: 1delta">
            <filter>report_only == 'no'</filter>
        </data>
        <data name="mdelta" format="tabular" from_work_dir="out.mdelta" label="${tool.name} on ${on_string}: mdelta">
            <filter>report_only == 'no'</filter>
        </data>
        <data name="coords1" format="tabular" from_work_dir="out.1coords" label="${tool.name} on ${on_string}: 1coords">
            <filter>report_only == 'no'</filter>
            <actions>
                <action name="column_names" type="metadata" default="[S1], [E1], [S2], [E2], [LEN 1], [LEN 2], [% IDY], [LEN R], [LEN Q], [COV R], [COV Q], [REF TAG], [QUERY TAG]"/>
            </actions>
        </data>
        <data name="mcoords" format="tabular" from_work_dir="out.mcoords" label="${tool.name} on ${on_string}: mcoords">
            <filter>report_only == 'no'</filter>
            <actions>
                <action name="column_names" type="metadata" default="[S1], [E1], [S2], [E2], [LEN 1], [LEN 2], [% IDY], [LEN R], [LEN Q], [COV R], [COV Q], [REF TAG], [QUERY TAG]"/>
            </actions>
        </data>
        <data name="snps" format="tabular" from_work_dir="out.snps" label="${tool.name} on ${on_string}: snps">
            <filter>report_only == 'no'</filter>
            <actions>
                <action name="column_names" type="metadata" default="[P1], [REF SUB], [QUERY SUB], [P2], [BUFF], [DIST], [LEN REF], [LEN QUERY], [REF FRAME], [QUERY FRAME], [REF TAG], [QUERY TAG]"/>
            </actions>
        </data>
        <data name="rdiff" format="tabular" from_work_dir="out.rdiff" label="${tool.name} on ${on_string}: rdiff">
            <filter>report_only == 'no'</filter>
            <actions>
                <action name="column_names" type="metadata" default="Seq ID, Feature Type, Feature Start, Feature End, Feature Length"/>
            </actions>
        </data>
        <data name="qdiff" format="tabular" from_work_dir="out.qdiff" label="${tool.name} on ${on_string}: qdiff">
            <filter>report_only == 'no'</filter>
            <actions>
                <action name="column_names" type="metadata" default="Seq ID, Feature Type, Feature Start, Feature End, Feature Length"/>
            </actions>
        </data>
    </outputs>
    <tests>
        <!-- Reference taken from the history, all nine outputs requested. -->
        <test expect_num_outputs="9">
            <conditional name="reference_source">
                <param name="reference_source_selector" value="history"/>
                <param name="reference_sequence" ftype="fasta" value="human_aqp3.fasta"/>
            </conditional>
            <param name="query_sequence" ftype="fasta" value="mouse_aqp3.fasta"/>
            <param name="report_only" value="no"/>
            <output name="report" ftype="txt" compare="diff" sort="true" lines_diff="2" value="report.txt"/>
            <output name="delta" ftype="tabular" compare="diff" lines_diff="2" value="delta.txt"/>
            <output name="delta1" ftype="tabular" compare="diff" lines_diff="2" value="1delta.txt"/>
            <output name="mdelta" ftype="tabular" compare="diff" lines_diff="2" value="mdelta.txt"/>
            <output name="coords1" ftype="tabular" compare="diff" value="1coords.txt"/>
            <output name="mcoords" ftype="tabular" compare="diff" value="mcoords.txt"/>
            <output name="snps" ftype="tabular" compare="diff" value="snps.txt"/>
            <output name="rdiff" ftype="tabular" compare="diff" value="rdiff.txt"/>
            <output name="qdiff" ftype="tabular" compare="diff" value="qdiff.txt"/>
        </test>
        <!-- Reference taken from the all_fasta data table, all nine outputs requested. -->
        <test expect_num_outputs="9">
            <conditional name="reference_source">
                <param name="reference_source_selector" value="cached"/>
                <param name="reference_sequence" value="human_aqp3"/>
            </conditional>
            <param name="query_sequence" ftype="fasta" value="mouse_aqp3.fasta"/>
            <param name="report_only" value="no"/>
            <output name="report" ftype="txt" compare="diff" sort="true" lines_diff="2" value="report.txt"/>
            <output name="delta" ftype="tabular" compare="diff" lines_diff="2" value="delta.txt"/>
            <output name="delta1" ftype="tabular" compare="diff" lines_diff="2" value="1delta.txt"/>
            <output name="mdelta" ftype="tabular" compare="diff" lines_diff="2" value="mdelta.txt"/>
            <output name="coords1" ftype="tabular" compare="diff" value="1coords.txt"/>
            <output name="mcoords" ftype="tabular" compare="diff" value="mcoords.txt"/>
            <output name="snps" ftype="tabular" compare="diff" value="snps.txt"/>
            <output name="rdiff" ftype="tabular" compare="diff" value="rdiff.txt"/>
            <output name="qdiff" ftype="tabular" compare="diff" value="qdiff.txt"/>
        </test>
        <!-- Report only: the eight filtered outputs must not be created. -->
        <test expect_num_outputs="1">
            <conditional name="reference_source">
                <param name="reference_source_selector" value="history"/>
                <param name="reference_sequence" ftype="fasta" value="human_aqp3.fasta"/>
            </conditional>
            <param name="query_sequence" ftype="fasta" value="mouse_aqp3.fasta"/>
            <param name="report_only" value="yes"/>
            <output name="report" ftype="txt" compare="diff" sort="true" lines_diff="2" value="report.txt"/>
        </test>
    </tests>
    <!-- The help body is reStructuredText: keep it flush left, and keep the blank line before the bullet list. -->
    <help><![CDATA[
This script is a wrapper around nucmer that builds an alignment using default parameters, and runs many of nucmer's helper scripts to process the output and report alignment statistics, SNPs, breakpoints, etc. It is designed for evaluating the sequence and structural similarity of two highly similar sequence sets. E.g. comparing two different assemblies of the same organism, or comparing two strains of the same species.

**Output files:**

* report: Summary of alignments, differences and SNPs
* delta: Standard nucmer alignment output
* 1delta: 1-to-1 alignment from delta-filter -1
* mdelta: M-to-M alignment from delta-filter -m
* 1coords: 1-to-1 coordinates from show-coords -THrcl .1delta
* mcoords: M-to-M coordinates from show-coords -THrcl .mdelta
* snps: SNPs from show-snps -rlTHC .1delta
* rdiff: Classified ref breakpoints from show-diff -rH .mdelta
* qdiff: Classified qry breakpoints from show-diff -qH .mdelta
    ]]></help>
    <expand macro="citation"/>
</tool>