comparison gemini_macros.xml @ 0:3123ce7acd0e draft

planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gemini commit 62ed732cba355e695181924a8ed4cce49ca21c59
author iuc
date Fri, 11 Jan 2019 17:50:55 -0500
parents
children 2c68e29c3527
comparison
equal deleted inserted replaced
-1:000000000000 0:3123ce7acd0e
1 <macros>
2 <!-- GEMINI release; used as the version of the gemini package requirement and in the help text and version filter of the "infile" macro -->
3 <token name="@VERSION@">0.20.1</token>
4 <!-- Minimal annotation data version required by this GEMINI release; the "annotation_dir" macro only offers data table entries whose column 2 equals this value -->
5 <token name="@DB_VERSION@">200</token>
6
<!-- Requirements shared by the tools expanding this macro: the gemini package at the version given by the VERSION token. The yield lets an expanding tool append further requirement elements. -->
7 <xml name="requirements">
8 <requirements>
9 <requirement type="package" version="@VERSION@">gemini</requirement>
10 <yield />
11 </requirements>
12 </xml>
13
<!-- Version command shared by the gemini tools: runs the gemini executable with its version option. -->
14 <xml name="version_command">
15 <version_command>gemini --version</version_command>
16 </xml>
17
<!-- Error detection rules: exit codes of 1 and above or of -1 and below, and tool output matching "Error:" or "Exception:", are flagged. The yield lets an expanding tool add further rules. -->
18 <xml name="stdio">
19 <stdio>
20 <exit_code range="1:" />
21 <exit_code range=":-1" />
22 <regex match="Error:" />
23 <regex match="Exception:" />
24 <yield />
25 </stdio>
26 </xml>
27
<!-- Citation list holding the DOI 10.1371/journal.pcbi.1003153; the yield lets an expanding tool append more citations. -->
28 <xml name="citations">
29 <citations>
30 <citation type="doi">10.1371/journal.pcbi.1003153</citation>
31 <yield />
32 </citations>
33 </xml>
34
<!-- Select parameter listing the entries of the gemini_versioned_databases data table, sorted by column 0 and restricted to rows whose column 2 equals the DB_VERSION token. -->
35 <xml name="annotation_dir">
36 <param name="annotation_databases" label="Choose a gemini annotation source" type="select">
37 <options from_data_table="gemini_versioned_databases">
38 <filter column="0" type="sort_by" />
39 <filter column="2" type="static_value" value="@DB_VERSION@" />
40 </options>
41 </param>
42 </xml>
43
<!-- Input dataset parameter for a GEMINI database (gemini.sqlite format). Its options are filtered on the metadata.gemini_version attribute of the datasets, with the VERSION token added as the filter value. -->
44 <xml name="infile">
45 <param name="infile" type="data" format="gemini.sqlite" label="GEMINI database" help="Only files with version @VERSION@ are accepted.">
46 <options options_filter_attribute="metadata.gemini_version">
47 <filter value="@VERSION@" type="add_value" />
48 </options>
49 </param>
50 </xml>
51
<!-- Boolean switch, checked by default, whose value is the header flag when set and an empty string otherwise. -->
52 <xml name="add_header_column">
53 <param name="header" argument="--header" type="boolean" checked="True" truevalue="--header" falsevalue=""
54 label="Add a header of column names to the output" />
55 </xml>
56
<!-- Conditional "report" selecting the columns of the variant report. Tokens: help (help text of the selector, empty by default) and minimalset (default "variant_id, gene"). "minimal" carries the minimalset token as a hidden "columns" value and an empty hidden "extra_cols"; "full" defines no further parameters; "custom" offers a checkbox list of columns plus a free-text "extra_cols" field that is sanitized with the sanitize_query macro. -->
57 <xml name="column_filter" token_help="" token_minimalset="variant_id, gene">
58 <conditional name="report">
59 <param name="report_selector" type="select"
60 label="Set of columns to include in the variant report table"
61 help="@HELP@">
62 <option value="minimal">Minimal (report only a preconfigured minimal set of columns)</option>
63 <option value="full">Full (report all columns defined in the GEMINI database variants table)</option>
64 <option value="custom">Custom (report user-specified columns)</option>
65 </param>
66 <when value="full" />
67 <when value="minimal">
68 <param name="columns" type="hidden" value="@MINIMALSET@" />
69 <param name="extra_cols" type="hidden" value="" />
70 </when>
71 <when value="custom">
72 <param name="columns" type="select" display="checkboxes" multiple="true" optional="true"
73 label="Choose columns to include in the report" help="(--columns)">
74 <option value="gene">gene</option>
75 <option value="chrom">chrom</option>
76 <option value="start">start</option>
77 <option value="end">end</option>
78 <option value="ref">ref</option>
79 <option value="alt">alt</option>
80 <option value="impact">impact</option>
81 <option value="impact_severity">impact_severity</option>
82 <option value="max_aaf_all">alternative allele frequency (max_aaf_all)</option>
83 </param>
84 <param name="extra_cols" type="text"
85 label="Additional columns (comma-separated)"
86 help="Columns must be specified by the exact names they have in the GEMINI database, e.g., is_exonic or num_hom_alt, but, for genotype columns, GEMINI wildcard syntax is supported. The order of columns in the list is maintained in the output.">
87 <expand macro="sanitize_query" />
88 </param>
89 </when>
90 </conditional>
91 </xml>
92
<!-- Free-text parameter "filter" for extra SQL constraints, sanitized with the sanitize_query macro. The command-line flag shown for it comes from the argument token. -->
93 <xml name="filter" token_argument="--filter">
94 <param name="filter" argument="@ARGUMENT@" type="text"
95 label="Additional constraints expressed in SQL syntax"
96 help="Constraints defined here will become the WHERE clause of the SQL query issued to the GEMINI database. E.g. alt='G' or impact_severity = 'HIGH'.">
97 <expand macro="sanitize_query" />
98 </param>
99 </xml>
100
<!-- Sanitizer for SQL-like text input. Every printable character is valid except the single quote, which is instead mapped to the sequence '"'"' ; any other invalid character is replaced by an empty string. NOTE(review): the mapping presumably exists because the templates in this file place such values inside single quotes on the command line; confirm against the tools using it. -->
101 <xml name="sanitize_query">
102 <sanitizer invalid_char="">
103 <valid initial="string.printable">
104 <remove value="&apos;" />
105 </valid>
106 <mapping initial="none">
107 <add source="&apos;" target="&apos;&quot;&apos;&quot;&apos;" />
108 </mapping>
109 </sanitizer>
110 </xml>
111
<!-- Unchecked-by-default boolean "lenient". The flag shown for it, the value emitted when it is set, and its help text are all supplied through tokens; an unset switch yields an empty string. -->
112 <xml name="lenient" token_argument="--lenient" token_truevalue="--lenient" token_help="The exact consequence of this setting depends on the type of inheritance pattern you are looking for (see the tool help below).">
113 <param name="lenient" argument="@ARGUMENT@" type="boolean" checked="False" truevalue="@TRUEVALUE@" falsevalue=""
114 label="Include hits with less convincing inheritance patterns"
115 help="@HELP@" />
116 </xml>
117
<!-- Unchecked-by-default boolean "allow_unaffected"; when set its value is the allow-unaffected flag, otherwise an empty string. -->
118 <xml name="unaffected">
119 <param name="allow_unaffected" argument="--allow-unaffected" type="boolean" checked="False" truevalue="--allow-unaffected" falsevalue=""
120 label="Report candidates shared by unaffected samples"
121 help="Activating this option will enable the reporting of variants as candidate causative even if they are shared by unaffected samples in the family tree. The default will only report variants that are unique to affected samples." />
122 </xml>
123
<!-- Integer parameter "min_kindreds" with default 1 and lower bound 1; label and help text are tokens so that expanding macros can reword them. -->
124 <xml name="min_kindreds" token_label="Minimum number of families with a candidate variant for a gene to be reported" token_help="This is the number of families required to have a variant fitting the inheritance model in the same gene in order for the gene and its variants to be reported. For example, we may only be interested in candidates where at least 4 families have a variant (with a fitting inheritance pattern) in that gene.">
125 <param name="min_kindreds" argument="--min-kindreds" type="integer" min="1" value="1"
126 label="@LABEL@"
127 help="@HELP@" />
128 </xml>
129
<!-- Repeat block "constraint" wrapping the parameter of the "filter" macro. It starts with zero instances and allows at most max_repeat of them (token, default 1). The yield lets an expanding tool add parameters to each instance. -->
130 <xml name="insert_constraint" token_max_repeat="1">
131 <repeat name="constraint" title="Additional constraints on variants" default="0" max="@MAX_REPEAT@">
132 <expand macro="filter" />
133 <yield />
134 </repeat>
135 </xml>
136
<!-- Unchecked-by-default boolean "overwrite_default_filter" with which the user chooses whether a custom constraint replaces the default constraint of the tool. The default_where token (empty by default) is interpolated into the help text to describe that default. -->
137 <xml name="overwritable_where_default" token_default_where="">
138 <param name="overwrite_default_filter" type="boolean" checked="false"
139 label="Overwrite the default constraint of this tool"
140 help="By default, this tool restricts its analysis to @DEFAULT_WHERE@ and this constraint is applied on top of any constraint expressed above. With this option here selected, your custom constraint, if given, will overwrite the default instead." />
141 </xml>
142
<!-- Repeat block "filter_by_genotype" whose default, minimum and maximum instance counts are tokens (0, 0 and 1 by default). Each instance holds a text area for a genotype filter expression that is sanitized with sanitize_query and must not be blank. The yield lets an expanding tool add parameters to each instance. -->
143 <xml name="gt_filter" token_default_repeat="0" token_min_repeat="0" token_max_repeat="1">
144 <repeat name="filter_by_genotype" title="Genotype filter expression" min="@MIN_REPEAT@" max="@MAX_REPEAT@" default="@DEFAULT_REPEAT@">
145 <param name="gt_filter" argument="--gt-filter" type="text" area="True" size="5x50" value=""
146 label="Restrictions to apply to genotype values" help="">
147 <expand macro="sanitize_query" />
148 <validator message="Genotype filter expression cannot be empty" type="expression">value.strip()</validator>
149 </param>
150 <yield />
151 </repeat>
152 </xml>
153
<!-- Repeat block "filter_by_sample" (zero or one instance) for filtering variants through a query on the sample table. Each instance holds the sample filter expression (sanitized with sanitize_query, must not be blank), the "in" select whose option values are the literal command-line fragments, the min_kindreds parameter with a label reworded for this context, and the family-wise switch. -->
154 <xml name="sample_filter">
155 <repeat name="filter_by_sample" title="Sample filter expression" default="0" max="1">
156 <param argument="--sample-filter" name="sample_filter" type="text" area="True" size="5x50"
157 label="SQL filter to use to filter the sample table" help="">
158 <expand macro="sanitize_query" />
159 <validator type="expression" message="Sample filter expression cannot be empty">value.strip()</validator>
160 </param>
161 <param argument="--in" name="in" type="select"
162 label="A variant must be in either all, none or any samples passing the sample-query filter"
163 help="">
164 <option value="">Return a variant if it is found in any sample passing the sample filter. (default) </option>
165 <option value="--in all">Return a variant if it is found in ALL samples passing the sample filter. (all)</option>
166 <option value="--in none">Return a variant if it is found in NO sample passing the sample filter. (none)</option>
167 <option value="--in only">Return a variant if it is found in any sample passing the sample filter, and in NO sample NOT passing it. (only)</option>
168 <option value="--in only all">Return a variant if it is found in ALL samples passing the sample filter, and in NO sample NOT passing it. (only all)</option>
169 </param>
170 <expand macro="min_kindreds"
171 label="Minimum number of families in which a variant must pass the sample filter" help=""/>
172 <param argument="--family-wise" name="family_wise" type="boolean" truevalue="--family-wise" falsevalue="" checked="False"
173 label="Apply the sample-filter on a family-wise basis" help="If a variant passes the sample filter in at least the minimum number of families specified above it is retained." />
174 </repeat>
175 </xml>
176
<!-- Repeat block "regions" (no instance by default) describing genomic regions. Each instance has a mandatory chromosome name and optional start and end positions; a position, when given, must consist of digits only. -->
177 <xml name="region_filter">
178 <repeat name="regions" title="Region Filter" min="0" default="0"
179 help="Filter variant sites by their position in the genome. If multiple Region Filters are specified, all variants that fall in ONE of the regions are reported.">
180 <param name="chrom" label="Chromosome" type="text">
181 <validator message="A chromosome identifier is required when specifying a region filter" type="expression">value.strip()</validator>
182 </param>
183 <param name="start" label="Region Start" type="text">
184 <validator message="an integer number is required" type="expression">not value or value.isdigit()</validator>
185 </param>
186 <param name="stop" label="Region End" type="text">
187 <validator message="an integer number is required" type="expression">not value or value.isdigit()</validator>
188 </param>
189 </repeat>
190 </xml>
191
<!-- Shell prologue for commands needing annotation data: creates a "gemini" directory, links the gemini/data folder of the selected annotation source into it as gemini/data, and exports GEMINI_CONFIG set to the path of that annotation source. The text ends with a command separator, so another command has to follow it. Relies on the "annotation_databases" parameter defined by the annotation_dir macro. -->
192 <token name="@PROVIDE_ANNO_DATA@"><![CDATA[
193 mkdir gemini &&
194 ln -s '${annotation_databases.fields.path}/gemini/data' gemini/data &&
195 export GEMINI_CONFIG='${annotation_databases.fields.path}' &&
196 ]]></token>
197
<!-- Cheetah snippet that turns a multi-line SQL expression into one command-line argument. It reads the variables multiline_sql_expr and cmdln_param, which the including template has to set beforehand. The expression is stripped; if anything remains, CRLF and lone CR line endings are converted to LF, each backslash followed by a newline is replaced by a space, and cmdln_param is emitted followed by the expression in single quotes. -->
198 <token name="@MULTILN_SQL_EXPR_TO_CMDLN@">
199 #set $sql_expr = str($multiline_sql_expr).strip()
200 #if str($sql_expr):
201 #set $sql_expr = $sql_expr.replace('\r\n', '\n')
202 #set $sql_expr = $sql_expr.replace('\r', '\n')
203 #set $sql_expr = $sql_expr.replace('\\\n', ' ')
204 $cmdln_param '$sql_expr'
205 #end if
206 </token>
207
<!-- Cheetah snippet that sets the variable cols from the "report" conditional of the column_filter macro. cols is "*" when the full report is selected. Otherwise it is the selected columns followed by any extra columns, joined with a comma and a space, and it falls back to "variant_id, gene" when both are empty. -->
208 <token name="@SET_COLS@">
209 #if str($report.report_selector) == 'full':
210 #set $cols = "*"
211 #else:
212 #if $report.columns and str($report.columns) != '':
213 #set $cols = str($report.columns)
214 #else:
215 #set $cols = ''
216 #end if
217 #if str($report.extra_cols).strip():
218 #if $cols:
219 #set $cols = $cols + ', ' + str($report.extra_cols)
220 #else:
221 #set $cols = str($report.extra_cols)
222 #end if
223 #end if
224 #if not $cols:
225 #set $cols = "variant_id, gene"
226 #end if
227 #end if
228 </token>
229
<!-- Cheetah snippet that first computes cols through the SET_COLS token and then emits the columns option with the single-quoted column list, unless cols is "*" (all columns), in which case nothing is emitted. -->
230 <token name="@COLUMN_SELECT@">
231 @SET_COLS@
232 #if $cols != "*"
233 --columns '$cols'
234 #end if
235 </token>
236
<!-- Cheetah snippet that builds the list region_elements from the "regions" repeat of the region_filter macro. Each region becomes one parenthesized SQL condition: an equality test on chrom (the stripped chromosome name wrapped in escaped single quotes), plus "start >= N" and "end <= N" terms when a start or stop value was entered, all joined with AND. The snippet emits no text itself; the including template is expected to use region_elements afterwards. -->
237 <token name="@PARSE_REGION_ELEMENTS@"><![CDATA[
238 #set $region_elements = []
239 #for $r in $regions:
240 ## The actual chromosome name needs to be single-quoted
241 ## in SQL, so we need to quote the single quotes like the
242 ## sanitize_query macro would if the whole was a parameter.
243 #set $r_elements = ["chrom = '\"'\"'%s'\"'\"'" % str($r.chrom).strip()]
244 #if str($r.start).strip():
245 #silent $r_elements.append("start >= %d" % int($r.start))
246 #end if
247 #if str($r.stop).strip():
248 #silent $r_elements.append("end <= %d" % int($r.stop))
249 #end if
250 #silent $region_elements.append("(%s)" % " AND ".join($r_elements))
251 #end for
252 ]]>
253 </token>
254 </macros>