0
|
1 <tool id="ngs_run_annotation" name="NGS Run Annotation">
|
|
2 <description>Create a SAM format header from run metadata for sample annotation.</description>
|
|
3 <version_command>mimodd version -q</version_command>
|
|
4 <command>
|
|
5 mimodd header
|
|
6
|
|
7 --rg-id "$rg_id"
|
|
8 --rg-sm "$rg_sm"
|
|
9
|
|
10 #if $str($rg_cn):
|
|
11 --rg-cn "$rg_cn"
|
|
12 #end if
|
|
13 #if $str($rg_ds):
|
|
14 --rg-ds "$rg_ds"
|
|
15 #end if
|
|
16 #if $str($rg_date):
|
|
17 --rg-dt "$rg_date"
|
|
18 #end if
|
|
19 #if $str($rg_lb):
|
|
20 --rg-lb "$rg_lb"
|
|
21 #end if
|
|
22 #if $str($rg_pl):
|
|
23 --rg-pl "$rg_pl"
|
|
24 #end if
|
|
25 #if $str($rg_pi):
|
|
26 --rg-pi "$rg_pi"
|
|
27 #end if
|
|
28 #if $str($rg_pu):
|
|
29 --rg-pu "$rg_pu"
|
|
30 #end if
|
|
31
|
|
32 --ofile "$outputfile"
|
|
33
|
|
34 </command>
|
|
35
|
|
36 <inputs>
|
|
37 <param name="rg_id" type="text" size="80" label="read-group ID (required)">
|
|
38 <sanitizer invalid_char="">
|
|
39 <valid initial="string.printable">
|
|
40 <remove value=""" />
|
|
41 </valid>
|
|
42 <mapping initial="none">
|
|
43 <add source=""" target="\""/>
|
|
44 </mapping>
|
|
45 </sanitizer>
|
|
46 </param>
|
|
47 <param name="rg_sm" type="text" size="80" label="sample name (required)">
|
|
48 <sanitizer invalid_char="">
|
|
49 <valid initial="string.printable">
|
|
50 <remove value=""" />
|
|
51 </valid>
|
|
52 <mapping initial="none">
|
|
53 <add source=""" target="\""/>
|
|
54 </mapping>
|
|
55 </sanitizer>
|
|
56 </param>
|
|
57 <param name="rg_ds" type="text" size="80" label="description">
|
|
58 <sanitizer invalid_char="">
|
|
59 <valid initial="string.printable">
|
|
60 <remove value=""" />
|
|
61 </valid>
|
|
62 <mapping initial="none">
|
|
63 <add source=""" target="\""/>
|
|
64 </mapping>
|
|
65 </sanitizer>
|
|
66 </param>
|
|
67 <param name="rg_date" type="text" label="date (YYYY-MM-DD) the run was produced" />
|
|
68 <param name="rg_cn" type="text" size="80" label="name of sequencing center">
|
|
69 <sanitizer invalid_char="">
|
|
70 <valid initial="string.printable">
|
|
71 <remove value=""" />
|
|
72 </valid>
|
|
73 <mapping initial="none">
|
|
74 <add source=""" target="\""/>
|
|
75 </mapping>
|
|
76 </sanitizer>
|
|
77 </param>
|
|
78 <param name="rg_lb" type="text" size="80" label="read-group library">
|
|
79 <sanitizer invalid_char="">
|
|
80 <valid initial="string.printable">
|
|
81 <remove value=""" />
|
|
82 </valid>
|
|
83 <mapping initial="none">
|
|
84 <add source=""" target="\""/>
|
|
85 </mapping>
|
|
86 </sanitizer>
|
|
87 </param>
|
|
88 <param name="rg_pl" type="text" label="platform/technology used to produce the reads" />
|
|
89 <param name="rg_pi" type="text" label="predicted median insert size" />
|
|
90 <param name="rg_pu" type="text" size="80" label="platform unit; unique identifier">
|
|
91 <sanitizer invalid_char="">
|
|
92 <valid initial="string.printable">
|
|
93 <remove value=""" />
|
|
94 </valid>
|
|
95 <mapping initial="none">
|
|
96 <add source=""" target="\""/>
|
|
97 </mapping>
|
|
98 </sanitizer>
|
|
99 </param>
|
|
100 </inputs>
|
|
101
|
|
102 <outputs>
|
|
103 <data name="outputfile" format="sam" label="${rg_sm} (${rg_id}) header information from MiModd ${tool.name} on ${on_string}"/>
|
|
104 </outputs>
|
|
105
|
|
106 <help>
|
|
107 .. class:: infomark
|
|
108
|
|
109 **What it does**
|
|
110
|
|
111 This tool takes the user-provided information about a next-generation sequencing run and constructs a valid header in the SAM file format from it.
|
|
112
|
|
113 The result file can be used by the tools *Convert* and *Reheader* or in the *SNAP Read Alignment* step to add run metadata to sequenced reads files (or to overwrite pre-existing information).
|
|
114
|
|
115 **Note:**
|
|
116
|
|
117 **MiModD requires run metadata for every input file at the Alignment step !**
|
|
118
|
|
119 **Tip:**
|
|
120
|
|
121 While you can do Alignments from fastq file format by providing a custom header file directly to the *SNAP Read Alignment* tool, we **recommend** you to first convert all input files to and archive all datasets in SAM/BAM format with appropriate header information prior to any downstream analysis. Although a bit more time-consuming, this practice protects against information loss and ensures that the input datasets will remain useful for others in the future.
|
|
122
|
|
123 </help>
|
|
124 </tool>
|
|
125
|