annotate vsnp_sample_names.xml @ 7:e1cb13d6a82c draft

"planemo upload for repository https://github.com/gregvonkuster/galaxy_tools/tree/master/tools/sequence_analysis/vsnp/vsnp_sample_names commit f85ae0f073297ca7f5dfa22ae3a24f5fc2e6bad6"
author greg
date Fri, 03 Sep 2021 17:21:52 +0000
parents fb3defef50e5
children 4f43f163c408
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
3
fb3defef50e5 Uploaded
greg
parents: 2
diff changeset
1 <tool id="vsnp_sample_names" name="vSNP: sample names" version="@WRAPPER_VERSION@.1" profile="@PROFILE@">
0
f75e2ac7b6cd Uploaded
greg
parents:
diff changeset
2 <description></description>
3
fb3defef50e5 Uploaded
greg
parents: 2
diff changeset
3 <macros>
fb3defef50e5 Uploaded
greg
parents: 2
diff changeset
4 <import>macros.xml</import>
fb3defef50e5 Uploaded
greg
parents: 2
diff changeset
5 </macros>
0
f75e2ac7b6cd Uploaded
greg
parents:
diff changeset
6 <command detect_errors="exit_code"><![CDATA[
7
e1cb13d6a82c "planemo upload for repository https://github.com/gregvonkuster/galaxy_tools/tree/master/tools/sequence_analysis/vsnp/vsnp_sample_names commit f85ae0f073297ca7f5dfa22ae3a24f5fc2e6bad6"
greg
parents: 3
diff changeset
7 #import difflib
0
f75e2ac7b6cd Uploaded
greg
parents:
diff changeset
8 #import os
f75e2ac7b6cd Uploaded
greg
parents:
diff changeset
9 #import re
3
fb3defef50e5 Uploaded
greg
parents: 2
diff changeset
10
7
e1cb13d6a82c "planemo upload for repository https://github.com/gregvonkuster/galaxy_tools/tree/master/tools/sequence_analysis/vsnp/vsnp_sample_names commit f85ae0f073297ca7f5dfa22ae3a24f5fc2e6bad6"
greg
parents: 3
diff changeset
11 #if $input_type_cond.input_type == 'single':
e1cb13d6a82c "planemo upload for repository https://github.com/gregvonkuster/galaxy_tools/tree/master/tools/sequence_analysis/vsnp/vsnp_sample_names commit f85ae0f073297ca7f5dfa22ae3a24f5fc2e6bad6"
greg
parents: 3
diff changeset
12 #set read1 = $input_type_cond.read1
e1cb13d6a82c "planemo upload for repository https://github.com/gregvonkuster/galaxy_tools/tree/master/tools/sequence_analysis/vsnp/vsnp_sample_names commit f85ae0f073297ca7f5dfa22ae3a24f5fc2e6bad6"
greg
parents: 3
diff changeset
13 #set sample_name = re.sub('[^\s\w\-\\.]', '_', str($read1.element_identifier))
e1cb13d6a82c "planemo upload for repository https://github.com/gregvonkuster/galaxy_tools/tree/master/tools/sequence_analysis/vsnp/vsnp_sample_names commit f85ae0f073297ca7f5dfa22ae3a24f5fc2e6bad6"
greg
parents: 3
diff changeset
14 #else if $input_type_cond.input_type == 'pair':
3
fb3defef50e5 Uploaded
greg
parents: 2
diff changeset
15 #set read1 = $input_type_cond.read1
7
e1cb13d6a82c "planemo upload for repository https://github.com/gregvonkuster/galaxy_tools/tree/master/tools/sequence_analysis/vsnp/vsnp_sample_names commit f85ae0f073297ca7f5dfa22ae3a24f5fc2e6bad6"
greg
parents: 3
diff changeset
16 #set read1_identifier = re.sub('[^\s\w\-]', '_', str($read1.element_identifier))
e1cb13d6a82c "planemo upload for repository https://github.com/gregvonkuster/galaxy_tools/tree/master/tools/sequence_analysis/vsnp/vsnp_sample_names commit f85ae0f073297ca7f5dfa22ae3a24f5fc2e6bad6"
greg
parents: 3
diff changeset
17 #set read2 = $input_type_cond.read2
e1cb13d6a82c "planemo upload for repository https://github.com/gregvonkuster/galaxy_tools/tree/master/tools/sequence_analysis/vsnp/vsnp_sample_names commit f85ae0f073297ca7f5dfa22ae3a24f5fc2e6bad6"
greg
parents: 3
diff changeset
18 #set read2_identifier = re.sub('[^\s\w\-]', '_', str($read2.element_identifier))
e1cb13d6a82c "planemo upload for repository https://github.com/gregvonkuster/galaxy_tools/tree/master/tools/sequence_analysis/vsnp/vsnp_sample_names commit f85ae0f073297ca7f5dfa22ae3a24f5fc2e6bad6"
greg
parents: 3
diff changeset
19 #set matches = difflib.SequenceMatcher(None, read1_identifier, read2_identifier).get_matching_blocks()
e1cb13d6a82c "planemo upload for repository https://github.com/gregvonkuster/galaxy_tools/tree/master/tools/sequence_analysis/vsnp/vsnp_sample_names commit f85ae0f073297ca7f5dfa22ae3a24f5fc2e6bad6"
greg
parents: 3
diff changeset
20 #set match = $matches[0]
e1cb13d6a82c "planemo upload for repository https://github.com/gregvonkuster/galaxy_tools/tree/master/tools/sequence_analysis/vsnp/vsnp_sample_names commit f85ae0f073297ca7f5dfa22ae3a24f5fc2e6bad6"
greg
parents: 3
diff changeset
21 #set sample_name = re.sub('[^\s\w\-]', '_', str($read1_identifier[match.a:match.a + match.size]))
3
fb3defef50e5 Uploaded
greg
parents: 2
diff changeset
22 #else:
7
e1cb13d6a82c "planemo upload for repository https://github.com/gregvonkuster/galaxy_tools/tree/master/tools/sequence_analysis/vsnp/vsnp_sample_names commit f85ae0f073297ca7f5dfa22ae3a24f5fc2e6bad6"
greg
parents: 3
diff changeset
23 #set read1 = $input_type_cond.reads_collection['forward']
e1cb13d6a82c "planemo upload for repository https://github.com/gregvonkuster/galaxy_tools/tree/master/tools/sequence_analysis/vsnp/vsnp_sample_names commit f85ae0f073297ca7f5dfa22ae3a24f5fc2e6bad6"
greg
parents: 3
diff changeset
24 #set read1_filename = $read1.name
3
fb3defef50e5 Uploaded
greg
parents: 2
diff changeset
25 #set sample_name = re.sub('[^\s\w\-]', '_', str($read1_filename))
fb3defef50e5 Uploaded
greg
parents: 2
diff changeset
26 #end if
fb3defef50e5 Uploaded
greg
parents: 2
diff changeset
27
fb3defef50e5 Uploaded
greg
parents: 2
diff changeset
28 #if $sample_name.find('_R1') >0:
fb3defef50e5 Uploaded
greg
parents: 2
diff changeset
29 ## Something like CMC_20E1_R1.fastq.gz
fb3defef50e5 Uploaded
greg
parents: 2
diff changeset
30 #set sample_name = $sample_name.split('_R1')[0]
fb3defef50e5 Uploaded
greg
parents: 2
diff changeset
31 #else if $sample_name.find(".") > 0:
7
e1cb13d6a82c "planemo upload for repository https://github.com/gregvonkuster/galaxy_tools/tree/master/tools/sequence_analysis/vsnp/vsnp_sample_names commit f85ae0f073297ca7f5dfa22ae3a24f5fc2e6bad6"
greg
parents: 3
diff changeset
32 #if $read1.is_of_type('fastqsanger.gz') and $sample_name.endswith('gz'):
3
fb3defef50e5 Uploaded
greg
parents: 2
diff changeset
33 ## Something like my_sample.fastq.gz
fb3defef50e5 Uploaded
greg
parents: 2
diff changeset
34 #set sample_name = '.'.join($sample_name.split('.')[0:-2])
fb3defef50e5 Uploaded
greg
parents: 2
diff changeset
35 #else:
fb3defef50e5 Uploaded
greg
parents: 2
diff changeset
36 ## Something like my_sample.fastq
fb3defef50e5 Uploaded
greg
parents: 2
diff changeset
37 #set sample_name = $os.path.splitext($sample_name)[0]
0
f75e2ac7b6cd Uploaded
greg
parents:
diff changeset
38 #end if
3
fb3defef50e5 Uploaded
greg
parents: 2
diff changeset
39 #else if $sample_name.find("_") > 0:
7
e1cb13d6a82c "planemo upload for repository https://github.com/gregvonkuster/galaxy_tools/tree/master/tools/sequence_analysis/vsnp/vsnp_sample_names commit f85ae0f073297ca7f5dfa22ae3a24f5fc2e6bad6"
greg
parents: 3
diff changeset
40 #if $read1.is_of_type('fastqsanger.gz') and $sample_name.endswith('gz'):
3
fb3defef50e5 Uploaded
greg
parents: 2
diff changeset
41 ## Something like my_sample_fastq_gz
fb3defef50e5 Uploaded
greg
parents: 2
diff changeset
42 #set sample_name = '_'.join($sample_name.split('_')[0:-2])
fb3defef50e5 Uploaded
greg
parents: 2
diff changeset
43 #else:
fb3defef50e5 Uploaded
greg
parents: 2
diff changeset
44 ## Something like my_sample_fastq
fb3defef50e5 Uploaded
greg
parents: 2
diff changeset
45 #set sample_name = "_".join($sample_name.split("_")[0:-1])
fb3defef50e5 Uploaded
greg
parents: 2
diff changeset
46 #end if
0
f75e2ac7b6cd Uploaded
greg
parents:
diff changeset
47 #end if
7
e1cb13d6a82c "planemo upload for repository https://github.com/gregvonkuster/galaxy_tools/tree/master/tools/sequence_analysis/vsnp/vsnp_sample_names commit f85ae0f073297ca7f5dfa22ae3a24f5fc2e6bad6"
greg
parents: 3
diff changeset
48
3
fb3defef50e5 Uploaded
greg
parents: 2
diff changeset
49 echo '$sample_name' > '$output'
0
f75e2ac7b6cd Uploaded
greg
parents:
diff changeset
50 ]]></command>
f75e2ac7b6cd Uploaded
greg
parents:
diff changeset
51 <inputs>
f75e2ac7b6cd Uploaded
greg
parents:
diff changeset
52 <conditional name="input_type_cond">
f75e2ac7b6cd Uploaded
greg
parents:
diff changeset
53 <param name="input_type" type="select" label="Choose the category of the files to be analyzed">
3
fb3defef50e5 Uploaded
greg
parents: 2
diff changeset
54 <option value="single" selected="true">Single dataset</option>
fb3defef50e5 Uploaded
greg
parents: 2
diff changeset
55 <option value="pair">Dataset pair</option>
fb3defef50e5 Uploaded
greg
parents: 2
diff changeset
56 <option value="paired">List of dataset pairs</option>
0
f75e2ac7b6cd Uploaded
greg
parents:
diff changeset
57 </param>
f75e2ac7b6cd Uploaded
greg
parents:
diff changeset
58 <when value="single">
3
fb3defef50e5 Uploaded
greg
parents: 2
diff changeset
59 <param name="read1" type="data" format="fastqsanger.gz,fastqsanger" label="Read1 fastq file"/>
0
f75e2ac7b6cd Uploaded
greg
parents:
diff changeset
60 </when>
3
fb3defef50e5 Uploaded
greg
parents: 2
diff changeset
61 <when value="pair">
fb3defef50e5 Uploaded
greg
parents: 2
diff changeset
62 <param name="read1" type="data" format="fastqsanger.gz,fastqsanger" label="Read1 fastq file"/>
fb3defef50e5 Uploaded
greg
parents: 2
diff changeset
63 <param name="read2" type="data" format="fastqsanger.gz,fastqsanger" label="Read2 fastq file"/>
0
f75e2ac7b6cd Uploaded
greg
parents:
diff changeset
64 </when>
7
e1cb13d6a82c "planemo upload for repository https://github.com/gregvonkuster/galaxy_tools/tree/master/tools/sequence_analysis/vsnp/vsnp_sample_names commit f85ae0f073297ca7f5dfa22ae3a24f5fc2e6bad6"
greg
parents: 3
diff changeset
65 <when value="paired">
e1cb13d6a82c "planemo upload for repository https://github.com/gregvonkuster/galaxy_tools/tree/master/tools/sequence_analysis/vsnp/vsnp_sample_names commit f85ae0f073297ca7f5dfa22ae3a24f5fc2e6bad6"
greg
parents: 3
diff changeset
66 <param name="reads_collection" type="data_collection" format="fastqsanger,fastqsanger.gz" collection_type="paired" label="Collection of fastqsanger paired read files"/>
e1cb13d6a82c "planemo upload for repository https://github.com/gregvonkuster/galaxy_tools/tree/master/tools/sequence_analysis/vsnp/vsnp_sample_names commit f85ae0f073297ca7f5dfa22ae3a24f5fc2e6bad6"
greg
parents: 3
diff changeset
67 </when>
0
f75e2ac7b6cd Uploaded
greg
parents:
diff changeset
68 </conditional>
f75e2ac7b6cd Uploaded
greg
parents:
diff changeset
69 </inputs>
f75e2ac7b6cd Uploaded
greg
parents:
diff changeset
70 <outputs>
3
fb3defef50e5 Uploaded
greg
parents: 2
diff changeset
71 <data name="output" format="txt"/>
0
f75e2ac7b6cd Uploaded
greg
parents:
diff changeset
72 </outputs>
f75e2ac7b6cd Uploaded
greg
parents:
diff changeset
73 <tests>
3
fb3defef50e5 Uploaded
greg
parents: 2
diff changeset
74 <!-- Single files -->
0
f75e2ac7b6cd Uploaded
greg
parents:
diff changeset
75 <test>
3
fb3defef50e5 Uploaded
greg
parents: 2
diff changeset
76 <param name="input_type" value="single"/>
fb3defef50e5 Uploaded
greg
parents: 2
diff changeset
77 <param name="read1" value="CMC_20E1_R1.fastq.gz" dbkey="89"/>
fb3defef50e5 Uploaded
greg
parents: 2
diff changeset
78 <output name="output" file="sample_names.txt" ftype="txt"/>
fb3defef50e5 Uploaded
greg
parents: 2
diff changeset
79 </test>
7
e1cb13d6a82c "planemo upload for repository https://github.com/gregvonkuster/galaxy_tools/tree/master/tools/sequence_analysis/vsnp/vsnp_sample_names commit f85ae0f073297ca7f5dfa22ae3a24f5fc2e6bad6"
greg
parents: 3
diff changeset
80 <!-- Paired reads in separate datasets -->
e1cb13d6a82c "planemo upload for repository https://github.com/gregvonkuster/galaxy_tools/tree/master/tools/sequence_analysis/vsnp/vsnp_sample_names commit f85ae0f073297ca7f5dfa22ae3a24f5fc2e6bad6"
greg
parents: 3
diff changeset
81 <test>
e1cb13d6a82c "planemo upload for repository https://github.com/gregvonkuster/galaxy_tools/tree/master/tools/sequence_analysis/vsnp/vsnp_sample_names commit f85ae0f073297ca7f5dfa22ae3a24f5fc2e6bad6"
greg
parents: 3
diff changeset
82 <param name="input_type" value="pair"/>
e1cb13d6a82c "planemo upload for repository https://github.com/gregvonkuster/galaxy_tools/tree/master/tools/sequence_analysis/vsnp/vsnp_sample_names commit f85ae0f073297ca7f5dfa22ae3a24f5fc2e6bad6"
greg
parents: 3
diff changeset
83 <param name="read1" value="CMC_20E1_R1.fastq.gz" dbkey="89"/>
e1cb13d6a82c "planemo upload for repository https://github.com/gregvonkuster/galaxy_tools/tree/master/tools/sequence_analysis/vsnp/vsnp_sample_names commit f85ae0f073297ca7f5dfa22ae3a24f5fc2e6bad6"
greg
parents: 3
diff changeset
84 <param name="read2" value="CMC_20E1_R2.fastq.gz" dbkey="89"/>
e1cb13d6a82c "planemo upload for repository https://github.com/gregvonkuster/galaxy_tools/tree/master/tools/sequence_analysis/vsnp/vsnp_sample_names commit f85ae0f073297ca7f5dfa22ae3a24f5fc2e6bad6"
greg
parents: 3
diff changeset
85 <output name="output" file="sample_names.txt" ftype="txt"/>
e1cb13d6a82c "planemo upload for repository https://github.com/gregvonkuster/galaxy_tools/tree/master/tools/sequence_analysis/vsnp/vsnp_sample_names commit f85ae0f073297ca7f5dfa22ae3a24f5fc2e6bad6"
greg
parents: 3
diff changeset
86 </test>
e1cb13d6a82c "planemo upload for repository https://github.com/gregvonkuster/galaxy_tools/tree/master/tools/sequence_analysis/vsnp/vsnp_sample_names commit f85ae0f073297ca7f5dfa22ae3a24f5fc2e6bad6"
greg
parents: 3
diff changeset
87 <!-- Paired collection whose file names end in .fastq.gz -->
3
fb3defef50e5 Uploaded
greg
parents: 2
diff changeset
88 <test>
fb3defef50e5 Uploaded
greg
parents: 2
diff changeset
89 <param name="input_type" value="paired"/>
0
f75e2ac7b6cd Uploaded
greg
parents:
diff changeset
90 <param name="reads_collection">
3
fb3defef50e5 Uploaded
greg
parents: 2
diff changeset
91 <collection type="paired">
fb3defef50e5 Uploaded
greg
parents: 2
diff changeset
92 <element name="forward" value="CMC_20E1_R1.fastq.gz"/>
fb3defef50e5 Uploaded
greg
parents: 2
diff changeset
93 <element name="reverse" value="CMC_20E1_R2.fastq.gz"/>
0
f75e2ac7b6cd Uploaded
greg
parents:
diff changeset
94 </collection>
f75e2ac7b6cd Uploaded
greg
parents:
diff changeset
95 </param>
3
fb3defef50e5 Uploaded
greg
parents: 2
diff changeset
96 <output name="output" file="sample_names.txt" ftype="txt"/>
fb3defef50e5 Uploaded
greg
parents: 2
diff changeset
97 </test>
7
e1cb13d6a82c "planemo upload for repository https://github.com/gregvonkuster/galaxy_tools/tree/master/tools/sequence_analysis/vsnp/vsnp_sample_names commit f85ae0f073297ca7f5dfa22ae3a24f5fc2e6bad6"
greg
parents: 3
diff changeset
98 <!-- Paired collection whose file names have no extension -->
3
fb3defef50e5 Uploaded
greg
parents: 2
diff changeset
99 <test>
7
e1cb13d6a82c "planemo upload for repository https://github.com/gregvonkuster/galaxy_tools/tree/master/tools/sequence_analysis/vsnp/vsnp_sample_names commit f85ae0f073297ca7f5dfa22ae3a24f5fc2e6bad6"
greg
parents: 3
diff changeset
100 <param name="input_type" value="paired"/>
e1cb13d6a82c "planemo upload for repository https://github.com/gregvonkuster/galaxy_tools/tree/master/tools/sequence_analysis/vsnp/vsnp_sample_names commit f85ae0f073297ca7f5dfa22ae3a24f5fc2e6bad6"
greg
parents: 3
diff changeset
101 <param name="reads_collection">
e1cb13d6a82c "planemo upload for repository https://github.com/gregvonkuster/galaxy_tools/tree/master/tools/sequence_analysis/vsnp/vsnp_sample_names commit f85ae0f073297ca7f5dfa22ae3a24f5fc2e6bad6"
greg
parents: 3
diff changeset
102 <collection type="paired">
e1cb13d6a82c "planemo upload for repository https://github.com/gregvonkuster/galaxy_tools/tree/master/tools/sequence_analysis/vsnp/vsnp_sample_names commit f85ae0f073297ca7f5dfa22ae3a24f5fc2e6bad6"
greg
parents: 3
diff changeset
103 <element name="forward" value="SRR14085881_forward"/>
e1cb13d6a82c "planemo upload for repository https://github.com/gregvonkuster/galaxy_tools/tree/master/tools/sequence_analysis/vsnp/vsnp_sample_names commit f85ae0f073297ca7f5dfa22ae3a24f5fc2e6bad6"
greg
parents: 3
diff changeset
104 <element name="reverse" value="SRR14085881_reverse"/>
e1cb13d6a82c "planemo upload for repository https://github.com/gregvonkuster/galaxy_tools/tree/master/tools/sequence_analysis/vsnp/vsnp_sample_names commit f85ae0f073297ca7f5dfa22ae3a24f5fc2e6bad6"
greg
parents: 3
diff changeset
105 </collection>
e1cb13d6a82c "planemo upload for repository https://github.com/gregvonkuster/galaxy_tools/tree/master/tools/sequence_analysis/vsnp/vsnp_sample_names commit f85ae0f073297ca7f5dfa22ae3a24f5fc2e6bad6"
greg
parents: 3
diff changeset
106 </param>
e1cb13d6a82c "planemo upload for repository https://github.com/gregvonkuster/galaxy_tools/tree/master/tools/sequence_analysis/vsnp/vsnp_sample_names commit f85ae0f073297ca7f5dfa22ae3a24f5fc2e6bad6"
greg
parents: 3
diff changeset
107 <output name="output" file="sample_names2.txt" ftype="txt"/>
0
f75e2ac7b6cd Uploaded
greg
parents:
diff changeset
108 </test>
f75e2ac7b6cd Uploaded
greg
parents:
diff changeset
109 </tests>
f75e2ac7b6cd Uploaded
greg
parents:
diff changeset
110 <help>
f75e2ac7b6cd Uploaded
greg
parents:
diff changeset
111 **What it does**
f75e2ac7b6cd Uploaded
greg
parents:
diff changeset
112
3
fb3defef50e5 Uploaded
greg
parents: 2
diff changeset
113 Accepts fastqsanger or fastqsanger.gz sample files, extracts a unique portion of the file name as the sample name, and writes it to
fb3defef50e5 Uploaded
greg
parents: 2
diff changeset
114 the output. The output text file can be consumed by the **Parse parameter value** expression tool to provide workflow
fb3defef50e5 Uploaded
greg
parents: 2
diff changeset
115 parameter values to the **Read group identifier (ID)** and the **Sample name identifier (SM)** parameters in the
fb3defef50e5 Uploaded
greg
parents: 2
diff changeset
116 **Map with BWA-MEM** tool.
0
f75e2ac7b6cd Uploaded
greg
parents:
diff changeset
117 </help>
3
fb3defef50e5 Uploaded
greg
parents: 2
diff changeset
118 <expand macro="citations"/>
0
f75e2ac7b6cd Uploaded
greg
parents:
diff changeset
119 </tool>
f75e2ac7b6cd Uploaded
greg
parents:
diff changeset
120