comparison utils_extract-boxed-sequences.xml @ 4:63df1e23f4ff draft

planemo upload for repository https://github.com/ErasmusMC-Bioinformatics/segmentation_fold_galaxy_wrapper commit 00690c63c51a7f7563f2428c313d7fa75f2657e5-dirty
author yhoogstrate
date Thu, 28 Jul 2016 10:25:37 -0400
parents
children b7cf9b172cfe
comparison
equal deleted inserted replaced
3:cd1bba1c66b3 4:63df1e23f4ff
1 <tool id="smf_utils_extract-boxed-sequences" name="extract-boxed-sequences" version="@VERSION@-1">
2 <description>Extracts boxed sequences from bed_input_file which has to be created with 'find-boxes', part of this utility</description> <!-- Subcommand name spelled 'find-boxes', matching the bed_input_file help text of this tool. -->
3
4 <macros> <!-- Imports shared definitions from macros.xml. NOTE(review): the @VERSION@ and @VERSION_COMMAND_UTILS@ tokens and the "stdio" and "citations" macros used by this tool are presumably defined there; confirm. -->
5 <import>macros.xml</import>
6 </macros>
7
8 <requirements> <!-- Package dependencies declared by this tool, each pinned to one exact version. -->
9 <requirement type="package" version="2.7.10">python</requirement>
10 <requirement type="package" version="1.9">numpy</requirement>
11 <requirement type="package" version="0.8.2.1">pysam</requirement>
12 <requirement type="package" version="0.6.1">htseq</requirement>
13 <requirement type="package" version="2.0.1">segmentation-fold-utils</requirement> <!-- Presumably the package that ships the segmentation-fold-utils executable called in the command section; confirm. -->
14 </requirements>
15 <expand macro="stdio" /> <!-- Expands the "stdio" macro; its definition is not visible in this file (presumably macros.xml). -->
16
17 <version_command>@VERSION_COMMAND_UTILS@</version_command> <!-- Placeholder token; NOTE(review): the actual version command is defined outside this file, confirm in macros.xml. -->
18
19 <!-- Calls the extract-boxed-sequences subcommand of segmentation-fold-utils: first the two integer options, then three single-quoted positional paths in the order reference FASTA, boxes BED, output FASTA. --> <command><![CDATA[
20 segmentation-fold-utils
21 extract-boxed-sequences
22
23 --max-inner-dist $max_inner_dist
24 --bp-extension $bp_extension
25
26 '${fasta_input_file}'
27 '${bed_input_file}'
28 '${fasta_output_file}'
29
30 ]]></command>
31
32 <inputs> <!-- Two datasets (reference FASTA, boxes BED) and two integer options; every name here is referenced as a variable in the command template. -->
33 <param name="fasta_input_file"
34 type="data"
35 format="fasta"
36 label="Genomic reference FASTA file"/>
37 <param name="bed_input_file"
38 type="data"
39 format="bed"
40 label="BED file containing the sequence boxes"
41 help="This file should have been created with 'find-boxes'"/>
42
43 <param name="max_inner_dist"
44 type="integer"
45 min="0"
46 value="250"
47 label="Maximal distance between the boxes"
48 help="(default=250bp)"/> <!-- Integer with a lower bound of 0; the value attribute (250) is the preset shown in the form. -->
49 <param name="bp_extension"
50 type="integer"
51 min="0"
52 value="10"
53 label="Extend extracted sequences with this number of bases"
54 help="(default: 10bp)"/> <!-- Integer with a lower bound of 0; the value attribute (10) is the preset shown in the form. -->
55 </inputs>
56
57 <outputs> <!-- A single FASTA dataset; the command template passes it as the last positional argument. -->
58 <data name="fasta_output_file"
59 format="fasta"
60 label="${tool.name} on ${fasta_input_file.hid}: ${fasta_input_file.name}"/> <!-- The label is built from the tool name plus the hid and name of the input FASTA dataset. -->
61 </outputs>
62
63 <tests> <!-- One test case: runs the tool on the test_01 FASTA and BED fixtures with max_inner_dist=100 and bp_extension=0, and names the expected FASTA output file. -->
64 <test>
65 <param name="fasta_input_file" value="ExtractBoxedSequences.test_01.in.fa" ftype="fasta"/>
66 <param name="bed_input_file" value="ExtractBoxedSequences.test_01.in.bed" ftype="bed"/>
67 <param name="max_inner_dist" value="100"/>
68 <param name="bp_extension" value="0"/>
69
70 <output name="fasta_output_file" file="ExtractBoxedSequences.test_01.out.fa"/>
71 </test>
72 </tests>
73
74 <help><![CDATA[
75 extract-boxed-sequences
76 -----------------------
77 *Extracts boxed sequences from `bed_input_file` which has to be created with 'find-boxes', also part of this utility*
78
79 The user can use this utility to extract sequences containing the boxes provided in the bed file by `find-boxes`.
80
81 **input**
82
83 Important information about the input:
84
85 - `FASTA_INPUT_FILE` can be any generic FASTA file that can be read with pysam. This means that if a sequence is split over multiple lines, all of those lines must have the same length.
86 - `BED_INPUT_FILE` the bed file should be provided by `find-boxes` as it properly denotes the names (box1-f, box1-r, box2-f and box2-r) which are used for extraction.
87 - `-d, --max-inner-dist INTEGER` Only sequences for which the distance in bases between the boxes is smaller than this distance, will be extracted. Boxes are excluded from this distance.
88 - `-e, --bp-extension INTEGER` Each sequence will be extended with:
89 * The boxes
90 * An optional number of bases provided with this argument
91
92 **output**
93
94 Be aware that there can be overlapping sequences. For example, if you search for box1=`TTTT` and box2=`CCCC` in the following sequence, you will extract 2 sequences:
95
96 ```>seq
97 gagagaTTTTgagagaTTTTgagagagagagagagaCCCCgaga
98 ```
99
100 Namely:
101
102 ```TTTTgagagaTTTTgagagagagagagagaCCCC
103 ```
104
105 and
106
107 ``` TTTTgagagagagagagagaCCCC
108 ```
109
110 This is a utility of the segmentation-fold package
111 ]]></help>
112
113 <expand macro="citations" /> <!-- Expands the "citations" macro; its definition is not visible in this file (presumably macros.xml). -->
114 </tool>