Mercurial > repos > devteam > picard
comparison picard_MarkDuplicatesWithMateCigar.xml @ 33:3f254c5ced1d draft default tip
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/picard commit 9ecbbb878d68a980ba35a90865e524c723ca3ed8
author | iuc |
---|---|
date | Sun, 03 Mar 2024 16:06:11 +0000 |
parents | f9242e01365a |
children |
comparison
equal
deleted
inserted
replaced
32:f9242e01365a | 33:3f254c5ced1d |
---|---|
1 <tool name="MarkDuplicatesWithMateCigar" id="picard_MarkDuplicatesWithMateCigar" version="@TOOL_VERSION@.@WRAPPER_VERSION@"> | 1 <tool name="MarkDuplicatesWithMateCigar" id="picard_MarkDuplicatesWithMateCigar" version="@TOOL_VERSION@.@WRAPPER_VERSION@" profile="@PROFILE@"> |
2 <description>examine aligned records in BAM datasets to locate duplicate molecules</description> | 2 <description>examine aligned records in BAM datasets to locate duplicate molecules</description> |
3 <macros> | 3 <macros> |
4 <import>picard_macros.xml</import> | 4 <import>picard_macros.xml</import> |
5 <token name="@WRAPPER_VERSION@">3</token> | 5 <token name="@WRAPPER_VERSION@">0</token> |
6 </macros> | 6 </macros> |
7 <expand macro="requirements" /> | 7 <expand macro="requirements"/> |
8 <command detect_errors="exit_code"><![CDATA[ | 8 <command detect_errors="exit_code"><![CDATA[ |
9 @java_options@ | 9 @java_options@ |
10 @symlink_element_identifier@ | 10 @symlink_element_identifier@ |
11 picard | 11 picard MarkDuplicatesWithMateCigar |
12 MarkDuplicatesWithMateCigar | |
13 | 12 |
14 INPUT='$escaped_element_identifier' | 13 --INPUT '$escaped_element_identifier' |
15 OUTPUT="${outFile}" | 14 --OUTPUT '${outFile}' |
16 | 15 |
17 METRICS_FILE="${metrics_file}" | 16 --METRICS_FILE '${metrics_file}' |
18 COMMENT="${comment}" | 17 --COMMENT '${comment}' |
19 | 18 |
20 MINIMUM_DISTANCE="${minimum_distance}" | 19 --MINIMUM_DISTANCE '${minimum_distance}' |
21 SKIP_PAIRS_WITH_NO_MATE_CIGAR="${skip_pairs_with_no_mate_cigar}" | 20 --SKIP_PAIRS_WITH_NO_MATE_CIGAR '${skip_pairs_with_no_mate_cigar}' |
22 | 21 |
22 --REMOVE_DUPLICATES '${remove_duplicates}' | |
23 --ASSUME_SORTED '${assume_sorted}' | |
23 | 24 |
24 REMOVE_DUPLICATES="${remove_duplicates}" | 25 --DUPLICATE_SCORING_STRATEGY ${duplicate_scoring_strategy} |
25 ASSUME_SORTED="${assume_sorted}" | |
26 | 26 |
27 DUPLICATE_SCORING_STRATEGY="${duplicate_scoring_strategy}" | 27 --READ_NAME_REGEX '${ str( $read_name_regex ) }' |
28 --OPTICAL_DUPLICATE_PIXEL_DISTANCE '${optical_duplicate_pixel_distance}' | |
28 | 29 |
29 READ_NAME_REGEX='${ str( $read_name_regex ) }' | 30 --BLOCK_SIZE 100000 |
30 OPTICAL_DUPLICATE_PIXEL_DISTANCE="${optical_duplicate_pixel_distance}" | 31 --VALIDATION_STRINGENCY '${validation_stringency}' |
31 | 32 --QUIET true |
32 | 33 --VERBOSITY ERROR |
33 BLOCK_SIZE=100000 | |
34 VALIDATION_STRINGENCY="${validation_stringency}" | |
35 QUIET=true | |
36 VERBOSITY=ERROR | |
37 | 34 |
38 ]]></command> | 35 ]]></command> |
39 <inputs> | 36 <inputs> |
40 <param format="bam" name="inputFile" type="data" label="Select SAM/BAM dataset or dataset collection" help="If empty, upload or import a SAM/BAM dataset"/> | 37 <param name="inputFile" type="data" format="bam" label="Select SAM/BAM dataset or dataset collection" help="If empty, upload or import a SAM/BAM dataset"/> |
41 <param name="comment" type="text" label="Add this comment to BAM dataset"/> | 38 <param name="comment" type="text" label="Add this comment to BAM dataset"/> |
42 | 39 <param name="minimum_distance" type="integer" value="-1" label="The minimum distance to buffer records to account for clipping on the 5' end of the records" help="MINIMUM_DISTANCE; Set this number to -1 to use twice the first read's read length (or 100, whichever is smaller); default=-1"/> |
43 <param name="minimum_distance" type="integer" value="-1" label="The minimum distance to buffer records to account for clipping on the 5' end of the records" help="MINIMUM_DISTANCE; Set this number to -1 to use twice the first read's read length (or 100, whichever is smaller); default=-1"/> | 40 <param name="skip_pairs_with_no_mate_cigar" type="boolean" checked="true" truevalue="true" falsevalue="false" label="Skip record pairs with no mate cigar and include them in the output" help="SKIP_PAIRS_WITH_NO_MATE_CIGAR; default=True"/> |
44 <param name="skip_pairs_with_no_mate_cigar" type="boolean" checked="true" truevalue="true" falsevalue="false" label="Skip record pairs with no mate cigar and include them in the output" help="SKIP_PAIRS_WITH_NO_MATE_CIGAR; default=True"/> | 41 <param name="remove_duplicates" type="boolean" label="If true do not write duplicates to the output file instead of writing them with appropriate flags set" help="REMOVE_DUPLICATES; default=False"/> |
45 <param name="remove_duplicates" type="boolean" label="If true do not write duplicates to the output file instead of writing them with appropriate flags set" help="REMOVE_DUPLICATES; default=False"/> | 42 <param name="assume_sorted" type="boolean" label="Assume the input file is already sorted" checked="true" truevalue="true" falsevalue="false" help="ASSUME_SORTED; default=True"/> |
46 <param name="assume_sorted" type="boolean" label="Assume the input file is already sorted" checked="true" truevalue="true" falsevalue="false" help="ASSUME_SORTED; default=True"/> | 43 <param name="duplicate_scoring_strategy" type="select" label="The scoring strategy for choosing the non-duplicate among candidates" help="DUPLICATE_SCORING_STRATEGY; default=TOTAL_MAPPED_REFERENCE_LENGTH"> |
47 | 44 <option value="TOTAL_MAPPED_REFERENCE_LENGTH" selected="True">TOTAL_MAPPED_REFERENCE_LENGTH</option> |
48 <param name="duplicate_scoring_strategy" type="select" label="The scoring strategy for choosing the non-duplicate among candidates" help="DUPLICATE_SCORING_STRATEGY; default=TOTAL_MAPPED_REFERENCE_LENGTH"> | 45 <option value="SUM_OF_BASE_QUALITIES">SUM_OF_BASE_QUALITIES</option> |
49 <option value="TOTAL_MAPPED_REFERENCE_LENGTH" selected="True">TOTAL_MAPPED_REFERENCE_LENGTH</option> | 46 <option value="RANDOM">RANDOM</option> |
50 <option value="SUM_OF_BASE_QUALITIES">SUM_OF_BASE_QUALITIES</option> | 47 </param> |
51 </param> | 48 <param name="read_name_regex" type="text" value="[a-zA-Z0-9]+:[0-9]:([0-9]+):([0-9]+):([0-9]+).*." label="Regular expression that can be used to parse read names in the incoming SAM/BAM dataset" help="READ_NAME_REGEX; Read names are parsed to extract three variables: tile/region, x coordinate and y coordinate. These values are used to estimate the rate of optical duplication in order to give a more accurate estimated library size. See help below for more info; default=[a-zA-Z0-9]+:[0-9]:([0-9]+):([0-9]+):([0-9]+).*."> |
52 | 49 <expand macro="sanitize_query"/> |
53 | 50 </param> |
54 <param name="read_name_regex" type="text" value="[a-zA-Z0-9]+:[0-9]:([0-9]+):([0-9]+):([0-9]+).*." label="Regular expression that can be used to parse read names in the incoming SAM/BAM dataset" help="READ_NAME_REGEX; Read names are parsed to extract three variables: tile/region, x coordinate and y coordinate. These values are used to estimate the rate of optical duplication in order to give a more accurate estimated library size. See help below for more info; default=[a-zA-Z0-9]+:[0-9]:([0-9]+):([0-9]+):([0-9]+).*."> | 51 <param name="optical_duplicate_pixel_distance" type="integer" value="100" min="0" max="5000" label="The maximum offset between two duplicte clusters in order to consider them optical duplicates" help="OPTICAL_DUPLICATE_PIXEL_DISTANCE; default=100"/> |
55 <expand macro="sanitize_query" /> | 52 <expand macro="VS"/> |
56 </param> | 53 </inputs> |
57 <param name="optical_duplicate_pixel_distance" type="integer" value="100" min="0" max="5000" label="The maximum offset between two duplicte clusters in order to consider them optical duplicates" help="OPTICAL_DUPLICATE_PIXEL_DISTANCE; default=100"/> | 54 <outputs> |
58 | 55 <data format="txt" name="metrics_file" label="${tool.name} on ${on_string}: metrics"/> |
59 <expand macro="VS" /> | 56 <data format="bam" name="outFile" label="${tool.name} on ${on_string}: BAM"/> |
60 | 57 </outputs> |
61 </inputs> | 58 <tests> |
62 | 59 <test> |
63 <outputs> | 60 <param name="inputFile" value="picard_MarkDuplicatesWithMateCigar.bam" ftype="bam"/> |
64 <data format="txt" name="metrics_file" label="${tool.name} on ${on_string}: metrics"/> | 61 <param name="minimum_distance" value="-1"/> |
65 <data format="bam" name="outFile" label="${tool.name} on ${on_string}: BAM"/> | 62 <param name="skip_pairs_with_no_mate_cigar" value="True"/> |
66 </outputs> | 63 <param name="comment" value="test-run"/> |
67 | 64 <param name="assume_sorted" value="True"/> |
68 <tests> | 65 <param name="remove_duplicates" value="False"/> |
69 <test> | 66 <param name="read_name_regex" value="[a-zA-Z0-9]+:[0-9]:([0-9]+):([0-9]+):([0-9]+).*."/> |
70 <param name="inputFile" value="picard_MarkDuplicatesWithMateCigar.bam" ftype="bam"/> | 67 <param name="optical_duplicate_pixel_distance" value="100"/> |
71 <param name="minimum_distance" value="-1"/> | 68 <param name="duplicate_scoring_strategy" value="TOTAL_MAPPED_REFERENCE_LENGTH"/> |
72 <param name="skip_pairs_with_no_mate_cigar" value="True"/> | 69 <param name="validation_stringency" value="LENIENT"/> |
73 <param name="comment" value="test-run"/> | 70 <output name="outFile" file="picard_MarkDuplicatesWithMateCigar_test1.bam" ftype="bam" lines_diff="4"/> |
74 <param name="assume_sorted" value="True"/> | 71 </test> |
75 <param name="remove_duplicates" value="False"/> | 72 </tests> |
76 <param name="read_name_regex" value="[a-zA-Z0-9]+:[0-9]:([0-9]+):([0-9]+):([0-9]+).*."/> | 73 <help> |
77 <param name="optical_duplicate_pixel_distance" value="100"/> | |
78 <param name="duplicate_scoring_strategy" value="TOTAL_MAPPED_REFERENCE_LENGTH"/> | |
79 <param name="validation_stringency" value="LENIENT"/> | |
80 <output name="outFile" file="picard_MarkDuplicatesWithMateCigar_test1.bam" ftype="bam" lines_diff="4"/> | |
81 </test> | |
82 </tests> | |
83 | |
84 | |
85 <help> | |
86 | 74 |
87 **Purpose** | 75 **Purpose** |
88 | 76 |
89 Examines aligned records in the supplied SAM or BAM dataset to locate duplicate molecules. All records are then written to the output file with the duplicate records flagged. | 77 Examines aligned records in the supplied SAM or BAM dataset to locate duplicate molecules. All records are then written to the output file with the duplicate records flagged. |
90 | 78 |
147 which case 50-100 is more normal. Default value: 100. | 135 which case 50-100 is more normal. Default value: 100. |
148 | 136 |
149 @more_info@ | 137 @more_info@ |
150 | 138 |
151 </help> | 139 </help> |
152 <expand macro="citations" /> | 140 <expand macro="citations"/> |
153 </tool> | 141 </tool> |