comparison arriba.xml @ 7:25d207f7ff83 draft

"planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit e113a79cc67e0bdb168babfe964f34873b2e1303"
author jjohnson
date Mon, 11 Oct 2021 16:40:51 +0000
parents 7253b367c082
children 1a56888ddb7d
comparison
equal deleted inserted replaced
6:7253b367c082 7:25d207f7ff83
53 #if $input_params.chimeric 53 #if $input_params.chimeric
54 -c '$input_params.chimeric' 54 -c '$input_params.chimeric'
55 #end if 55 #end if
56 #end if 56 #end if
57 -a '$genome_assembly' 57 -a '$genome_assembly'
58 -g '$gtf' 58 -g '$annotation'
59 #if $blacklist 59 #if $blacklist
60 -b '$blacklist' 60 -b '$blacklist'
61 #else 61 #else
62 -f 'blacklist' 62 -f 'blacklist'
63 #end if 63 #end if
153 #elif str($visualization.do_viz) == "yes" 153 #elif str($visualization.do_viz) == "yes"
154 && samtools sort -@ \${GALAXY_SLOTS:-1} -m 4G -T tmp -O bam '$input_params.input' > Aligned.sortedByCoord.out.bam 154 && samtools sort -@ \${GALAXY_SLOTS:-1} -m 4G -T tmp -O bam '$input_params.input' > Aligned.sortedByCoord.out.bam
155 && samtools index Aligned.sortedByCoord.out.bam 155 && samtools index Aligned.sortedByCoord.out.bam
156 #end if 156 #end if
157 #if str($visualization.do_viz) == "yes" 157 #if str($visualization.do_viz) == "yes"
158 && draw_fusions.R 158 #set $fusions = 'fusions.tsv'
159 --fusions=fusions.tsv 159 && @DRAW_FUSIONS@
160 --alignments=Aligned.sortedByCoord.out.bam
161 --annotation='$gtf'
162 --output=fusions.pdf
163 #if $visualization.cytobands
164 --cytobands='$visualization.cytobands'
165 #end if
166 #if $protein_domains
167 --proteinDomains='$protein_domains'
168 #end if
169 ## Visualization Options
170 #if $visualization.options.transcriptSelection
171 --transcriptSelection=$visualization.options.transcriptSelection
172 #end if
173 #if $visualization.options.minConfidenceForCircosPlot
174 --minConfidenceForCircosPlot=$visualization.options.minConfidenceForCircosPlot
175 #end if
176 #if $visualization.options.showIntergenicVicinity
177 --showIntergenicVicinity=$visualization.options.showIntergenicVicinity
178 #end if
179 #if $visualization.options.squishIntrons
180 --squishIntrons=$visualization.options.squishIntrons
181 #end if
182 #if $visualization.options.mergeDomainsOverlappingBy
183 --mergeDomainsOverlappingBy=$visualization.options.mergeDomainsOverlappingBy
184 #end if
185 #if $visualization.options.printExonLabels
186 --printExonLabels=$visualization.options.printExonLabels
187 #end if
188 #if $visualization.options.render3dEffect
189 --render3dEffect=$visualization.options.render3dEffect
190 #end if
191 #if $visualization.options.optimizeDomainColors
192 --optimizeDomainColors=$visualization.options.optimizeDomainColors
193 #end if
194 #if $visualization.options.color1
195 --color1=$visualization.options.color1
196 #end if
197 #if $visualization.options.color2
198 --color2=$visualization.options.color2
199 #end if
200 #if $visualization.options.pdfWidth
201 --pdfWidth=$visualization.options.pdfWidth
202 #end if
203 #if $visualization.options.pdfHeight
204 --pdfHeight=$visualization.options.pdfHeight
205 #end if
206 #if $visualization.options.fontSize
207 --fontSize=$visualization.options.fontSize
208 #end if
209 #end if 160 #end if
210 ]]></command> 161 ]]></command>
211 <inputs> 162 <inputs>
212 <conditional name="input_params"> 163 <conditional name="input_params">
213 <param name="input_source" type="select" label="Use output from earlier STAR run or let Arriba running STAR"> 164 <param name="input_source" type="select" label="Use output from earlier STAR run or let Arriba running STAR">
241 </when> 192 </when>
242 </conditional> 193 </conditional>
243 </when> 194 </when>
244 </conditional> 195 </conditional>
245 <param name="genome_assembly" argument="-a" type="data" format="fasta" label="genome assembly fasta"/> 196 <param name="genome_assembly" argument="-a" type="data" format="fasta" label="genome assembly fasta"/>
246 <param name="gtf" argument="-g" type="data" format="gtf" label="GTF file with gene annotation"/> 197 <param name="annotation" argument="-g" type="data" format="gtf" label="GTF file with gene annotation"/>
247 <param name="blacklist" argument="-b" type="data" format="tabular,tabular.gz" optional="true" label="File containing blacklisted ranges."/> 198 <param name="blacklist" argument="-b" type="data" format="tabular,tabular.gz" optional="true" label="File containing blacklisted ranges."/>
248 <param name="protein_domains" argument="-p" type="data" format="gff3" optional="true" label="File containing protein domains"/> 199 <param name="protein_domains" argument="-p" type="data" format="gff3" optional="true" label="File containing protein domains"/>
249 <param name="known_fusions" argument="-k" type="data" format="tabular,tabular.gz" optional="true" label="File containing known fusions"> 200 <param name="known_fusions" argument="-k" type="data" format="tabular,tabular.gz" optional="true" label="File containing known fusions">
250 <help><![CDATA[ file two TAB separated columns: five-prime region three-prime region ]]></help> 201 <help><![CDATA[ file two TAB separated columns: five-prime region three-prime region ]]></help>
251 </param> 202 </param>
431 <param name="do_viz" type="select" label="Generate visualization"> 382 <param name="do_viz" type="select" label="Generate visualization">
432 <option value="yes">Yes</option> 383 <option value="yes">Yes</option>
433 <option value="no">no</option> 384 <option value="no">no</option>
434 </param> 385 </param>
435 <when value="yes"> 386 <when value="yes">
436 <param name="cytobands" argument="--cytobands" type="data" format="tabular" optional="true" label="Cytobands"/> 387 <expand macro="visualization_options" />
437 <section name="options" expanded="false" title="Visualization Options">
438 <param argument="--transcriptSelection" type="select" optional="true" label="Transcript selection">
439 <help>By default the transcript isoform with the highest coverage is drawn.
440 Alternatively, the transcript isoform that is provided in the columns
441 transcript_id1 and transcript_id2 in the given fusions file can be drawn.
442 Selecting the isoform with the highest coverage usually produces nicer plots,
443 in the sense that the coverage track is smooth and shows a visible increase in coverage after the fusion breakpoint.
444 However, the isoform with the highest coverage may not be the one that is involved in the fusion.
445 Often, genomic rearrangements lead to non-canonical isoforms being transcribed.
446 For this reason, it can make sense to rely on the transcript selection provided by the columns transcript_id1/2,
447 which reflect the actual isoforms involved in a fusion.
448 \ As a third option, the transcripts that are annotated as canonical can be drawn.
449 Transcript isoforms tagged with appris_principal, appris_candidate, or CCDS are considered canonical.
450 </help>
451 <option value="coverage">coverage</option>
452 <option value="provided">provided</option>
453 <option value="canonical">canonical</option>
454 </param>
455 <param argument="--minConfidenceForCircosPlot" type="select" optional="true" label="Transcript selection">
456 <help>The fusion of interest is drawn as a solid line in the circos plot.
457 To give an impression of the overall degree of rearrangement,
458 all other fusions are drawn as semi-transparent lines in the background.
459 This option determines which other fusions should be included in the circos plot.
460 Values specify the minimum confidence a fusion must have to be included.
461 It usually makes no sense to include low-confidence fusions in circos plots,
462 because they are abundant and unreliable, and would clutter up the circos plot.
463 Default: medium
464 </help>
465 <option value="none">none - only the fusion of interest is drawn</option>
466 <option value="low">low</option>
467 <option value="medium">medium</option>
468 <option value="high">high</option>
469 </param>
470 <param argument="--showIntergenicVicinity" type="integer" value="" min="0" optional="true" label="Intergenic Vicinity">
471 <help>This option only applies to intergenic breakpoints.
472 If it is set to a value greater than 0, then the script draws the genes
473 which are no more than the given distance away from an intergenic breakpoint.
474 Note that this option is incompatible with squishIntrons.
475 Default: 0
476 </help>
477 </param>
478 <param argument="--squishIntrons" type="select" optional="true" label="Squish introns">
479 <help>Exons usually make up only a small fraction of a gene.
480 They may be hard to see in the plot. i
481 Since introns are in most situations of no interest in the context of gene fusions,
482 this switch can be used to shrink the size of introns to a fixed, negligible size.
483 It makes sense to disable this feature, if breakpoints in introns are of importance.
484 Default: TRUE
485 </help>
486 <option value="TRUE">True</option>
487 <option value="FALSE">False</option>
488 </param>
489
490 <param argument="--mergeDomainsOverlappingBy" type="float" value="" min="0." max="1.0" optional="true" label="Merge Domains Overlapping By">
491 <help>Occasionally, domains are annotated redundantly.
492 For example, tyrosine kinase domains are frequently annotated as
493 Protein tyrosine kinase and Protein kinase domain.
494 In order to simplify the visualization, such domains can be merged into one,
495 given that they overlap by the given fraction.
496 The description of the larger domain is used.
497 Default: 0.9
498 </help>
499 </param>
500 <param argument="--printExonLabels" type="select" optional="true" label="Print Exon Labels">
501 <help>By default the number of an exon is printed inside each exon,
502 which is taken from the attribute exon_number of the GTF annotation.
503 When a gene has many exons, the boxes may be too narrow to contain the labels,
504 resulting in unreadable exon labels. In these situations, i
505 it may be better to turn off exon labels.
506 Default: TRUE
507 </help>
508 <option value="TRUE">True</option>
509 <option value="FALSE">False</option>
510 </param>
511 <param argument="--render3dEffect" type="select" optional="true" label="Render 3D effect">
512 <help>Whether light and shadow should be rendered to give objects a 3D effect.
513 Default: TRUE
514 </help>
515 <option value="TRUE">True</option>
516 <option value="FALSE">False</option>
517 </param>
518 <param argument="--optimizeDomainColors" type="select" optional="true" label="Optimize Domain Colors">
519 <help>By default, the script colorizes domains according to the colors
520 specified in the file given in --annotation.
521 This way, coloring of domains is consistent across all proteins.
522 But since there are more distinct domains than colors,
523 this can lead to different domains having the same color.
524 If this option is set to TRUE, the colors are recomputed for each fusion separately.
525 This ensures that the colors have the maximum distance for each individual fusion,
526 but they are no longer consistent across different fusions.
527 Default: FALSE
528 </help>
529 <option value="TRUE">True</option>
530 <option value="FALSE">False</option>
531 </param>
532 <param argument="--color1" type="color" value="" optional="true" label="Color of the 5' end of the fusion."/>
533 <param argument="--color2" type="color" value="" optional="true" label="Color of the 3' end of the fusion."/>
534 <param argument="--pdfWidth" type="float" value="" min="1." optional="true" label="Width of PDF output file in inches"
535 help="Default: 11.692"/>
536 <param argument="--pdfHeight" type="float" value="" min="1." optional="true" label="Height of PDF output file in inches"
537 help="Default: 8.267"/>
538 <param argument="--fontSize" type="float" value="" min="0." optional="true" label="Scale the size of text"
539 help="Default: 1.0"/>
540 </section>
541
542 </when> 388 </when>
543 <when value="no"/> 389 <when value="no"/>
544 </conditional> 390 </conditional>
545 391
546 </inputs> 392 </inputs>
547 <outputs> 393 <outputs>
548 <data name="fusions" format="tabular" label="${tool.name} on ${on_string}: fusions.tsv" from_work_dir="fusions.tsv"/> 394 <data name="fusions_tsv" format="tabular" label="${tool.name} on ${on_string}: fusions.tsv" from_work_dir="fusions.tsv"/>
549 <data name="discarded" format="tabular" label="${tool.name} on ${on_string}: fusions.discarded.tsv" from_work_dir="fusions.discarded.tsv"> 395 <data name="discarded_fusions_tsv" format="tabular" label="${tool.name} on ${on_string}: fusions.discarded.tsv" from_work_dir="fusions.discarded.tsv">
550 <filter> output_fusions_discarded == "yes"</filter> 396 <filter> output_fusions_discarded == "yes"</filter>
551 </data> 397 </data>
552 <data name="aligned_bam" format="bam" label="${tool.name} on ${on_string}: Aligned.bam" from_work_dir="Aligned.sortedByCoord.out.bam"> 398 <data name="aligned_bam" format="bam" label="${tool.name} on ${on_string}: Aligned.bam" from_work_dir="Aligned.sortedByCoord.out.bam">
553 <filter>input_params['input_source'] == "use_fastq"</filter> 399 <filter>input_params['input_source'] == "use_fastq"</filter>
554 </data> 400 </data>
562 <conditional name="input_params"> 408 <conditional name="input_params">
563 <param name="input_source" value="use_star"/> 409 <param name="input_source" value="use_star"/>
564 <param name="input" ftype="sam" value="Aligned.out.sam"/> 410 <param name="input" ftype="sam" value="Aligned.out.sam"/>
565 </conditional> 411 </conditional>
566 <param name="genome_assembly" ftype="fasta" value="genome.fasta"/> 412 <param name="genome_assembly" ftype="fasta" value="genome.fasta"/>
567 <param name="gtf" ftype="gtf" value="genome.gtf"/> 413 <param name="annotation" ftype="gtf" value="genome.gtf"/>
568 <param name="protein_domains" ftype="gff3" value="protein_domains.gff3"/> 414 <param name="protein_domains" ftype="gff3" value="protein_domains.gff3"/>
569 <conditional name="visualization"> 415 <conditional name="visualization">
570 <param name="do_viz" value="no"/> 416 <param name="do_viz" value="no"/>
571 <param name="cytobands" ftype="tabular" value="cytobands.tsv"/> 417 <param name="cytobands" ftype="tabular" value="cytobands.tsv"/>
572 </conditional> 418 </conditional>
573 <output name="fusions"> 419 <output name="fusions_tsv">
574 <assert_contents> 420 <assert_contents>
575 <has_text_matching expression="BCR\tABL1"/> 421 <has_text_matching expression="BCR\tABL1"/>
576 </assert_contents> 422 </assert_contents>
577 </output> 423 </output>
578 </test> 424 </test>
581 <conditional name="input_params"> 427 <conditional name="input_params">
582 <param name="input_source" value="use_star"/> 428 <param name="input_source" value="use_star"/>
583 <param name="input" ftype="sam" value="Aligned.out.sam"/> 429 <param name="input" ftype="sam" value="Aligned.out.sam"/>
584 </conditional> 430 </conditional>
585 <param name="genome_assembly" ftype="fasta" value="genome.fasta"/> 431 <param name="genome_assembly" ftype="fasta" value="genome.fasta"/>
586 <param name="gtf" ftype="gtf" value="genome.gtf"/> 432 <param name="annotation" ftype="gtf" value="genome.gtf"/>
433 <param name="protein_domains" ftype="gff3" value="protein_domains.gff3"/>
587 <conditional name="visualization"> 434 <conditional name="visualization">
588 <param name="do_viz" value="yes"/> 435 <param name="do_viz" value="yes"/>
436 <param name="cytobands" ftype="tabular" value="cytobands.tsv"/>
589 </conditional> 437 </conditional>
590 <output name="fusions"> 438 <output name="fusions_tsv">
591 <assert_contents> 439 <assert_contents>
592 <has_text_matching expression="BCR\tABL1"/> 440 <has_text_matching expression="BCR\tABL1"/>
441 </assert_contents>
442 </output>
443 <output name="fusions_pdf">
444 <assert_contents>
445 <has_size value= "64000" delta="5000" />
593 </assert_contents> 446 </assert_contents>
594 </output> 447 </output>
595 </test> 448 </test>
596 449
597 </tests> 450 </tests>