comparison macros.xml @ 2:cb2fc9f60381 draft

"planemo upload for repository https://github.com/galaxyproteomics/tools-galaxyp/tree/master/tools/drep commit eaae9983f0339c4624431f4f843e319f83814490"
author jjohnson
date Wed, 08 Jan 2020 13:01:03 -0500
parents 7e2debc267eb
children 3f7c9be3edde
comparison
equal deleted inserted replaced
1:7e2debc267eb 2:cb2fc9f60381
311 <data name="Chdb" format="tabular" label="${tool.name} on ${on_string}: Chdb.tsv" from_work_dir="outdir/data/checkM/checkM_outdir/Chdb.tsv"> 311 <data name="Chdb" format="tabular" label="${tool.name} on ${on_string}: Chdb.tsv" from_work_dir="outdir/data/checkM/checkM_outdir/Chdb.tsv">
312 <filter>'Chdb' in select_outputs</filter> 312 <filter>'Chdb' in select_outputs</filter>
313 </data> 313 </data>
314 </xml> 314 </xml>
315 315
316
317 <xml name="test_defaults_log">
318 <test>
319 <param name="genomes" ftype="fasta" value="Enterococcus_casseliflavus_EC20.fasta,Enterococcus_faecalis_T2.fna,Enterococcus_faecalis_TX0104.fa"/>
320 <output name="log">
321 <assert_contents>
322 <yield/>
323 </assert_contents>
324 </output>
325 </test>
326 </xml>
327
316 <token name="@GENOMES_HELP@"><![CDATA[ 328 <token name="@GENOMES_HELP@"><![CDATA[
317 I/O PARAMETERS: 329 I/O PARAMETERS:
318 -g [GENOMES [GENOMES ...]], --genomes [GENOMES [GENOMES ...]] 330 -g [GENOMES [GENOMES ...]], --genomes [GENOMES [GENOMES ...]]
319 genomes to cluster in .fasta format (default: None) 331 genomes to cluster in .fasta format
332 (default: None)
333
334
320 ]]></token> 335 ]]></token>
321 336
322 <token name="@FILTERING_HELP@"><![CDATA[ 337 <token name="@FILTERING_HELP@"><![CDATA[
323 FILTERING OPTIONS: 338 FILTERING OPTIONS:
324 -l LENGTH, --length LENGTH 339 -l LENGTH, --length LENGTH
325 Minimum genome length (default: 50000) 340 Minimum genome length
341 (default: 50000)
342
343
326 -comp COMPLETENESS, --completeness COMPLETENESS 344 -comp COMPLETENESS, --completeness COMPLETENESS
327 Minumum genome completeness (default: 75) 345 Minumum genome completeness
346 (default: 75)
347
348
328 -con CONTAMINATION, --contamination CONTAMINATION 349 -con CONTAMINATION, --contamination CONTAMINATION
329 Maximum genome contamination (default: 25) 350 Maximum genome contamination
351 (default: 25)
352
353
330 --ignoreGenomeQuality 354 --ignoreGenomeQuality
331 Don't run checkM or do any quality filtering. NOT 355 Don't run checkM or do any quality filtering. NOT
332 RECOMMENDED! This is useful for use with 356 RECOMMENDED! This is useful for use with
333 bacteriophages or eukaryotes or things where checkM 357 bacteriophages or eukaryotes or things where checkM
334 scoring does not work. Will only choose genomes based 358 scoring does not work. Will only choose genomes based
339 363
340 <token name="@GENOME_COMPARISON_HELP@"><![CDATA[ 364 <token name="@GENOME_COMPARISON_HELP@"><![CDATA[
341 GENOME COMPARISON PARAMETERS: 365 GENOME COMPARISON PARAMETERS:
342 -ms MASH_SKETCH, --MASH_sketch MASH_SKETCH 366 -ms MASH_SKETCH, --MASH_sketch MASH_SKETCH
343 MASH sketch size (default: 1000) 367 MASH sketch size (default: 1000)
368
344 --S_algorithm {goANI,ANIn,ANImf,gANI} 369 --S_algorithm {goANI,ANIn,ANImf,gANI}
345 Algorithm for secondary clustering comaprisons: 370 Algorithm for secondary clustering comaprisons:
346 ANImf = (RECOMMENDED) Align whole genomes with nucmer; filter alignment; compare aligned regions 371 ANImf = (RECOMMENDED) Align whole genomes with nucmer; filter alignment; compare aligned regions
347 ANIn = Align whole genomes with nucmer; compare aligned regions 372 ANIn = Align whole genomes with nucmer; compare aligned regions
348 gANI = Identify and align ORFs; compare aligned ORFS 373 gANI = Identify and align ORFs; compare aligned ORFS
349 (default: ANImf) 374 (default: ANImf)
375
350 -n_PRESET {normal,tight} 376 -n_PRESET {normal,tight}
351 Presets to pass to nucmer 377 Presets to pass to nucmer
352 tight = only align highly conserved regions 378 tight = only align highly conserved regions
353 normal = default ANIn parameters (default: normal) 379 normal = default ANIn parameters (default: normal)
354 380
358 CLUSTERING PARAMETERS: 384 CLUSTERING PARAMETERS:
359 -pa P_ANI, --P_ani P_ANI 385 -pa P_ANI, --P_ani P_ANI
360 ANI threshold to form primary (MASH) clusters 386 ANI threshold to form primary (MASH) clusters
361 (default: 0.9) 387 (default: 0.9)
362 -sa S_ANI, --S_ani S_ANI 388 -sa S_ANI, --S_ani S_ANI
363 ANI threshold to form secondary clusters (default: 389 ANI threshold to form secondary clusters
364 0.99) 390 (default: 0.99)
391
365 --SkipMash Skip MASH clustering, just do secondary clustering on 392 --SkipMash Skip MASH clustering, just do secondary clustering on
366 all genomes (default: False) 393 all genomes (default: False)
367 --SkipSecondary Skip secondary clustering, just perform MASH 394 --SkipSecondary Skip secondary clustering, just perform MASH clustering
368 clustering (default: False) 395 (default: False)
396
369 -nc COV_THRESH, --cov_thresh COV_THRESH 397 -nc COV_THRESH, --cov_thresh COV_THRESH
370 Minmum level of overlap between genomes when doing 398 Minmum level of overlap between genomes when doing
371 secondary comparisons (default: 0.1) 399 secondary comparisons (default: 0.1)
372 -cm {total,larger}, --coverage_method {total,larger} 400 -cm {total,larger}, --coverage_method {total,larger}
373 Method to calculate coverage of an alignment 401 Method to calculate coverage of an alignment
374 (for ANIn/ANImf only; gANI can only do larger method) 402 (for ANIn/ANImf only; gANI can only do larger method)
375 total = 2*(aligned length) / (sum of total genome lengths) 403 total = 2*(aligned length) / (sum of total genome lengths)
376 larger = max((aligned length / genome 1), (aligned_length / genome2)) 404 larger = max((aligned length / genome 1), (aligned_length / genome2))
377 (default: larger) 405 (default: larger)
406
378 --clusterAlg CLUSTERALG 407 --clusterAlg CLUSTERALG
379 Algorithm used to cluster genomes (passed to 408 Algorithm used to cluster genomes (passed to
380 scipy.cluster.hierarchy.linkage (default: average) 409 scipy.cluster.hierarchy.linkage (default: average)
381 410
382 ]]></token> 411 ]]></token>
396 -N50W N50_WEIGHT, --N50_weight N50_WEIGHT 425 -N50W N50_WEIGHT, --N50_weight N50_WEIGHT
397 weight of log(genome N50) (default: 0.5) 426 weight of log(genome N50) (default: 0.5)
398 -sizeW SIZE_WEIGHT, --size_weight SIZE_WEIGHT 427 -sizeW SIZE_WEIGHT, --size_weight SIZE_WEIGHT
399 weight of log(genome size) (default: 0) 428 weight of log(genome size) (default: 0)
400 429
430
401 ]]></token> 431 ]]></token>
402 432
403 <token name="@TAXONOMY_HELP@"><![CDATA[ 433 <token name="@TAXONOMY_HELP@"><![CDATA[
404 TAXONOMY: 434 TAXONOMY:
405 --run_tax generate taxonomy information (Tdb) (default: False) 435 --run_tax generate taxonomy information (Tdb)
436 (default: False)
437
406 --tax_method {percent,max} 438 --tax_method {percent,max}
407 Method of determining taxonomy 439 Method of determining taxonomy
408 percent = The most descriptive taxonimic level with at least (per) hits 440 percent = The most descriptive taxonimic level with at least (per) hits
409 max = The centrifuge taxonomic level with the most overall hits (default: percent) 441 max = The centrifuge taxonomic level with the most overall hits
442 (default: percent)
443
444
410 -per PERCENT, --percent PERCENT 445 -per PERCENT, --percent PERCENT
411 minimum percent for percent method (default: 50) 446 minimum percent for percent method
447 (default: 50)
448
449
412 --cent_index CENT_INDEX 450 --cent_index CENT_INDEX
413 path to centrifuge index (for example, 451 path to centrifuge index (for example,
414 /home/mattolm/download/centrifuge/indices/b+h+v 452 /home/mattolm/download/centrifuge/indices/b+h+v
415 (default: None) 453 (default: None)
416 454