Mercurial > repos > iuc > multiqc
changeset 16:bf675f34b056 draft
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/multiqc commit bd94f00ad5d023ae392ca8fc2378fd5a78bed875"
author | iuc |
---|---|
date | Sat, 16 May 2020 09:40:45 -0400 |
parents | 3d93dd18d9f8 |
children | 5e33b465d8d5 |
files | multiqc.xml test-data/genome_results.txt test-data/qualimap_bamqc_genome_results.tabular |
diffstat | 3 files changed, 179 insertions(+), 3 deletions(-) [+] |
line wrap: on
line diff
--- a/multiqc.xml Sat Jan 18 03:08:54 2020 -0500 +++ b/multiqc.xml Sat May 16 09:40:45 2020 -0400 @@ -1,7 +1,7 @@ -<tool id="multiqc" name="MultiQC" version="@WRAPPER_VERSION@.1"> +<tool id="multiqc" name="MultiQC" version="@WRAPPER_VERSION@+galaxy0"> <description>aggregate results from bioinformatics analyses into a single report</description> <macros> - <token name="@WRAPPER_VERSION@">1.7</token> + <token name="@WRAPPER_VERSION@">1.8</token> <token name="@ESCAPE_IDENTIFIER@"> <![CDATA[ #set identifier = re.sub('[^\s\w\-]', '_', str($file.element_identifier)) @@ -272,6 +272,28 @@ #elif str($repeat.software_cond.software) == "prokka" #set $pattern = "contigs:" @LN_FILES@ + #elif str($repeat.software_cond.software) == "qualimap" + #for $file in $repeat.software_cond.input + #if re.search("genome_results", str($file.element_identifier)) + sample="\$(grep 'bam file = ' $file | sed 's/bam file = //g' | sed 's: ::g')" && + dir_name="$software_dir/\${sample}" && + mkdir -p \${dir_name} && + filepath_1="\${dir_name}/genome_results.txt" && + ln -sf '$file' \${filepath_1} && + #elif re.search("coverage_histogram", str($file.element_identifier)) + nested_dir_name="\${dir_name}/raw_data_qualimapReport/" && + mkdir -p \${nested_dir_name} && + filepath_2="\${nested_dir_name}/coverage_histogram.txt" && + ln -sf '$file' \${filepath_2} && + #elif re.search("gc-content_distribution", str($file.element_identifier)) + nested_dir_name="\${dir_name}/raw_data_qualimapReport/" && + mkdir -p \${nested_dir_name} && + filepath_3="\${nested_dir_name}/mapped_reads_gc-content_distribution.txt" && + ln -sf '$file' \${filepath_3} && + #else + #pass + #end if + #end for #elif str($repeat.software_cond.software) == "quast" #for $k, $file in enumerate($repeat.software_cond.input) #set file_dir = os.path.join($software_dir, 'file_' + str($k)) @@ -499,6 +521,7 @@ <!--<option value="bbmap">BBMap</option>--> <option value="bcftools">Bcftools</option> <!--<option value="bcl2fastq">bcl2fastq</option>--> + <!--<option value="biobambam2">biobambam2</option>--> <!--<option value="biobloomtools">BioBloom Tools</option>--> <option value="bismark">Bismark</option> <!--<option value="bowtie1">Bowtie 1</option>--> @@ -515,6 +538,7 @@ <option value="fastp">fastp</option> <option value="fastqc">FastQC</option> <option value="featureCounts">featureCounts</option> + <!--<option value="fgbio">fgbio</option>--> <option value="flexbar">Flexbar</option> <option value="gatk">GATK</option> <!--<option value="goleft_indexcov">goleft indexcov</option>--> @@ -529,12 +553,14 @@ <!--<option value="leehom">leeHom</option>--> <option value="macs2">MACS2</option> <!--<option value="methylQA">methylQA</option>--> + <!--<option value="mosdepth">mostdepth</option>--> + <!--<option value="mtnucratio">mtnucratio</option>--> <!--<option value="peddy">Peddy</option>--> <option value="picard">Picard</option> <!--<option value="preseq">Preseq</option>--> <option value="prokka">Prokka</option> <!--<option value="qorts">QoRTs</option>--> - <!--<option value="qualimap">Qualimap (BamQC or RNASeq output)</option>--> + <option value="qualimap">Qualimap (BamQC or RNASeq output)</option> <option value="quast">QUAST</option> <!--<option value="rna_seqc">RNA-SeQC</option>--> <!--<option value="rsem">RSEM (rsem-calculate-regex output)</option>--> @@ -543,6 +569,8 @@ <option value="samblaster">Samblaster</option> <option value="samtools">Samtools</option> <!--<option value="sargasso">Sargasso</option>--> + <!--<option value="seqyclean">SeqyClean</option>--> + <!--<option value="sexdeterrmine">SexDetErrmine</option>--> <!--<option value="skewer">Skewer</option>--> <option value="slamdunk">Slamdunk</option> <option value="snpeff">SnpEff</option> @@ -663,6 +691,9 @@ <when value="prokka"> <param name="input" type="data" format="txt" multiple="true" label="Output of Prokka" help="It should contain 'contigs:'"/> </when> + <when value="qualimap"> + <param name="input" type="data" format="txt,tabular,tsv" multiple="true" label="Output of Qualimap BamQC" help="First result input should be genome_coverage (default from tool output). Run the Flatten Collection tool to keep all output in one report" /> + </when> <when value="quast"> <param name="input" type="data" format="tabular,tsv" multiple="true" label="Output of Quast"/> </when> @@ -1100,6 +1131,12 @@ </repeat> <repeat name="results"> <conditional name="software_cond"> + <param name="software" value="qualimap" /> + <param name="input" value="genome_results.txt" /> + </conditional> + </repeat> + <repeat name="results"> + <conditional name="software_cond"> <param name="software" value="quast" /> <param name="input" value="quast.tsv" /> </conditional> @@ -1177,6 +1214,7 @@ <has_text text="picard-insertsize" /> <has_text text="picard-gcbias" /> <has_text text="prokka_plot" /> + <has_text text="qualimap" /> <has_text text="samblaster_duplicates" /> <has_text text="quast-stats" /> <has_text text="samtools-flagstat-dp" /> @@ -1197,6 +1235,7 @@ <element name="picard_dups" file="picard_dups_stats.tabular" compare="sim_size" delta="0"/> <element name="picard_insertSize" file="picard_insertSize_stats.tabular" compare="sim_size" delta="0"/> <element name="prokka" file="prokka_stats.tabular" compare="sim_size" delta="0"/> + <element name="qualimap_bamqc_genome_results" file="qualimap_bamqc_genome_results.tabular" compare="sim_size" delta="0"/> <element name="quast" file="quast_stats.tabular" compare="sim_size" delta="0"/> <element name="samblaster" file="samblaster_stats.tabular" compare="sim_size" delta="0"/> <element name="samtools_flagstat">
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/genome_results.txt Sat May 16 09:40:45 2020 -0400 @@ -0,0 +1,135 @@ +BamQC report +----------------------------------- + +>>>>>>> Input + + bam file = x_bam + outfile = results/genome_results.txt + + +>>>>>>> Reference + + number of bases = 1,817,261 bp + number of contigs = 1 + + +>>>>>>> Globals + + number of windows = 400 + + number of reads = 1,248,774 + number of mapped reads = 1,242,183 (99.47%) + number of supplementary alignments = 3,386 (0.27%) + number of secondary alignments = 0 + + number of mapped paired reads (first in pair) = 623,192 + number of mapped paired reads (second in pair) = 618,991 + number of mapped paired reads (both in pair) = 1,237,764 + number of mapped paired reads (singletons) = 4,419 + number of overlapping read pairs = 463,596 + + number of mapped bases = 366,875,582 bp + number of sequenced bases = 366,823,893 bp + number of aligned bases = 0 bp + number of duplicated reads (estimated) = 673,527 + duplication rate = 47.01% + + +>>>>>>> Insert size + + mean insert size = 1,097.678 + std insert size = 27,365.2401 + median insert size = 524 + + +>>>>>>> Mapping quality + + mean mapping quality = 58.4552 + + +>>>>>>> ACTG content + + number of A's = 109,576,306 bp (29.87%) + number of C's = 73,524,910 bp (20.04%) + number of T's = 111,308,231 bp (30.34%) + number of G's = 72,414,446 bp (19.74%) + number of N's = 0 bp (0%) + + GC percentage = 39.78% + + +>>>>>>> Mismatches and indels + + general error rate = 0.0098 + number of mismatches = 3,560,959 + number of insertions = 7,229 + mapped reads with insertion percentage = 0.56% + number of deletions = 14,669 + mapped reads with deletion percentage = 1.15% + homopolymer indels = 46.92% + + +>>>>>>> Coverage + + mean coverageData = 201.8838X + std coverageData = 112.2733X + paired-end adapted mean coverage = 177.4988X + + There is a 99.81% of reference with a coverageData >= 1X + There is a 99.77% of reference with a coverageData >= 2X + There is a 99.74% of reference with a coverageData >= 3X + There is a 99.7% of reference with a coverageData >= 4X + There is a 99.66% of reference with a coverageData >= 5X + There is a 99.6% of reference with a coverageData >= 6X + There is a 99.53% of reference with a coverageData >= 7X + There is a 99.41% of reference with a coverageData >= 8X + There is a 99.3% of reference with a coverageData >= 9X + There is a 99.21% of reference with a coverageData >= 10X + There is a 99.11% of reference with a coverageData >= 11X + There is a 98.99% of reference with a coverageData >= 12X + There is a 98.87% of reference with a coverageData >= 13X + There is a 98.76% of reference with a coverageData >= 14X + There is a 98.63% of reference with a coverageData >= 15X + There is a 98.5% of reference with a coverageData >= 16X + There is a 98.35% of reference with a coverageData >= 17X + There is a 98.16% of reference with a coverageData >= 18X + There is a 97.97% of reference with a coverageData >= 19X + There is a 97.79% of reference with a coverageData >= 20X + There is a 97.59% of reference with a coverageData >= 21X + There is a 97.37% of reference with a coverageData >= 22X + There is a 97.16% of reference with a coverageData >= 23X + There is a 96.95% of reference with a coverageData >= 24X + There is a 96.71% of reference with a coverageData >= 25X + There is a 96.48% of reference with a coverageData >= 26X + There is a 96.24% of reference with a coverageData >= 27X + There is a 95.99% of reference with a coverageData >= 28X + There is a 95.73% of reference with a coverageData >= 29X + There is a 95.49% of reference with a coverageData >= 30X + There is a 95.23% of reference with a coverageData >= 31X + There is a 94.99% of reference with a coverageData >= 32X + There is a 94.75% of reference with a coverageData >= 33X + There is a 94.51% of reference with a coverageData >= 34X + There is a 94.27% of reference with a coverageData >= 35X + There is a 94.01% of reference with a coverageData >= 36X + There is a 93.8% of reference with a coverageData >= 37X + There is a 93.55% of reference with a coverageData >= 38X + There is a 93.31% of reference with a coverageData >= 39X + There is a 93.04% of reference with a coverageData >= 40X + There is a 92.77% of reference with a coverageData >= 41X + There is a 92.52% of reference with a coverageData >= 42X + There is a 92.27% of reference with a coverageData >= 43X + There is a 91.99% of reference with a coverageData >= 44X + There is a 91.72% of reference with a coverageData >= 45X + There is a 91.44% of reference with a coverageData >= 46X + There is a 91.17% of reference with a coverageData >= 47X + There is a 90.9% of reference with a coverageData >= 48X + There is a 90.64% of reference with a coverageData >= 49X + There is a 90.4% of reference with a coverageData >= 50X + There is a 90.15% of reference with a coverageData >= 51X + + +>>>>>>> Coverage per contig + + NZ_CP031250.1 1817261 366875582 201.88381415768015 112.27329056357358 + +
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/qualimap_bamqc_genome_results.tabular Sat May 16 09:40:45 2020 -0400 @@ -0,0 +1,2 @@ +Sample bam_file total_reads mapped_reads mapped_bases sequenced_bases mean_insert_size median_insert_size mean_mapping_quality general_error_rate percentage_aligned +x_bam x_bam 1248774.0 1242183.0 366875582.0 366823893.0 1097.678 524.0 58.4552 0.0098 99.4722023360512