Mercurial > repos > artbio > sr_bowtie_dataset_annotation
changeset 10:fd4a60fc3fca draft default tip
planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/sr_bowtie_dataset_annotation commit cf30b4fab90cf7910bb2900a05b85ca3344aae59
author | artbio |
---|---|
date | Tue, 15 Nov 2022 00:45:36 +0000 |
parents | 6bf9de09aa74 |
children | |
files | barplot.r sr_bowtie_dataset_annotation.xml test-data/unmatched_6.fa |
diffstat | 3 files changed, 544 insertions(+), 14 deletions(-) [+] |
line wrap: on
line diff
--- a/barplot.r Mon Apr 11 00:27:41 2022 +0000 +++ b/barplot.r Tue Nov 15 00:45:36 2022 +0000 @@ -1,13 +1,13 @@ if (length(commandArgs(TRUE)) == 0) { - system("Rscript barplot.r -h", intern = F) + system("Rscript barplot.r -h", intern = FALSE) q("no") } # load packages that are provided in the conda env -options(show.error.messages = F, +options(show.error.messages = FALSE, error = function() { cat(geterrmessage(), file = stderr()) - q("no", 1, F) + q("no", 1, FALSE) } ) loc <- Sys.setlocale("LC_MESSAGES", "en_US.UTF-8") @@ -35,7 +35,7 @@ opt <- parse_args(OptionParser(option_list = option_list), args = commandArgs(trailingOnly = TRUE)) -annotations <- read.delim(opt$input, header = F) +annotations <- read.delim(opt$input, header = FALSE) colnames(annotations) <- c("sample", "class", "percent_of_reads", "total") annotations$percent <- round(annotations$percent_of_reads / annotations$total * 100, digits = 2) @@ -51,7 +51,7 @@ geom_bar(position = "fill", stat = "identity") + facet_wrap(~sample, ncol = 3) + geom_label_repel(aes(label = percent), position = position_fill(vjust = 0.5), - size = 2, show.legend = F) + + size = 2, show.legend = FALSE) + coord_polar(theta = "y") + labs(x = "Class fractions (%)") + scale_fill_manual(values = mycolors) +
--- a/sr_bowtie_dataset_annotation.xml Mon Apr 11 00:27:41 2022 +0000 +++ b/sr_bowtie_dataset_annotation.xml Tue Nov 15 00:45:36 2022 +0000 @@ -1,4 +1,4 @@ -<tool id="sr_bowtie_dataset_annotation" name="Annotate smRNA dataset" version="2.7"> +<tool id="sr_bowtie_dataset_annotation" name="Annotate smRNA dataset" version="2.8"> <description>by iterative alignments with sRbowtie</description> <requirements> <requirement type="package" version="1.3.1">bowtie</requirement> @@ -8,14 +8,14 @@ </requirements> <command detect_errors="exit_code"><![CDATA[ #if $refGenomeSource1.genomeSource == "history": - bowtie-build -f $refGenomeSource1.ownFile genome 1>/dev/null && + bowtie-build --threads \${GALAXY_SLOTS:-4} -f $refGenomeSource1.ownFile genome 1>/dev/null && #set index_path = 'genome' #else: #set index_path = $refGenomeSource1.index.fields.path #end if #for $i in $AdditionalQueries: - bowtie-build -f $i.ownFile $i.ownFile.name 1>/dev/null && + bowtie-build --threads \${GALAXY_SLOTS:-4} -f $i.ownFile $i.ownFile.name 1>/dev/null && #end for #set method_prefix = "-v %s -k 1 --best" % str($mismatches) @@ -121,11 +121,11 @@ <output name="output" ftype="tabular" file="multisample5_output.tab" /> <output name="barplot" ftype="pdf" file="multisample5_output.pdf" compare="sim_size" delta="500" /> <output_collection name="unmatched" type="list" count="5"> - <element name="sample5.fa_unmatched" file="unmatched_5.fa" ftype="fasta"/> - <element name="sample4.fa_unmatched" file="unmatched_4.fa" ftype="fasta"/> - <element name="sample3.fa_unmatched" file="unmatched_3.fa" ftype="fasta"/> - <element name="sample2.fa_unmatched" file="unmatched_2.fa" ftype="fasta"/> - <element name="sample1.fa_unmatched" file="unmatched_1.fa" ftype="fasta"/> + <element name="sample5.fa_unmatched" file="unmatched_5.fa" ftype="fasta" compare="sim_size" delta="0"/> + <element name="sample4.fa_unmatched" file="unmatched_4.fa" ftype="fasta" compare="sim_size" delta="0"/> + <element name="sample3.fa_unmatched" file="unmatched_3.fa" ftype="fasta" compare="sim_size" delta="0"/> + <element name="sample2.fa_unmatched" file="unmatched_2.fa" ftype="fasta" compare="sim_size" delta="0"/> + <element name="sample1.fa_unmatched" file="unmatched_1.fa" ftype="fasta" compare="sim_size" delta="0"/> </output_collection> </test> <test> @@ -137,7 +137,7 @@ <output name="output" ftype="tabular" file="sample1_output.tab" /> <output name="barplot" ftype="pdf" file="sample1_output.pdf" compare="sim_size" delta="500"/> <output_collection name="unmatched" type="list"> - <element name="sample1.fa_unmatched" file="unmatched_1.fa" ftype="fasta"/> + <element name="sample1.fa_unmatched" file="unmatched_6.fa" ftype="fasta" compare="sim_size" delta="0"/> </output_collection> </test> <test>
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/unmatched_6.fa Tue Nov 15 00:45:36 2022 +0000 @@ -0,0 +1,530 @@ +>25207 +TCGCACTAGCTTCGGTCGTCTCGGA +>25229 +TCTGTTCGAGGTTCTTTATTTGAA +>25283 +TAAGGGAGCGAGATCGTTCGATGCA +>25363 +TAGTGTTGGGTGTAGGCCAGGGAG +>25376 +TCCGCCGACAATGTTGCAACATGA +>25435 +TTTCTTCAAGCTGCGCGTTTTTCGG +>25593 +TCGAAAACTTCTTCGCACTCTTCGTT +>25660 +TCTCGCTGCGTGAACGATGAAGGC +>25968 +TTTGCTAGGACTGCTGCATAAG +>26220 +GCCCGTGTCGATGAATGCTTCAAACT +>26261 +TATTATCGTCCGCTGCTAAACTGC +>26543 +CTTATGTATAAAAAGCTCTGATGGA +>26610 +TCCTTAAGTTCGTTGATTTGGGCT +>26675 +CAATATCGTCAACATCCTCGAACGAT +>26873 +TTGGGAGCTGAATCCCGTTACGGTA +>26978 +CGCGCATTAGCTCAAATCTAGTTGGA +>27220 +TGTTTATTTGTCAAGTTTAGATAATA +>27397 +TAGTTCACAGCTGTATGTCCAGATGGGT +>27869 +TATGGTCCAGAATGTAGCCTCGGC +>27878 +TATTAATCGGGCCACAAATATCGGTA +>28035 +GGTATTCTTTGCGAGGTCGTCCTGG +>28154 +AAAGACGAGAACGCGTATATGTGTGC +>28319 +TGACCAACCTTAAAAGATCGGGGT +>28387 +TATTACTATTTCTAAGCTTTGTTTAAA +>28594 +TTTTGAGGTTGGTCAAGAAGTTGTT +>28608 +TAAGATTGAAAATTACTGTGGAGT +>28668 +TACAGATTCTAGAGACAAAGACGC +>28674 +TAAGTACATGCGCCCAGCCGCCGTGA +>28836 +TCTGGTTAAGGTCGGAATACTCGTCT +>29056 +TGCTTTACATACCCTTTGGTGCCC +>29323 +TTTTGCTGCAGAGCTTCTTCCAACGT +>29342 +TATGTATGGATATGTATATTTATGGT +>29387 +TGATAATCGACCTCTTCCATCGTTGT +>29423 +TCTAAGAACTTCTGAGGTGAAGG +>29462 +TGCATTTCAATCGGAAGAGTACTCTG +>29492 +TAAAACACAAATCTCGACATACAGA +>29703 +GTACAGGTTCTGATGACAATG +>29785 +TCAGATGAAAGACAAATTAGAATT +>30053 +TAAGAACTTCTGAGATGAAGGGC +>30096 +TGGATATTGAATGTTTTTGATTTGC +>30136 +TGTAGTCGTCGTATGTCCGGA +>30272 +TGCATTCGTGGATTCGCATTCGAGA +>30497 +TGACAAAATATGCCCTTCACCTCAGA +>30787 +TAACTGTTTTTAGTTCAAAGTCTCGGA +>30836 +TAAATATTTTTTTTGAAACA +>30977 +CGACTGTAATTATTAGCACAATACT +>30985 +GACGATATTGCTGCAATAGACCTTGA +>31000 +TCAGATGAGAGACAAATTAGAAT +>31256 +TAATTCGGAATGCCTGCTCTACT +>31417 +TCAATGATCGCTGTGCTCAGTAGGA +>31506 +TTTGTCTGACGTTAAAAAATATA +>31567 +TCCACATTAGGAGGATTATTAGACAAC +>31790 +AAACATAATAATTGATGGCGGAAGA +>31872 +AAGGTAATCATAGAGCACCACGGTT +>32157 +TTTCTGTGAATTCACATGCTGATGA +>32192 +TTTCTCATGTATAAAATGCTCTGATGG +>32223 +TATCTTGTTATTCTAGTGTCTTTGGTT +>32338 +TGTGGGACTCGAGCCAAAATGGCAACCT +>32497 +TGCGGTTGGACAATTTTTTTTTTATA +>32506 +TTGTTGTTTGGAGGAAGTTCCTTT +>32510 +TCTTCCGCCATCAATTATTATGTTTT +>32522 +TACTTGACTTTTCTATAGAATCTGGT +>32540 +TATCGTCAACATCCTCGAACGATCGAGA +>32626 +TTGATCAAGGTAGGGTTGTCGC +>32646 +TCTGTTAAACACCCCTGAATCGTGGAT +>32657 +TTTGGACATTTTGCAGGTGATACAAT +>32682 +TAACTGTTTTTAGTTCAAAGTCTCGGA +>32716 +TATCTATAGTTCCGATTGGCCATCTC +>32885 +GAAAGTGGGTATCTGTATTTTAGGC +>32967 +TAAAGATACCATCTAACCTCCTTGGA +>33075 +ACAGATATTAGTGTTTTTCAAGCAGC +>33147 +ATCGCAATTATGGCATAACAGATTCGGA +>33163 +TTCAGCGTCGCTTGATTGAATAGAT +>33231 +TAAGAACTTCTGAGGTGAAGGGC +>33242 +TTGGGTTTAGAAATTAAAATTAAGGC +>33244 +TATAGAAAGTTACGAATATATTAGGA +>33248 +TTTTTGATCAATTGGCACCGTGCGAA +>33296 +TGCAGAGCTTCTTCCAACGTTGGCAAG +>33318 +TAGATGTCTGCAGGAATAACGGA +>33338 +TCGACTATTAATGGCTGTTAGAATT +>33475 +CAAACTTATCGACCATCTCCTCAAACG +>33601 +TTACCCTTTTTCCGGAGCGTTTGTGC +>33611 +AATGATCGCTGTGCTCAGTATGACGG +>33662 +TTTGATTCATTACAATTTACGCTGAA +>33737 +CAGATATTAGTGTTTTTCAAGCAGC +>33747 +TACATGTAAAGCAGCTGTGTGTGC +>33815 +AGTTTTTGGAATCACTTGA +>34032 +TGCGGACGTGTGCTCGCTGCGTGA +>34200 +TAATATATGTATAATCTGCTTGGTG +>34240 +TCTTTACGCCATATAAATCATTTCGA +>34259 +ACAAATCATAAATTTGATGGGACGA +>34268 +TCTTGTGGACTTCACTCTAG +>34297 +TAAGTAAATAGTCCCCGCCTTATTGAGG +>34337 +TGGATAATGAATGTTTTTGATTTGC +>34569 +TCTAGGTTCTTCTGAAATCGTGGGA +>34643 +TCGTGTAGACCGGATAAGATTTTTT +>34697 +TCTAATACTGTGAAAGGGTGGGG +>34808 +GTAGGATGTGCTCTGCGGTTTCCAC +>34892 +TCTGTCGCAGTTGTAGCTTGCAATA +>34896 +TGTAGTTGCCACTTATGCTGTCCA +>35151 +TAGCAATGTCCGTCTGTCCGTATGA +>35196 +TGTAAATGGTCAGCGAAAGCAAAGG +>35211 +CAGATATTAGTGTTTTTCAAGCAGCGG +>35246 +CCTCAGAGAACGTCAGACCGCG +>35272 +TGCAGAGCTTCTTCCAACGTTGG +>35273 +TCTGGTAGTAAGAAAAATGTAGCTT +>35286 +TATGTATGGATATGTATATTTATGGGT +>35317 +TTTTGGTTTGATCGTCAGGTGGTC +>35512 +GACGATAATAGTGAATTTTGGACA +>35566 +TTCGAATTCGCGCCATTTCACAATC +>35948 +TGGCCTGTATACGCTTTCTGTTG +>36009 +TTGCAAAAGTCATATCTTGAGG +>36059 +TAAGTTACTATGGATCCATAAGGGTA +>36100 +TGATATGGGACTTGTAGCTTTTTTAAA +>36121 +TGTCGTGGGCTGTGCGTTTGAGAA +>36235 +TGCTACCTTTAGCTGCAAGATTAACT +>36238 +CAGATATTAGTGTTTTTCAAGCAGCGG +>36523 +TGCGAGTCCGAGCTTTGAACGTGGG +>36607 +TCTCAATGTAATGTCTTCTTTTTGGA +>36624 +CGTTCTTTAAAACCACCAATGGGA +>36776 +TACTCACGACCATTGTCATTTCTCAAG +>36825 +CGTTCGAGGTCCACTTTCTTAGCGGA +>36850 +TCTGATGTCGGCGAGAAAGGAGTCTCA +>36872 +TCAAGGCCAGCACACAGTAACATGGT +>36968 +ACATTGGAAATACCGCGGGACCGC +>36994 +TATACGTTTTTTGACCTCTTCTCTTTGA +>37110 +TGATAATGTAAACAAAGATAAAGGG +>37210 +TCAGATGAAAGACAAATTAGAATTAAA +>37224 +GACGATAATAGTGAATTTTGGACA +>37226 +TCTGAAGTTGCCGCACTAGAGATGG +>37339 +TATACAGTCCACTATATCGTTGTTTAA +>37395 +TACAATTTACGCTGAATTTAAATGAA +>37460 +CACAAAGTAACGTGCACCACCATTT +>37766 +TCTGTGCAACTTTGTACGCGAAGTCAGC +>37836 +TCAAGGATTAATGTAGGGGGGGGG +>38096 +TTTGGAGGTAGAAGTCTTAGTGGCCGC +>38100 +GACAAAATATGCCCTTCAATTTAGA +>38113 +TATGGTCCAGAATGTAGCCTCGGC +>38213 +TAACTGTTTTTAGTTCAAAGTCTCGAA +>38224 +TTTCAGTTTTTATTGTTAGTCACAGG +>38263 +TAACTGCGAAGTCGATCAGGTCCGA +>38266 +ATCCGGACGATTGACGAGGAGCCCATT +>38271 +TTATGTCAGTGTCGAAGGCGATCGAA +>38373 +TCTATAGCCTTGGCGTAGGAACTCGCA +>38384 +GCTACAACTGCGACAGAAAATTCGGA +>38468 +TATTATCGTCCGCTGCTAAACTGC +>38491 +TGCATACTTCCGTTCTCTTTTCGGGA +>38673 +TTGTGTATTGTGATTCTGATTCGTG +>38745 +TCCCTGGCCCGCTAGACAGCAGGA +>38784 +TGTGCTAATAATTAAAGTCGACTGA +>38873 +TGTCATACTTTCGTCAAAA +>39154 +TAATAGTCAGGGCGCGAATTTTTAAAA +>39325 +TTAGGACTTATTGAACTTTACGGTA +>39359 +TATGCAAATCAAGTGTGACCGTAGCT +>39450 +TTAAACAACGATATAGTGGACAGTA +>39453 +TCTGCCGGATTTTGATCCAATCAAGG +>39819 +GTGGAATTGAAAAAGAACCAGACACA +>40040 +TTTTTGGAACTACCTGAGTCGGTT +>40183 +TAACACAAAGCAGTATGATTTAATAAT +>40189 +CAGCAAGCTGAGATGTACATTAGTATA +>40374 +TACGTTTTCTTGCAGATCAAAAA +>40445 +CGTTCTTTAAAACCACCAATGGGA +>40467 +TACGCAGATTCCTGGGAGTTACAGGA +>40488 +TGATTTGGGCTTGCATACTTGTACT +>40797 +TATATTCGTGTTCATGTGTGAACAGC +>40831 +TCTAAGAACTTCTGAGGTGAAGGGC +>40951 +TTCTTCGTAAGTCAAAATAGTGTCGCC +>40988 +TATGATTGATTGCTTGAGAGT +>40998 +TGATAGAGCTGCATTTGAATTAACGG +>41061 +CTCTTTCCGCTCACTCCCGCTGAGA +>41076 +TGCATTAAGAAGATTTAGGATCC +>41140 +TCAAGGATTAATGTAGGGGGGG +>41143 +CAATAGCGTCGCTGAGTAACAGTG +>41162 +TACGGATTGCAGCGGCTAG +>41183 +TTTTTTGGCACACGATTTTTTGGACGT +>41227 +TAATATATGTATACTCTGCTTGGTG +>41265 +TTTATGATTTTTGGTAATA +>41365 +TAGGAGGGTTCCACAACTATTTCGGGG +>41837 +TAGTTTGACACTGTTTGGAGACGTGG +>42053 +TCTGTGGTCGAATCGAAGGAGTGC +>42113 +TAATAGATCGCTCACCTGTTCCTGG +>42392 +CGGCATCGGAAAACTCCCAGCGGGGC +>42504 +TAACGTTATTATTATTTGAAAATAGAA +>42566 +TTTGTTGGGTAGGAACTTTACTGC +>42668 +TGCTGCAGAGCTTCTTCCAACGTTGG +>42751 +CCAAAGTCTGGTTGTCAGAAAATGTGC +>42777 +AAGGAAGGAACCAAAGAAGCACAAACG +>42804 +TAATTCTAATTTGTCTCTCATCTGA +>42830 +TAGTATACTTATTAAGTCATTTGA +>42857 +AGAGTATTCATCTTGAGGCGTGTG +>42886 +TGAACAACGATTTATGTATATAAGAA +>42899 +TACGATAATAGTGAATTTTGGACA +>42936 +TTTGACTAAAAGTCGCTTGTTTTGGA +>43050 +AATACATAACTCTGGACACAGGAGA +>43219 +TACTTTCGTCAAAATGTTCAGGAGCT +>43242 +TGACATGTCTATTTCCATGGGTTCGGA +>43268 +GTGTATAAAAAAATTTATTGTTGAGCA +>43299 +TCTGGATGATGGCTGATGCTCGTTG +>43491 +TCTGATGACAATGAATTTTTTAGACA +>43520 +TATTGTTGTAATTGCTGCCTCGGTTG +>43654 +ATATGAACAAAGCAAAGACACTAGAA +>43677 +CACGATTCATAACCCTCAGCTGAAG +>43776 +GCTCCTGGCAACTCTGTGATGGAC +>43903 +TATTTTGATGTTTAATGAA +>43990 +TTTCTACTTCGTATTATTTTTATGA +>44062 +AAACATAATAATTGATGGCGGAAGA +>44071 +CACAGACGCAGTGGAAACCGCAGA +>44078 +CGTGCGTCCGAGCAAAAGGTGGT +>44187 +TTATGTAAGAATATTTGTCATTAGA +>44239 +TATCAATGTTGACCGTAATACTCAA +>44253 +TGGATATTGAATGTTTTTGATTTGC +>44279 +TGTGATTTTCCCAATTTATATTAATACA +>44374 +TAGTCGGAGTTGATGAGCTGCC +>44412 +TCCGAATTTTCTGTCGCAGTTGTAGCT +>44423 +TCGGCTTGGGTTTAGAAATTAAAAT +>44558 +ACAAATCATAAATTTGGTGGGA +>44637 +TTTTTTATCAATTGGCACCATGCGAA +>44642 +TACTGTGTGCTGGCCTTGATGAAAGT +>44688 +TAGATGTCTGCACGAATAACGGA +>44945 +TGCTTCCGAGCAATCTACGTTGGTAAAA +>45054 +TCTCATCTGACAATTTTTTAAAAGCGA +>45088 +TCTGAAGCAGCGCTCACGGCAGAATGC +>45203 +TGCCGGATTTTGATCCAATCAAGGGA +>45263 +TATTGATTTTCCTATTTAGTTGAACA +>45274 +AAAAGTCTGGATATTGTAGGATAGGA +>45358 +CAACGCTGGACCTTGGACTCGAGGGC +>45396 +CATCTTGTTATTCTAGTGTCTTTGGTA +>45641 +GAACTAAGATCAGTCGACTGTAATTAT +>45774 +CGACGAACTAGCAGCTCTGGTGT +>45911 +CAGATATTAGTGTTTTTCAAGCAGC +>45997 +TTAACCAGTCGGCGTTGTTTAAGTAGC +>46031 +AAAGCGTCTACTTGAACAATGAGA +>46054 +TTAGATCGTATTACTTGGGTGCTGG +>46199 +TAAGCGTTAGGTCGTATTACTTGGGC +>46255 +TAAGATTGAAAATTACTGTGGAGTAAT +>46366 +TAAGGAATTGTCGGCCATTTAATGTGA +>46387 +CAGAGCTTCTTCCAACGTTGGCAAG +>46701 +TTGTATCTTTTTGCTTTTTATATT +>46705 +TAACTGTTTTTAGTTCAAAGTCTCGGA +>46783 +TCTCATCTGACAATTTTTTAAAAGCGA +>46836 +TCATAAGGACAGACGGACAT +>46892 +AAACATAATAATTGATGGCGGAAGA +>47244 +TCTCTGTCCGCTCGCTTACGATGAGA +>47290 +TTTCAGGAATGGGGTCGTCCCACTA +>47348 +TGCAAAAGTAATATCAAAGACACTA +>47359 +TTTAAAATTATAATAGTCAGGG +>47427 +CATCTTGTTATTCTAGTGTCTTTGGT +>47654 +TTAAACACTGAATTCGGTTTCGAAA +>47656 +TTTCTGAAGAATCCTGTAACTCCC +>47785 +TGTAGATGAGCGGCAAATGTGG +>47827 +TTGATCAAGGTAGAGTTGTCGCGC +>48184 +TTCAAGGATTAATGTAGGGGGGG +>48576 +TTAACCCGGAGACTTGGGTGTGGGT +>48764 +TGCAAAAGTAATATCAAAGACAATAGA +>48782 +TGACAATGTAGTGAACGCCAGTGT +>48893 +TATAAATGCCGTCTGATATTATTAAA +>49017 +ACCGGATGTCATATCCAGCGTCGTGAA +>49381 +TACAATGTAAATTCGTTTCTTCGATCA +>49456 +TTTTGGTTTGATCGTCAGGTGGACGC +>49484 +TCTGCTATCATTGACTCGATCATTGA +>49569 +TCGATTGTATGATCAGTGGAAGTGGC +>49602 +GAAATTGGCCAACATTAATTCGGAA +>49628 +TACTTTCGTCAAAATGTTCAGGAGC +>49715 +TTTGTCCGGGTGCTTCGAAAGAACTCT +>49778 +CAATAGCGTCGCTGAGTAACAGTG