Mercurial > repos > rnateam > graphclust_mlocarna
diff locarna_best_subtree.xml @ 0:15bd4fb05e5c draft
planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust/LocARNAGraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
author | rnateam |
---|---|
date | Fri, 16 Dec 2016 07:35:29 -0500 |
parents | |
children | c6c4a7adb099 |
line wrap: on
line diff
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/locarna_best_subtree.xml Fri Dec 16 07:35:29 2016 -0500 @@ -0,0 +1,190 @@ +<tool id="locarna_best_subtree" name="locarna_best_subtree" version="0.1.0" > + <requirements> + <requirement type="package" version="0.1">graphclust-wrappers</requirement> + <requirement type="package" version='1.8.10'>locarna</requirement> + <requirement type="package" version='2.1'>rnaz</requirement> + <requirement type="package" version='0.07'>perl-math-round</requirement> + </requirements> + <stdio> + <exit_code range="1:" /> + </stdio> + <command> + <![CDATA[ + + 'locARNAGraphClust.pl' '$center_fa_file' '$tree_file' '$tree_matrix' $p $max_diff_am $tau $max_diff '' '$data_map' $plfold_minlen + ]]> + </command> + <inputs> + <param type="data" name="center_fa_file" label="centers" format="fa, fasta" help="fasta format" /> + <param type="data" name="tree_file" label="trees" format="text" help="text format" /> + <param type="data" name="tree_matrix" label="tree_matrix" format="text" help="text format" /> + <param type="data" name="data_map" label="data_map" format="txt" help="text format" /> + <param name="p" type="float" value="0.001" size="5" label="minimal probability" help="-p"/> + <param name="max_diff_am" type="integer" value="50" size="5" label=" maximal difference for sizes of matched arcs" help="--max-diff-am"/> + <param name="tau" type="integer" value="50" size="5" label="Tau factor in percent" help="--tau"/> + <param name="max_diff" type="integer" value="100" size="5" label="maximal difference for alignment traces" help="--max-diff"/> + <param name="plfold_minlen" type="integer" value="210" size="5" label="Minimal length of a sequences for which RNAplfold is used" /> + </inputs> + <outputs> + + <data name="model_tree_stk" format="stockholm" label="model.tree.stk" from_work_dir="MODEL/best_subtree.aln" /> + </outputs> + <tests> + <test> + <param name="tree_file" value="1.1.tree"/> + <param name="center_fa_file" value="1.1.center.fa"/> + <param name="data_map" value="data.map"/> + <param name="tree_matrix" value="1.1.matrix.tree"/> + <param name="p" value="0.001"/> + <param name="max-diff-am" value="50"/> + <param name="tau" value="50"/> + <param name="max-diff-am" value="100"/> + <output name="model_tree_stk" file="best_subtree.aln"/> + </test> + </tests> + <help> + <![CDATA[ +**What it does** + +MLocARNA computes a multiple sequence-structure alignment of RNA sequences. +It uses *treefile* - file with guide tree in NEWICK format. The given tree is used as guide tree for the progressive alignment. +This saves the calculation of pairwise all-vs-all similarities and construction of the guide tree. + + + +]]> + </help> + <citations> + <citation type="bibtex">@inproceedings{costa2010fast, + title={Fast neighborhood subgraph pairwise distance kernel}, + author={Costa, Fabrizio and De Grave, Kurt}, + booktitle={Proceedings of the 26th International Conference on Machine Learning}, + pages={255--262}, + year={2010}, + organization={Omnipress} + } + </citation> + <citation type="bibtex">@Article{Will_Joshi_Hofacker-LocAR_Accur_bound-2012, + author = {Will, Sebastian and Joshi, Tejal and Hofacker, Ivo L. and + Stadler, Peter F. and Backofen, Rolf}, + title = {{LocARNA}-{P}: {Accurate} boundary prediction and improved + detection of structural {RNAs}}, + journal = {RNA}, + year = {2012}, + volume = {18}, + number = {5}, + pages = {900-14}, + user = {will}, + pmid = {22450757}, + doi = {10.1261/rna.029041.111}, + issn = {1469-9001}, + issn = {1355-8382}, + abstract = {Current genomic screens for noncoding RNAs (ncRNAs) predict + a large number of genomic regions containing potential + structural ncRNAs. The analysis of these data requires + highly accurate prediction of ncRNA boundaries and + discrimination of promising candidate ncRNAs from weak + predictions. Existing methods struggle with these goals + because they rely on sequence-based multiple sequence + alignments, which regularly misalign RNA structure and + therefore do not support identification of structural + similarities. To overcome this limitation, we compute + columnwise and global reliabilities of alignments based on + sequence and structure similarity; we refer to these + structure-based alignment reliabilities as STARs. The + columnwise STARs of alignments, or STAR profiles, provide a + versatile tool for the manual and automatic analysis of + ncRNAs. In particular, we improve the boundary prediction of + the widely used ncRNA gene finder RNAz by a factor of 3 from + a median deviation of 47 to 13 nt. Post-processing RNAz + predictions, LocARNA-P's STAR score allows much stronger + discrimination between true- and false-positive predictions + than RNAz's own evaluation. The improved accuracy, in this + scenario increased from AUC 0.71 to AUC 0.87, significantly + reduces the cost of successive analysis steps. The + ready-to-use software tool LocARNA-P produces + structure-based multiple RNA alignments with associated + columnwise STARs and predicts ncRNA boundaries. We provide + additional results, a web server for LocARNA/LocARNA-P, and + the software package, including documentation and a pipeline + for refining screens for structural ncRNA, at + http://www.bioinf.uni-freiburg.de/Supplements/LocARNA-P/.} +} + </citation> + <citation type="bibtex">@Article{Will:etal:_infer_non_codin_rna_famil:PLOS2007, + author = {Sebastian Will and Kristin Reiche and Ivo L. Hofacker and + Peter F. Stadler and Rolf Backofen}, + title = {Inferring Non-Coding {RNA} Families and Classes by Means of + Genome-Scale Structure-Based Clustering}, + journal = {PLoS Comput Biol}, + year = 2007, + volume = {3}, + number = {4}, + pages = {e65}, + issn = {1553-7358}, + issn = {1553-734X}, + pmid = {17432929}, + doi = {10.1371/journal.pcbi.0030065}, + user = {will}, + abstract = {The RFAM database defines families of ncRNAs by means of + sequence similarities that are sufficientto establish + homology. In some cases, such as microRNAs, box H/ACA + snoRNAs, functional commonalities define classes of RNAs + that are characterized by structural similarities, and + typically consist ofmultiple RNA families. Recent advances + in high-throughput transcriptomics and comparative genomics + have produced very large sets of putative non-coding RNAs + and regulatory RNA signals. For many ofthem, evidence for + stabilizing selection acting on their secondary structures + has been derived, and at least approximate models of their + structures have been computed. The overwhelming majority of + these hypo-thetical RNAs cannot be assigned to established + families or classes. We present here a structure-based + clustering approach that is capable of extracting putative + RNA classesfrom genome-wide surveys for structured RNAs. The + LocARNA tool implements a novel variant of theSankoff + algorithm that is sufficiently fast to deal with several + thousand candidate sequences. The method is also robust + against false positive predictions, i.e., a contamination of + the input data with unstructured ornon-conserved + sequences. We have successfully tested the LocARNA-based + clustering approach on the sequences of the + RFAM-seedalignments. Furthermore, we have applied it to a + previously published set of 3332 predicted structured + elements in the Ciona intestinalis genomes (Missal et al., + Bioinformatics 21(S2), i77-i78). In addition torecovering + e.g. tRNAs as a structure-based class, the method identifies + several RNA families, including microRNA and snoRNA + candidates, and suggests several novel classes of ncRNAs for + which to-date norepresentative has been experimentally + characterized.} +} + + </citation> + <citation type="bibtex">@Article{Smith:Heyne:Richter:Freib_RNA_Tools:NAR2010, + author = {Smith, Cameron and Heyne, Steffen and Richter, Andreas S. + and Will, Sebastian and Backofen, Rolf}, + title = {Freiburg {RNA} {Tools}: a web server integrating {IntaRNA}, + {ExpaRNA} and {LocARNA}}, + journal = NAR, + year = {2010}, + volume = {38 Suppl}, + number = {}, + pages = {W373-7}, + user = {arichter}, + pmid = {20444875}, + doi = {10.1093/nar/gkq316}, + issn = {0305-1048}, + issn = {1362-4962}, + abstract = {The Freiburg RNA tools web server integrates three tools + for the advanced analysis of RNA in a common web-based user + interface. The tools IntaRNA, ExpaRNA and LocARNA support + the prediction of RNA-RNA interaction, exact RNA matching + and alignment of RNA, respectively. The Freiburg RNA tools + web server and the software packages of the stand-alone + tools are freely accessible at + http://rna.informatik.uni-freiburg.de.} +} + </citation> + </citations> +</tool>