Next changeset 1:7a84c6c1c4e0 (2017-11-12) |
Commit message:
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/rna_tools/rnacode commit 3f891a4e86b4b127815dc72a4292c232cda79293 |
added:
rnacode.xml test-data/coding.aln test-data/coding.maf test-data/rnacode_result1.tabular test-data/rnacode_result2.gtf tool_dependencies.xml |
b |
diff -r 000000000000 -r 2c51e264432a rnacode.xml --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/rnacode.xml Fri Jun 19 11:13:11 2015 -0400 |
[ |
b'@@ -0,0 +1,190 @@\n+<tool id="rbc_rnacode" name="RNAcode" version="0.3.0">\n+ <description>Analyze the protein coding potential in MSA</description>\n+ <requirements>\n+ <requirement type="package" version="0.3">rnacode</requirement>\n+ </requirements>\n+ <stdio>\n+ <exit_code range="1:" level="fatal" description="Error occurred. Please check Tool Standard Error"/>\n+ <exit_code range=":-1" level="fatal" description="Error occurred. Please check Tool Standard Error"/>\n+ </stdio>\n+ <version_command>RNAcode --version</version_command>\n+ <command>\n+ <![CDATA[\n+ RNAcode\n+ \n+ $outputFormat\n+ \n+ #if $cutoff and $cutoff is not None\n+ --cutoff $cutoff\n+ #end if\n+ \n+ #if $num_samples and $num_samples is not None\n+ --num-samples $num_samples\n+ #end if\n+ \n+ $stop_early\n+ $best_region\n+ $best_only\n+ \n+ #if $cond_generateEPS.generateEPS == \'create\'\n+ --eps\n+ #if $cond_generateEPS.eps_cutoff and $cond_generateEPS.eps_cutoff is not None\n+ --eps-cutoff $cond_generateEPS.eps_cutoff\n+ #end if\n+ #end if\n+ \n+ #if $cond_scoringParameters.scoringParameters == \'custom\'\n+ --pars "$pars"\n+ #end if\n+ \n+ $alignment\n+ \n+ #if $outputFormat.value == \'--tabular\'\n+ --outfile $outFileDefault\n+ #elif $outputFormat.value == \'--gtf\'\n+ --outfile $outFileGTF\n+ #end if\n+ \n+ ]]>\n+ </command>\n+ <inputs>\n+ <param name="alignment" type="data" format="clustal,maf" label="Multiple Alignment" help="Alignment needs to be formatted in ClustalW or MAF format"/>\n+ <param argument="--cutoff" name="cutoff" type="float" optional="true" value="1.0" label="Cutoff" help="Show only regions that have a p-value below the given number. By default all hits are shown."/>\n+ <param argument="--num_samples" name="num_samples" type="integer" optional="true" value="100" label="Number of samples" help="Number of random alignments that are sampled to calculate the p-value. RNAcode estimates the significance of a coding prediction by sampling a given number of random alignments. 
Default is 100 which gives reasonably stable p-values that are useful for assessing the relevance of a prediction."/>\n+ <param argument="--stop_early" name="stop_early" type="boolean" truevalue="--stop-early" falsevalue="" checked="false" label="Stop early" help="Setting this option stops the sampling process as soon as it is clear that the best hit will not fall below the given p-value cutoff. For example, assume a p-value cutoff of 0.05 (see --cutoff) and a sample size of 1000 is given (see --num-samples). As soon as 50 random samples score better than the original alignment, the process is stopped and all hits in the original alignment are reported as p>0.05 (or by convention as 1.0 in gtf and tabular output)."/>\n+ <param argument="--best_region" name="best_region" type="boolean" truevalue="--best-region" falsevalue="" checked="false" label="Show only best non-overlapping hits" help="By default all positive scoring segments are shown in the output if they fall below the given p-value cutoff. If two hits overlap (different frame or different strand) and --best_region is given only the hit with the highest score is shown. Strong coding regions often lead to statistically significant signals also in other frames. 
These hits are suppressed by this option and only the correct reading frame is reported."/>\n+ <param argument="--best_only" name="best_only" type="boolean" truevalue="--best-only" falsevalue="" checked="false" label="Show only best hit" help="This options shows only the one single best hit for each alignment."/>\n+ <conditional name="cond_scoringParameters">\n+ <param name="scoringParameters" type="select" label="Scoring paramet'..b' <output name="outFileDefault" ftype="tabular" file="rnacode_result1.tabular" compare="sim_size"/>\n+ <!-- sim_size is needed due to rnacode using random sampling: result files differ, better tests should be implemented -->\n+ </test>\n+ <test>\n+ <param name="alignment" value="coding.maf"/>\n+ <param name="generateEPS" value="nocreate"/>\n+ <param name="outputFormat" value="--gtf"/>\n+ <output name="outFileGTF" ftype="gtf" file="rnacode_result2.gtf" compare="sim_size"/>\n+ <!-- sim_size is needed due to rnacode using random sampling: result files differ, better tests should be implemented -->\n+ </test>\n+ </tests>\n+ <help>\n+<![CDATA[\n+**RNAcode** \n+Predicts protein coding regions in an alignment of homologous\n+nucleotide sequences. The prediction is based on evolutionary\n+signatures typical for protein genes, i.e. the presence of\n+synonymous/conservative nucleotide mutations, conservation of the\n+reading frame and absence of stop codons.\n+\n+RNAcode does not rely on any species specific sequence characteristics\n+whatsoever and does not use any machine learning techniques. The only\n+input required for RNAcode is a multiple sequence alignment either in\n+MAF or Clustal W format. RNAcode reports local regions of unusually high\n+coding potential together with an associated p-value.\n+\n+**Input alignment**\n+\n+The input alignment needs to be formatted in ClustalW format or MAF\n+format (http://genome.ucsc.edu/FAQ/FAQformat#format5). 
The latter\n+format allows genomic coordinates to be included, which can be used to\n+produce annotation files. \n+\n+Important: RNAcode uses the first sequence as reference sequence,\n+i.e. all results and reported coding regions apply to this reference\n+sequence.\n+\n+Currently the alignment has to contain at least 3 sequences. Gaps\n+have to be given as dashes (\'-\'). Unspecified letters given as \'N\' are\n+allowed and treated neutrally during all calculations. No difference is\n+made between uppercase or lowercase input, i.e. \'softly\'-repeat masked\n+sequences which use lowercase letters for masked regions are treated\n+the same way as unmasked sequences.\n+\n+**Output format**\n+\n+In the default output each prediction is reported on one line by 10 fields.\n+\n+1. HSS id \n+ Unique running number for each high scoring segment\n+ predicted in one RNAcode call\n+\n+2. Frame \n+ The reading frame phasing relative to the starting\n+ nucleotide position in the reference sequence. +1 means\n+ that the first nucleotide in the reference sequence is in\n+ the same frame as the predicted coding region. Negative\n+ frames indicate that the predicted regions are on the\n+ reverse complement strand.\n+\n+3. Length \n+ The length of the predicted region in amino acids\n+\n+4. From 5. To \n+ The position of the first/last amino acid in the translated\n+ nucleotide sequence of the reference sequence starting\n+ with 1.\n+\n+6. Name \n+ The name of the reference sequence as given in the input alignment.\n+ \n+7. Start 8. End \n+ The nucleotide position in the reference sequence of the\n+ predicted coding region. If no genomic coordinates are given\n+ (if you provide a CLUSTAL W file as input) the first nucleotide position in\n+ the reference sequence is set to 1, otherwise the positions are the\n+ 1-based genomic coordinates as given in the input MAF file.\n+\n+9. Score \n+ The coding potential score. High scores indicate high coding potential. \n+\n+10. 
P \n+ The p-value associated with the score. This is the probability\n+ that a random alignment with same properties contains an equally good\n+ or better hit.\n+]]>\n+ </help>\n+ <citations>\n+ <citation type="doi">10.1261/rna.2536111</citation>\n+ </citations>\n+</tool>\n' |
b |
diff -r 000000000000 -r 2c51e264432a test-data/coding.aln --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/coding.aln Fri Jun 19 11:13:11 2015 -0400 |
b |
@@ -0,0 +1,33 @@ +CLUSTAL W(1.81) multiple sequence alignment + + +ec_K12.chr_fwd/3401506-3401703 TGCAGGCGTTACTTTTAGAACAGCAGGACGGCAAAACTCTCGCATCAGTACA--GACTCT +ec_O157H7.chr_fwd/4138444-4138641 TGCAGGCGTTACTTTTAGAACAGCAGGACGGCAAAACTCTCGCATCAGTACA--GACTCT +ec_APEC_O1.chr_fwd/3685781-3685978 TGCAGGCGTTACTTTTAGAACAGCAGGACGGCAAAACTCTCGCATCAGTACA--GACTCT +ente638.chr_fwd/4000173-4000370 TGCAGGCATTGATCTTAGAACAACAAGACGGCAAAACCCTGGCTTCGGTTCA--ATCCAT +shigFlex_2A.chr_fwd/3391056-3391253 TGCAGGCGTTACTTTTAGAACAGCAGGACGGCAAAACTCTCGCATCAGTACA--GACTCT +salmTyph.chr_fwd/3400613-3400810 TGCAGGCGTTGATCTTAGAACAGCAGGACGGTAAAACCCTCGCATCCGTGCA--ACATCT +salmEnte_PARATYPI_ATC.chr_fwd/3353535-3353732 TGCAGGCGTTGATCTTAGAACAGCAGGACGGTAAAACCCTCGCATCCGTGCA--ACATCT +yersPest_CO92.chr_rev/569086-569283 TGCGAGCACTGATACTTGAGCAAATTGAAGGGCGTACCACCGCAGAAGTACGTCAAATTT + + +ec_K12.chr_fwd/3401506-3401703 GGACGAAAGTCGCCTGCCGGAGGGCGATGTCACGGTCGATGTTCACTGGTCGAGCCTGAA +ec_O157H7.chr_fwd/4138444-4138641 GGACGAAAGTCGCCTGCCGGAGGGCGATGTCACGGTCGATGTTCACTGGTCGAGCCTGAA +ec_APEC_O1.chr_fwd/3685781-3685978 GGACGAAAGTCGCCAGCCGGAAGGCGATGTCACGGTTGATGTTCACTGGTCGAGCCTGAA +ente638.chr_fwd/4000173-4000370 CGAGGCTACCCGCCTGCCCGAAGGCGACGTCACCGTTGACATTGACTGGTCCAGCCTGAA +shigFlex_2A.chr_fwd/3391056-3391253 GGACGAACGTCGCCTGCCGGAGGGCGATGTCACGGTCGATGTTCACTGGTCGAGCCTGAA +salmTyph.chr_fwd/3400613-3400810 CGAAGAGAGTCAACTGCCGGCAGGTGATGTGACGGTGGATGTCCACTGGTCCAGCCTGAA +salmEnte_PARATYPI_ATC.chr_fwd/3353535-3353732 CGAAGAGAGTCAACTGCCGGCAGGTGATGTGACGGTGGATGTCCACTGGTCCAGCCTGAA +yersPest_CO92.chr_rev/569086-569283 CGGCCTCA--CAACTGCCTGCGGGTAATGTCACCGTAGATGTCAATTGGTCCAGCCTGAA + + +ec_K12.chr_fwd/3401506-3401703 CTATAAAGATGCGCTGG +ec_O157H7.chr_fwd/4138444-4138641 CTATAAAGATGCGCTGG +ec_APEC_O1.chr_fwd/3685781-3685978 CTACAAAGATGCGCTGG +ente638.chr_fwd/4000173-4000370 TTACAAGGACGCGCTCG +shigFlex_2A.chr_fwd/3391056-3391253 CTATAAAGATGCGCTGG +salmTyph.chr_fwd/3400613-3400810 TTATAAAGATGCTCTGG +salmEnte_PARATYPI_ATC.chr_fwd/3353535-3353732 
TTATAAAGATGCTCTGG +yersPest_CO92.chr_rev/569086-569283 TTATAAAGATGCGTTGG + + |
b |
diff -r 000000000000 -r 2c51e264432a test-data/coding.maf --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/coding.maf Fri Jun 19 11:13:11 2015 -0400 |
b |
@@ -0,0 +1,10 @@ +a score=0 +s ec_K12.chr 3401506 198 + 0 TGCAGGCGTTACTTTTAGAACAGCAGGACGGCAAAACTCTCGCATCAGTACA--GACTCTGGACGAAAGTCGCCTGCCGGAGGGCGATGTCACGGTCGATGTTCACTGGTCGAGCCTGAACTATAAAGATGCGCTGG +s ec_O157H7.chr 4138444 198 + 0 TGCAGGCGTTACTTTTAGAACAGCAGGACGGCAAAACTCTCGCATCAGTACA--GACTCTGGACGAAAGTCGCCTGCCGGAGGGCGATGTCACGGTCGATGTTCACTGGTCGAGCCTGAACTATAAAGATGCGCTGG +s ec_APEC_O1.chr 3685781 198 + 0 TGCAGGCGTTACTTTTAGAACAGCAGGACGGCAAAACTCTCGCATCAGTACA--GACTCTGGACGAAAGTCGCCAGCCGGAAGGCGATGTCACGGTTGATGTTCACTGGTCGAGCCTGAACTACAAAGATGCGCTGG +s ente638.chr 4000173 198 + 0 TGCAGGCATTGATCTTAGAACAACAAGACGGCAAAACCCTGGCTTCGGTTCA--ATCCATCGAGGCTACCCGCCTGCCCGAAGGCGACGTCACCGTTGACATTGACTGGTCCAGCCTGAATTACAAGGACGCGCTCG +s shigFlex_2A.chr 3391056 198 + 0 TGCAGGCGTTACTTTTAGAACAGCAGGACGGCAAAACTCTCGCATCAGTACA--GACTCTGGACGAACGTCGCCTGCCGGAGGGCGATGTCACGGTCGATGTTCACTGGTCGAGCCTGAACTATAAAGATGCGCTGG +s salmTyph.chr 3400613 198 + 0 TGCAGGCGTTGATCTTAGAACAGCAGGACGGTAAAACCCTCGCATCCGTGCA--ACATCTCGAAGAGAGTCAACTGCCGGCAGGTGATGTGACGGTGGATGTCCACTGGTCCAGCCTGAATTATAAAGATGCTCTGG +s salmEnte_PARATYPI_ATC.chr 3353535 198 + 0 TGCAGGCGTTGATCTTAGAACAGCAGGACGGTAAAACCCTCGCATCCGTGCA--ACATCTCGAAGAGAGTCAACTGCCGGCAGGTGATGTGACGGTGGATGTCCACTGGTCCAGCCTGAATTATAAAGATGCTCTGG +s yersPest_CO92.chr 569086 198 - 0 TGCGAGCACTGATACTTGAGCAAATTGAAGGGCGTACCACCGCAGAAGTACGTCAAATTTCGGCCTCA--CAACTGCCTGCGGGTAATGTCACCGTAGATGTCAATTGGTCCAGCCTGAATTATAAAGATGCGTTGG + |
b |
diff -r 000000000000 -r 2c51e264432a test-data/rnacode_result1.tabular --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/rnacode_result1.tabular Fri Jun 19 11:13:11 2015 -0400 |
b |
@@ -0,0 +1,7 @@ +0 + 3 44 1 44 ec_K12.chr_fwd/3401506-3401703 3 134 39.108 2.206e-08 +1 - 3 32 12 43 ec_K12.chr_fwd/3401506-3401703 36 131 19.782 7.086e-04 +2 + 2 6 35 40 ec_K12.chr_fwd/3401506-3401703 104 121 2.738 0.999 +3 - 2 13 1 13 ec_K12.chr_fwd/3401506-3401703 2 40 2.426 1.000 +4 - 3 5 6 10 ec_K12.chr_fwd/3401506-3401703 18 32 2.319 1.000 +5 - 3 3 2 4 ec_K12.chr_fwd/3401506-3401703 6 14 1.736 1.000 +6 - 2 3 26 28 ec_K12.chr_fwd/3401506-3401703 77 85 1.344 1.000 |
b |
diff -r 000000000000 -r 2c51e264432a test-data/rnacode_result2.gtf --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/rnacode_result2.gtf Fri Jun 19 11:13:11 2015 -0400 |
b |
@@ -0,0 +1,7 @@ +chr RNAcode CDS 3401509 3401640 39.11|5.98e-10 + . gene_id "Gene0"; transcript_id "transcript 0"; +chr RNAcode CDS 3401574 3401669 19.78|1.33e-04 - . gene_id "Gene1"; transcript_id "transcript 0"; +chr RNAcode CDS 3401610 3401627 2.74|9.99e-01 + . gene_id "Gene2"; transcript_id "transcript 0"; +chr RNAcode CDS 3401665 3401703 2.43|1.00e+00 - . gene_id "Gene3"; transcript_id "transcript 0"; +chr RNAcode CDS 3401673 3401687 2.32|1.00e+00 - . gene_id "Gene4"; transcript_id "transcript 0"; +chr RNAcode CDS 3401691 3401699 1.74|1.00e+00 - . gene_id "Gene5"; transcript_id "transcript 0"; +chr RNAcode CDS 3401620 3401628 1.34|1.00e+00 - . gene_id "Gene6"; transcript_id "transcript 0"; |
b |
diff -r 000000000000 -r 2c51e264432a tool_dependencies.xml --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/tool_dependencies.xml Fri Jun 19 11:13:11 2015 -0400 |
b |
@@ -0,0 +1,17 @@ +<?xml version="1.0"?> +<tool_dependency> + <package name="rnacode" version="0.3"> + <install version="1.0"> + <actions> + <action type="download_by_url">https://raw.githubusercontent.com/bgruening/download_store/master/RNAcode/RNAcode-0.3.tar.gz</action> + <action type="autoconf"/> + <action type="set_environment"> + <environment_variable name="PATH" action="prepend_to">$INSTALL_DIR/bin</environment_variable> + <environment_variable name="RNACODE_ROOT_PATH" action="set_to">$INSTALL_DIR</environment_variable> + </action> + </actions> + </install> + <readme> + </readme> + </package> +</tool_dependency> |