Mercurial > repos > iuc > proteinortho_summary
changeset 5:de26b312c0d2 draft
planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit b4d8b8da2a259973c9ad90e4b9d1a3e22ae4348f
author | iuc |
---|---|
date | Fri, 16 Jun 2023 20:52:56 +0000 |
parents | 9b67a50799e9 |
children | 2bb8251d132c |
files | proteinortho_macros.xml proteinortho_summary.xml |
diffstat | 2 files changed, 23 insertions(+), 11 deletions(-) [+] |
line wrap: on
line diff
--- a/proteinortho_macros.xml Tue Nov 22 16:50:38 2022 +0000 +++ b/proteinortho_macros.xml Fri Jun 16 20:52:56 2023 +0000 @@ -1,6 +1,6 @@ <?xml version="1.0"?> <macros> - <token name="@TOOL_VERSION@">6.1.2</token> + <token name="@TOOL_VERSION@">6.2.3</token> <token name="@WRAPPER_VERSION@">1</token> <token name="@PROFILE@">20.09</token> <xml name="citations"> @@ -12,12 +12,10 @@ <xml name="requirements"> <requirements> <requirement type="package" version="@TOOL_VERSION@">proteinortho</requirement> - <!-- blast, blat, and last are not in the biopython requirements - diamond is, but latest version does not work: https://gitlab.com/paulklemm_PHD/proteinortho/-/issues/55 --> - <requirement type="package" version="2.0.15">diamond</requirement> + <requirement type="package" version="2.1.4">diamond</requirement> <requirement type="package" version="2.13.0">blast</requirement> <requirement type="package" version="377">ucsc-blat</requirement> - <requirement type="package" version="1418">last</requirement> + <requirement type="package" version="1422">last</requirement> </requirements> </xml> <xml name="version_command">
--- a/proteinortho_summary.xml Tue Nov 22 16:50:38 2022 +0000 +++ b/proteinortho_summary.xml Fri Jun 16 20:52:56 2023 +0000 @@ -7,9 +7,6 @@ <expand macro="version_command"/> <command detect_errors="exit_code"><![CDATA[ export TERM=dumb && - ## TODOs: - ## - check if 2>&1 can be removed https://gitlab.com/paulklemm_PHD/proteinortho/-/merge_requests/9 - ## - include output0.tsv as Galaxy output? proteinortho_summary.pl $queryfile #if $queryfile2: @@ -19,6 +16,7 @@ | awk '/^$/ && !f{f=1;next}1' ## remove potentially present 1st empty line | awk 'BEGIN{i=0} /^$/{i+=1}{print > ("output" i ".tsv")}' ## split file at empty lines && + mv output0.tsv '$distribution' && mv output1.tsv '$adjacencyMat' && mv output2.tsv '$average1paths' && mv output3.tsv '$adjacencyMatSquared' && @@ -29,14 +27,20 @@ <param name="queryfile2" type="data" format="tabular" optional="true" label="(optional) A second orthology-pairs / RBH file" help="If you provide a second file, then difference is calculated (GRAPH - second GRAPH)"/> </inputs> <outputs> + <data name="distribution" format="tabular" label="${tool.name} on ${on_string}: Protein-Group distribution"/> <data name="adjacencyMat" format="tabular" label="${tool.name} on ${on_string}: Adjacency Matrix"/> <data name="average1paths" format="tabular" label="${tool.name} on ${on_string}: Average number of Edges"/> <data name="adjacencyMatSquared" format="tabular" label="${tool.name} on ${on_string}: Matrix of 2-paths"/> <data name="average2paths" format="tabular" label="${tool.name} on ${on_string}: Average number of 2-paths"/> </outputs> <tests> - <test expect_num_outputs="4"> + <test expect_num_outputs="5"> <param name="queryfile" value="result.proteinortho-graph"/> + <output name="distribution"> + <assert_contents> + <has_text text="%"/> + </assert_contents> + </output> <output name="adjacencyMat"> <assert_contents> <has_text text="18"/> @@ -66,7 +70,7 @@ </assert_contents> </output> </test> - <test expect_num_outputs="4"> + <test expect_num_outputs="5"> <param name="queryfile" value="result.proteinortho-graph"/> <param name="queryfile2" value="result.blast-graph"/> <output name="average2paths"> @@ -77,6 +81,15 @@ </assert_contents> </output> </test> + <test expect_num_outputs="5"> + <param name="queryfile" value="result.blast-graph"/> + <output name="average2paths"> + <assert_contents> + <has_text text="115.2"/> + <has_text text="TERM" negate="true"/> + </assert_contents> + </output> + </test> </tests> <help><![CDATA[proteinortho summary @@ -84,6 +97,8 @@ proteinortho_summary : Summaries the (orthology-pairs/RBH) file(s) to determine how well the species are connected to each other. + * **Protein-Group distribution** (for orthology-pairs) : This report contains overal statistics about the output. (i) Number of groups that contains at least p% input species (with p ranging between 0 and 100). (ii) number of groups for each input species. + * **Adjacency Matrix** : How well are the species connected to each other directly. * **Average number of Edges** : Averaged number of connections for each species. @@ -92,7 +107,6 @@ * **Average number of 2-paths** : The average number of 2-paths for each species. If a species is not well connected to all the other species, it will result in a low average. - If you supply a second orthology-pairs/RBH then the difference is calculated for all 4 outputs. E.g. given the RBH and the orthology-pairs of the same run : The outputs show how much the clustering removed from the initial reciprocal best hit graph.