Mercurial > repos > rnateam > graphclust_postprocessing
comparison glob_report.xml @ 0:b797e13169a0 draft
planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust/CollectResults commit 21aaee40723b5341b4236edeb0e72995c2054053
author | rnateam |
---|---|
date | Fri, 16 Dec 2016 07:34:49 -0500 |
parents | |
children | b8e32e577597 |
comparison
equal
deleted
inserted
replaced
-1:000000000000 | 0:b797e13169a0 |
---|---|
<tool id="glob_report" name="Report_Results" version="0.1">
    <!--
      Galaxy tool wrapper for the GraphClust result-reporting step.
      The command unpacks the FASTA archive into the job working directory,
      calls glob_res.pl with the cmsearch result tables, the model tree files
      and the thresholds defined under <inputs>, and then runs evaluation.py
      from the tool directory. Outputs are collected from the RESULTS directory.
    -->
    <requirements>
        <requirement type="package" version="0.1">graphclust-wrappers</requirement>
        <requirement type="package" version="0.5">perl-array-utils</requirement>
    </requirements>
    <!-- Any exit code of 1 or higher is reported as a tool error. -->
    <stdio>
        <exit_code range="1:" />
    </stdio>
    <command>
<![CDATA[
        ## Unpack the input archive into the working directory.
        ## The unzip output (stdout and stderr) is discarded.
        unzip '$FASTA' &> /dev/null &&

        ## Comma-separated list of the paths of all cmsearch result tables.
        #set $inputFiles = ','.join([str($cms_res) for $cms_res in $cmsearch_results])

        ## Comma-separated list of the paths of all model tree files.
        #set $inputFilesTrees = ','.join([str($mods) for $mods in $model_tree_files])

        ## Positional arguments, in order: cmsearch tables, merge_cluster_ol,
        ## merge_overlap, min_cluster_size, cm_min_bitscore, cm_max_eval,
        ## cm_bitscore_sig, partition_type, an empty placeholder, cut_type,
        ## model tree files.
        'glob_res.pl' '$inputFiles' $merge_cluster_ol $merge_overlap $min_cluster_size $cm_min_bitscore $cm_max_eval $cm_bitscore_sig $partition_type '' $cut_type '$inputFilesTrees'
        #if $iteration_num.iteration_num_selector:
            ## These three inputs are declared inside the iteration_num
            ## conditional, so they are referenced through it.
            $iteration_num.CI
            '$iteration_num.final_partition_soft'
            '$iteration_num.final_partition_used_cmsearch'
        #end if

        &&
        python '$__tool_directory__/evaluation.py'
]]>
    </command>
    <inputs>
        <!-- Zip archive that is unpacked into the working directory before glob_res.pl runs. -->
        <param type="data" name="FASTA" format="zip" />
        <!-- One or more datasets each; their paths are passed to glob_res.pl as comma-separated lists. -->
        <param type="data" name="cmsearch_results" format="tabular" multiple="true"/>
        <param type="data" name="model_tree_files" format="txt" multiple="true"/>
        <!-- Both flags are passed as 0 when checked and 1 when unchecked. -->
        <param name="partition_type" type="boolean" checked="true" truevalue="0" falsevalue="1" label="Hard partition"/>
        <param name="cut_type" type="boolean" checked="true" truevalue="0" falsevalue="1" label="Use CM score for cutoff" help="otherwise use E-value"/>
        <!-- When enabled, the iteration number and two partition files are appended to the glob_res.pl call. -->
        <conditional name="iteration_num">
            <param name="iteration_num_selector" type="boolean" checked="false" label="Multiple iterations" help="for single iteration- NO, for multiple-YES"/>
            <when value="true">
                <param name="CI" type="integer" value="2" size="5" label="Number of current iteration "/>
                <param type="data" name="final_partition_soft" format="txt" />
                <param type="data" name="final_partition_used_cmsearch" format="txt" />
            </when>
            <when value="false"/>
        </conditional>
        <!-- Thresholds forwarded unchanged to glob_res.pl as positional arguments. -->
        <param name="merge_cluster_ol" type="float" value="0.66" size="5" label="merge_cluster_ol" help=""/>
        <param name="merge_overlap" type="float" value="0.51" size="5" label="merge_overlap" help=""/>
        <param name="min_cluster_size" type="integer" value="3" size="5" label="min_cluster_size" help=""/>
        <param name="cm_min_bitscore" type="integer" value="20" size="5" label="cm_min_bitscore" help=""/>
        <param name="cm_max_eval" type="float" value="0.001" size="5" label="cm_max_eval" help=""/>
        <param name="cm_bitscore_sig" type="integer" value="1" size="5" label="cm_bitscore_sig" help=""/>
    </inputs>
    <outputs>
        <!-- Fixed files picked up from the RESULTS directory of the job. -->
        <data name="final_stats" format="txt" from_work_dir="RESULTS/cluster.final.stats" label="cluster.final.stats" />
        <data name="tableForEval" format="tabular" from_work_dir="RESULTS/fullTab.tabular" label="tableForEval" />
        <data name="final_soft" format="txt" from_work_dir="RESULTS/partitions/final_partition.soft" label="soft_part" />
        <data name="final_used_cmsearch" format="txt" from_work_dir="RESULTS/partitions/final_partition.used_cmsearch" label="final_partition_used_cmsearch" />
        <!-- Every file in RESULTS whose name ends in ".all" becomes one element of this list. -->
        <collection name="clusters" type="list" label="CLUSTERS">
            <discover_datasets pattern="(?P&lt;name&gt;^.*\.all$)" directory="RESULTS" />
        </collection>
        <!-- Every file in RESULTS/partitions becomes one element of this list. -->
        <collection name="partitions" type="list" label="Partitions">
            <discover_datasets pattern="(?P&lt;name&gt;^.*$)" directory="RESULTS/partitions" />
        </collection>
    </outputs>
    <tests>
        <!-- Single-iteration run with the default thresholds. -->
        <test>
            <!-- NOTE(review): ftype differs from the zip format declared on the FASTA input; confirm this is intended. -->
            <param name="FASTA" value="FASTA.zip" ftype="searchgui_archive"/>
            <param name="cmsearch_results" value="1.tabular,2.tabular"/>
            <param name="model_tree_files" value="1.1.model.tree.fa,1.2.model.tree.fa"/>
            <param name="partition_type" value="0"/>
            <param name="cut_type" value="0"/>
            <conditional name="iteration_num">
                <param name="iteration_num_selector" value="false"/>
            </conditional>
            <param name="merge_cluster_ol" value="0.66"/>
            <param name="merge_overlap" value="0.51"/>
            <param name="min_cluster_size" value="3"/>
            <param name="cm_min_bitscore" value="20"/>
            <param name="cm_max_eval" value="0.001"/>
            <param name="cm_bitscore_sig" value="1"/>
            <output name="final_stats" file="RESULTS/cluster.final.stats" />
            <output_collection name="clusters" type="list">
                <element name="1.cluster.all" file="RESULTS/1.cluster.all" compare="contains"/>
                <element name="2.cluster.all" file="RESULTS/2.cluster.all" compare="contains"/>
            </output_collection>
            <output_collection name="partitions">
                <element name="final_overlap.map" file="RESULTS/partitions/final_overlap.map" compare="contains">
                    <assert_contents>
                        <has_text text="1.1 1.1" />
                        <has_text text="1.2 1.2" />
                    </assert_contents>
                </element>
                <element name="final_overlap.matrix" file="RESULTS/partitions/final_overlap.matrix" compare="contains">
                    <assert_contents>
                        <has_text text="MODEL CLASS 0 0" />
                        <has_text text="1.2" />
                        <has_text text="1.1" />
                    </assert_contents>
                </element>
                <element name="final_partition.hard.best" file="RESULTS/partitions/final_partition.hard.best" />
                <element name="final_partition.hard.merged" file="RESULTS/partitions/final_partition.hard.merged" />
                <element name="final_partition.soft" file="RESULTS/partitions/final_partition.soft" />
                <element name="final_partition.used_cmsearch" file="RESULTS/partitions/final_partition.used_cmsearch" compare="contains"/>
            </output_collection>
        </test>
    </tests>
    <help>
<![CDATA[

**What it does**

Post-processing. Redundant clusters are merged and instances that belong to multiple clusters
are assigned unambiguously. For every pair of clusters, the relative overlap (i.e. the fraction of
instances that occur in both clusters) is computed and clusters are merged if the overlap exceeds 50%.
Cluster members are finally ranked by their CM bitscore.

]]>
    </help>
    <citations>
        <citation type="bibtex">@inproceedings{costa2010fast,
title={Fast neighborhood subgraph pairwise distance kernel},
author={Costa, Fabrizio and De Grave, Kurt},
booktitle={Proceedings of the 26th International Conference on Machine Learning},
pages={255--262},
year={2010},
organization={Omnipress}
}
        </citation>
    </citations>
</tool>