Mercurial > repos > pieterlukasse > primo_multiomics

diff results2o.xml @ 0:5bc82cf5439b
Initial commit
author: pieter.lukasse@wur.nl
date: Fri, 02 May 2014 15:36:43 +0200
children: eb0b7889dd08
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/results2o.xml	Fri May 02 15:36:43 2014 +0200
@@ -0,0 +1,97 @@
+<tool name="Results2O" id="results2o1" version="0.0.1">
+	<description>use ontology mapping to annotate results (e.g. annotate protein identifications with Gene Ontology[GO] terms)</description>
+	<!-- 
+	   For remote debugging start you listener on port 8000 and use the following as command interpreter:
+	       java -jar -Xdebug -Xrunjdwp:transport=dt_socket,address=D0100564.wurnet.nl:8000 
+	    -->
+	<command interpreter="java -jar ">
+	    Results2O.jar 
+		-inputFileName $inputFileName
+ 		-inputIdColumnName "$inputIdColumnName"
+ 		-inputIdPrefix "$inputIdPrefix"  
+		-quantifColumn "$quantifColumn" 
+		
+		-ontologyMappingFileName $ontologyMappingFileName
+		-mappingFileIdColName "$mappingFileIdColName"  
+		-mappingIdPrefix "$mappingIdPrefix"  
+		-mappingFileOntologyTermColName "$mappingFileOntologyTermColName"
+		
+		-outputFileName $outputFileName
+		-outputObservationsFileName $outputObservationsFileName
+        	    
+	</command>
+	
+	<inputs>
+	 	
+  		<param name="inputFileName" type="data" format="tabular,csv" label="Input file (TSV/CSV)" />
+  		<param name="inputIdColumnName" type="text" size="50" value="" label="ID column name" help="Name of the column containing the identification codes (in the given input file)"/>
+  		<param name="inputIdPrefix" type="text" size="50" value="" label="(Optional) Prefix in ID column" 
+  				help="Fill in if any prefix is found in the ID column values (e.g. in some 
+					 files the value is preceded by a fixed value like for example 'lipidmaps:LMFA00000007' instead of just 'LMFA00000007' - in this 
+					 example one would fill in 'lipidmaps:' as prefix)"/>
+  		<param name="quantifColumn" type="text" size="50" value="" label="(Optional) Values column name" help="Name of the column containing the quantification values (in the given input file)"/>
+  		
+  		<!-- =================== ONTOLOGY part ============== -->
+  		<param name="ontologyMappingFileName" type="data" format="obo" label="ID to Ontology mapping file (TSV/CSV)" help="Simple file linking the coding scheme used for the identifications in the given input file to one or more ontology terms."/>
+  		<param name="mappingFileIdColName" type="text" size="50" value="" label="ID column name (in ontology mapping file)" help="Name of the column containing the identification codes (which will in fact link the input file records to the ontology records)"/>
+  		<param name="mappingIdPrefix" type="text" size="50" value="" label="(Optional) Prefix in mapping ID column" 
+  				help="Fill in if any prefix is found in the ID column values (e.g. in some 
+					 files the value is preceded by a fixed value like for example 'lipidmaps:LMFA00000007' instead of just 'LMFA00000007' - in this 
+					 example one would fill in 'lipidmaps:' as prefix)"/>
+
+  		<param name="mappingFileOntologyTermColName" type="text" size="50" value="" label="Ontology term column name" help="Name of the column containing the ontology terms in the ontology mapping file (and which will be transfered to the input file)"/>
+  		
+     	
+	</inputs>
+	<outputs>
+		#if isinstance( $inputFileName.datatype, $__app__.datatypes_registry.get_datatype_by_extension('tabular').__class__):
+			<data name="outputFileName" format="tabular" label="${tool.name} on ${on_string}: annotated file " ></data>
+		#else:
+       		<data name="outputFileName" format="csv" label="${tool.name} on ${on_string}: annotated file " ></data>
+   		#end if
+	  
+	  <data name="outputObservationsFileName" format="tabular" label="${tool.name} on ${on_string}: ontology observations file (TSV)"></data>
+	</outputs>
+	<tests>
+	  <!--  find out how to use -->
+	  <test>
+	  </test>
+	</tests>
+  <help>
+  
+.. class:: infomark
+  
+This tool is responsible for annotating quantifications result file 
+with the ontology terms given in a mapping file. This mapping file links the items found in the result file
+(e.g. protein identifications coded in common protein coding formats such as UniProt )
+to their respective ontology terms (e.g. GO terms). It enables users to use the cross-reference 
+information now available in different repositories (like uniprot and KEGG - see for example
+http://www.uniprot.org/taxonomy/ or http://www.genome.jp/linkdb/ )
+to map their results to other useful coding schemes such as ontologies for functional annotations.  
+ 
+As an example for transcripts and proteins, users can check http://www.uniprot.org/taxonomy/ to
+see if their organism has been mapped to GO terms by Uniprot. For example the link 
+http://www.uniprot.org/uniprot/?query=taxonomy:2850 will show the Uniprot repository and cross-references
+for the taxonomy 2850.
+When the organism being studied is not available, then other strategies 
+could be tried (like Blast2GO for example).
+
+
+Despite the specific examples above, this class is generic and can be used to map any 
+results file to an Ontology according to a given mapping file. One example would be mapping metabolomics
+identifications to the CheBI ontology.    
+  
+
+-----
+
+**Output**
+
+This method will read in the given input file and for each line it will add a new column 
+containing the Ontology terms found for the ID in that line. So the output file is the same as the 
+input file + extra Ontology terms column (separated by ; ).
+
+A second summarized "ontology observations" file is also generated which can be used for visualizing the results
+in an ontology viewer (e.g. see OntologyAndObservationsViewer). 
+
+  </help>
+</tool>
author	pieter.lukasse@wur.nl
date	Fri, 02 May 2014 15:36:43 +0200
parents
children	eb0b7889dd08