Repository 'proteore_clusterprofiler'
hg clone https://toolshed.g2.bx.psu.edu/repos/proteore/proteore_clusterprofiler

Changeset 13:f6107b8ae8f8 (2021-04-09)
Previous changeset 12:85f039f53414 (2020-01-24)
Commit message:
"planemo upload commit be9070db4a3b178ab45ecd9c9c3ab369240f7617-dirty"
modified:
GO-enrich.R
cluster_profiler.xml
test-data/EGO_BP_bar-plot
test-data/EGO_BP_dot-plot
test-data/EGO_CC_bar-plot
test-data/EGO_CC_dot-plot
test-data/GGO_BP_bar-plot
test-data/GGO_CC_bar-plot
test-data/GGO_MF_bar-plot
test-data/cluster_profiler_EGO_CC.csv
test-data/cluster_profiler_EGO_MF.csv
test-data/cluster_profiler_GGO_BP.csv
test-data/cluster_profiler_GGO_CC.csv
test-data/cluster_profiler_GGO_MF.csv
b
diff -r 85f039f53414 -r f6107b8ae8f8 GO-enrich.R
--- a/GO-enrich.R Fri Jan 24 05:12:09 2020 -0500
+++ b/GO-enrich.R Fri Apr 09 14:39:05 2021 +0000
[
b'@@ -1,63 +1,77 @@\n-options(warn=-1)  #TURN OFF WARNINGS !!!!!!\n-suppressMessages(library(clusterProfiler,quietly = TRUE))\n+options(warn = -1)  #TURN OFF WARNINGS !!!!!!\n+suppressMessages(library(clusterProfiler, quietly = TRUE))\n \n # Read file and return file content as data.frame\n-read_file <- function(path,header){\n-  file <- try(read.csv(path,header=header, sep="\\t",stringsAsFactors = FALSE, quote="",check.names = F),silent=TRUE)\n-  if (inherits(file,"try-error")){\n+read_file <- function(path, header) {\n+  file <- try(read.csv(path, header = header, sep = "\\t",\n+                       stringsAsFactors = FALSE, quote = "", check.names = F),\n+                      silent = TRUE)\n+  if (inherits(file, "try-error")) {\n     stop("File not found !")\n   }else{\n-    file <- file[!apply(is.na(file) | file == "", 1, all), , drop=FALSE]\n+    file <- file[!apply(is.na(file) | file == "", 1, all), , drop = FALSE]\n     return(file)\n   }\n }\n \n-#return the number of character from the longest description found (from the 10 first)\n-max_str_length_10_first <- function(vector){\n+\n+#return the number of character from the longest description found\n+#(from the 10 first)\n+max_str_length_10_first <- function(vector) {\n   vector <- as.vector(vector)\n-  nb_description = length(vector)\n-  if (nb_description >= 10){nb_description=10}\n+  nb_description <- length(vector)\n+  if (nb_description >= 10) {\n+    nb_description <- 10\n+    }\n+\n   return(max(nchar(vector[1:nb_description])))\n }\n \n-str2bool <- function(x){\n-  if (any(is.element(c("t","true"),tolower(x)))){\n-    return (TRUE)\n-  }else if (any(is.element(c("f","false"),tolower(x)))){\n-    return (FALSE)\n+str2bool <- function(x) {\n+  if (any(is.element(c("t", "true"), tolower(x)))) {\n+    return(TRUE)\n+  }else if (any(is.element(c("f", "false"), tolower(x)))) {\n+    return(FALSE)\n+\n   }else{\n     return(NULL)\n   }\n }\n \n #used before the limit was set to 50 characters\n-width_by_max_char <- function (nb_max_char) {\n-  if (nb_max_char < 50 ){\n-    width=600\n+width_by_max_char <- function(nb_max_char) {\n+  if (nb_max_char < 50) {\n+    width <- 600\n   } else if (nb_max_char < 75) {\n-    width=800\n+    width <- 800\n   } else if (nb_max_char < 100) {\n-    width=900\n+    width <- 900\n   } else {\n-    width=1000\n+    width <- 1000\n   }\n-  return (width)\n+  return(width)\n }\n \n-repartition_GO <- function(geneid, orgdb, ontology, level=3, readable=TRUE) {\n-  ggo<-groupGO(gene=geneid, \n-               OrgDb = orgdb, \n-               ont=ontology, \n-               level=level, \n-               readable=TRUE)\n+\n+repartition_go <- function(geneid, orgdb, ontology,\n+                           level = 3, readable = TRUE) {\n+  ggo <- groupGO(gene = geneid,\n+                OrgDb = orgdb,\n+                ont = ontology,\n+                level = level,\n+                readable = TRUE)\n+\n \n-  if (length(ggo@result$ID) > 0 ) {\n-    ggo@result$Description <- sapply(as.vector(ggo@result$Description), function(x) {ifelse(nchar(x)>50, substr(x,1,50),x)},USE.NAMES = FALSE)\n-    #nb_max_char = max_str_length_10_first(ggo$Description)\n-    #width = width_by_max_char(nb_max_char)\n+  if (length(ggo@result$ID) > 0) {\n+    ggo@result$Description <- sapply(as.vector(ggo@result$Description), #nolint\n+                              function(x) {\n+                                ifelse(nchar(x) > 50,\n+                                substr(x, 1, 50), x)}, USE.NAMES = FALSE)\n+\n+\n     name <- paste("GGO_", ontology, "_bar-plot", sep = "")\n-    png(name,height = 720, width = 600)\n-    p <- barplot(ggo, showCategory=10)\n+    png(name, height = 720, width = 600)\n+    p <- barplot(ggo, showCategory = 10)\n     print(p)\n     dev.off()\n     ggo <- as.data.frame(ggo)\n@@ -65,75 +79,85 @@\n   }\n }\n \n+# nolint end\n+\n # GO over-representation test\n-enrich_GO <- function(geneid, universe, orgdb, ontology, pval_cutoff, qval_cutoff,plot) {\n-  ego<-enrichGO(gene=geneid,\n-                universe=universe,\n-                OrgDb=orgdb,\n-                '..b'sapply(universe_file[,universe_ncol], function(x) rapply(strsplit(x,";"),c),USE.NAMES = FALSE))\n+        universe <- unlist(sapply(universe_file[, universe_ncol],\n+                function(x) rapply(strsplit(x, ";"), c), USE.NAMES = FALSE))\n       }\n-      universe = clean_ids(input)\n-      universe_id_type = args$universe_id_type\n+      universe <- clean_ids(input)\n+      universe_id_type <- args$universe_id_type\n       ##to initialize\n-      if (universe_id_type=="Uniprot" & any(check_ids(universe,"uniprot"))) {\n-        idFrom<-"UNIPROT"\n-        idTo<-"ENTREZID"\n-        suppressMessages(universe_gene<-bitr(universe, fromType=idFrom, toType=idTo, OrgDb=orgdb))\n-        universe_gene<-unique(universe_gene$ENTREZID)\n-      } else if (universe_id_type=="Entrez" & any(check_ids(universe,"entrez"))) {\n-        universe_gene<-unique(unlist(universe))\n+      if (universe_id_type == "Uniprot" & any(check_ids(universe, "uniprot"))) {\n+        idfrom <- "UNIPROT"\n+        idto <- "ENTREZID"\n+        suppressMessages(universe_gene <- bitr(universe, fromType = idfrom,\n+                                               toType = idto, OrgDb = orgdb))\n+        universe_gene <- unique(universe_gene$ENTREZID)\n+      } else if (universe_id_type == "Entrez" &\n+                 any(check_ids(universe, "entrez"))) {\n+        universe_gene <- unique(unlist(universe))\n       } else {\n-        if (universe_type=="text"){\n-          print(paste(universe_id_type,"not found in your background IDs list",sep=" "))\n+        if (universe_type == "text") {\n+          print(paste(universe_id_type, "not found in your background IDs list",\n+                      sep = " "))\n         } else {\n-          print(paste(universe_id_type,"not found in the column",universe_ncol,"of your background IDs file",sep=" "))\n+          print(paste(universe_id_type, "not found in the column",\n+                      universe_ncol, "of your background IDs file", sep = " "))\n+\n         }\n-        universe_gene = NULL\n-      } \n+        universe_gene <- NULL\n+      }\n     } else {\n-      universe_gene = NULL\n+      universe_gene <- NULL\n     }\n   } else {\n-    universe_gene = NULL\n+    universe_gene <- NULL\n   }\n \n   ##enrichGO : GO over-representation test\n   for (onto in ontology) {\n     if (go_represent) {\n-      ggo<-repartition_GO(gene, orgdb, onto, level, readable=TRUE)\n-      if (is.list(ggo)){ggo <- as.data.frame(apply(ggo, c(1,2), function(x) gsub("^$|^ $", NA, x)))}  #convert "" and " " to NA\n-      output_path = paste("cluster_profiler_GGO_",onto,".tsv",sep="")\n-      write.table(ggo, output_path, sep="\\t", row.names = FALSE, quote = FALSE )\n+      ggo <- repartition_go(gene, orgdb, onto, level, readable = TRUE)\n+      if (is.list(ggo)) {\n+        ggo <- as.data.frame(apply(ggo, c(1, 2),\n+              function(x) gsub("^$|^ $", NA, x)))\n+      }  #convert "" and " " to NA\n+      output_path <- paste("cluster_profiler_GGO_", onto, ".tsv", sep = "")\n+      write.table(ggo, output_path, sep = "\\t",\n+                  row.names = FALSE, quote = FALSE)\n+\n     }\n \n     if (go_enrich) {\n-      ego<-enrich_GO(gene, universe_gene, orgdb, onto, pval_cutoff, qval_cutoff,plot)\n-      if (is.list(ego)){ego <- as.data.frame(apply(ego, c(1,2), function(x) gsub("^$|^ $", NA, x)))}  #convert "" and " " to NA\n-      output_path = paste("cluster_profiler_EGO_",onto,".tsv",sep="")\n-      write.table(ego, output_path, sep="\\t", row.names = FALSE, quote = FALSE )\n+      ego <- enrich_go(gene, universe_gene, orgdb, onto, pval_cutoff,\n+                       qval_cutoff, plot)\n+      if (is.list(ego)) {\n+        ego <- as.data.frame(apply(ego, c(1, 2),\n+                function(x) gsub("^$|^ $", NA, x)))\n+        }  #convert "" and " " to NA\n+      output_path <- paste("cluster_profiler_EGO_", onto, ".tsv", sep = "")\n+      write.table(ego, output_path, sep = "\\t",\n+                  row.names = FALSE, quote = FALSE)\n     }\n   }\n }\n \n-if(!interactive()) {\n+if (!interactive()) {\n   main()\n }\n'
b
diff -r 85f039f53414 -r f6107b8ae8f8 cluster_profiler.xml
--- a/cluster_profiler.xml Fri Jan 24 05:12:09 2020 -0500
+++ b/cluster_profiler.xml Fri Apr 09 14:39:05 2021 +0000
[
@@ -1,12 +1,13 @@
-<tool id="cluter_profiler" name="Classification and enrichment analysis" version="2019.01.23">
+<tool id="cluter_profiler" name="Classification and enrichment analysis" version="2021.04.08">
     <description>(Human, Mouse, Rat)[clusterProfiler]</description>
     <requirements>
-        <requirement type="package">R</requirement>
-        <requirement type="package" version="3.8.2">bioconductor-org.hs.eg.db</requirement>
-        <requirement type="package" version="3.8.2">bioconductor-org.mm.eg.db</requirement>
-        <requirement type="package" version="3.8.2">bioconductor-org.Rn.eg.db</requirement>
-        <requirement type="package" version="3.10.2">bioconductor-dose</requirement>
-        <requirement type="package" version="3.12.0">bioconductor-clusterprofiler</requirement>
+        <requirement type="package" version="4.0.3">r-base</requirement>
+        <requirement type="package" version="3.12.0">bioconductor-org.hs.eg.db</requirement>
+        <requirement type="package" version="3.12.0">bioconductor-org.mm.eg.db</requirement>
+        <requirement type="package" version="3.12.0">bioconductor-org.rn.eg.db</requirement>
+        <requirement type="package" version="1.52.0">bioconductor-annotationdbi</requirement>
+        <requirement type="package" version="3.16.0">bioconductor-dose</requirement>
+        <requirement type="package" version="3.18.1">bioconductor-clusterprofiler</requirement>
     </requirements>
     <command detect_errors="exit_code"><![CDATA[
         Rscript "$__tool_directory__/GO-enrich.R"
@@ -202,12 +203,12 @@
             <param name="plot" value="dotplot,barplot"/>
             <output name="log" file="log.txt" />
             <output_collection name="text_output">
-                <element name="cluster_profiler_GGO_CC.csv" file="cluster_profiler_GGO_CC.csv" ftype="csv"/>
-                <element name="cluster_profiler_EGO_BP.csv" file="cluster_profiler_GGO_BP.csv" ftype="csv"/>
-                <element name="cluster_profiler_GGO_MF.csv" file="cluster_profiler_GGO_MF.csv" ftype="csv"/>
-                <element name="cluster_profiler_EGO_CC.csv" file="cluster_profiler_EGO_CC.csv" ftype="csv"/>
-                <element name="cluster_profiler_EGO_BP.csv" file="cluster_profiler_EGO_BP.csv" ftype="csv"/>
-                <element name="cluster_profiler_EGO_MF.csv" file="cluster_profiler_EGO_MF.csv" ftype="csv"/>
+                <element name="cluster_profiler_GGO_CC.tsv" file="cluster_profiler_GGO_CC.csv" ftype="tsv"/>
+<!---                <element name="cluster_profiler_GGO_BP.tsv" file="cluster_profiler_GGO_BP.csv" ftype="tsv"/> -->
+                <element name="cluster_profiler_GGO_MF.tsv" file="cluster_profiler_GGO_MF.csv" ftype="tsv"/>
+                <element name="cluster_profiler_EGO_CC.tsv" file="cluster_profiler_EGO_CC.csv" ftype="tsv"/>
+                <element name="cluster_profiler_EGO_BP.tsv" file="cluster_profiler_GGO_BP.csv" ftype="tsv"/>
+                <element name="cluster_profiler_EGO_MF.tsv" file="cluster_profiler_EGO_MF.csv" ftype="tsv"/>
             </output_collection>
             <output_collection name="graph_output">
                 <element name="GGO_CC_bar-plot" file="GGO_CC_bar-plot" ftype="png"/>
@@ -289,11 +290,11 @@
 
 Bioconductor Packages used:
 
-    - bioconductor-org.hs.eg.db v3.8.2
-    - bioconductor-org.mm.eg.db v3.8.2
-    - bioconductor-org.rn.eg.db v3.8.2
-    - dose v3.10.2
-    - clusterprofiler v 3.12.0
+    - bioconductor-org.hs.eg.db v3.12.0
+    - bioconductor-org.mm.eg.db v3.12.0
+    - bioconductor-org.rn.eg.db v3.12.0
+    - dose v3.16.0
+    - clusterprofiler v 3.18.1
 
 .. class:: infomark
 
@@ -301,7 +302,7 @@
 
 Lien Nguyen, Florence Combes, Yves Vandenbrouck - CEA, INSERM, CNRS, Grenoble-Alpes University, BIG Institute, FR
 
-Sandra Dérozier, Olivier Rué, Christophe Caron, Valentin Loux - INRA, Paris-Saclay University, MAIAGE Unit, Migale Bioinformatics platform, FR
+Christophe Caron, Valentin Loux - INRAE, Paris-Saclay University, MAIAGE Unit, Migale Bioinformatics platform, FR
 
 This work has been partially funded through the French National Agency for Research (ANR) IFB project.
 
b
diff -r 85f039f53414 -r f6107b8ae8f8 test-data/EGO_BP_bar-plot
b
Binary file test-data/EGO_BP_bar-plot has changed
b
diff -r 85f039f53414 -r f6107b8ae8f8 test-data/EGO_BP_dot-plot
b
Binary file test-data/EGO_BP_dot-plot has changed
b
diff -r 85f039f53414 -r f6107b8ae8f8 test-data/EGO_CC_bar-plot
b
Binary file test-data/EGO_CC_bar-plot has changed
b
diff -r 85f039f53414 -r f6107b8ae8f8 test-data/EGO_CC_dot-plot
b
Binary file test-data/EGO_CC_dot-plot has changed
b
diff -r 85f039f53414 -r f6107b8ae8f8 test-data/GGO_BP_bar-plot
b
Binary file test-data/GGO_BP_bar-plot has changed
b
diff -r 85f039f53414 -r f6107b8ae8f8 test-data/GGO_CC_bar-plot
b
Binary file test-data/GGO_CC_bar-plot has changed
b
diff -r 85f039f53414 -r f6107b8ae8f8 test-data/GGO_MF_bar-plot
b
Binary file test-data/GGO_MF_bar-plot has changed
b
diff -r 85f039f53414 -r f6107b8ae8f8 test-data/cluster_profiler_EGO_CC.csv
--- a/test-data/cluster_profiler_EGO_CC.csv Fri Jan 24 05:12:09 2020 -0500
+++ b/test-data/cluster_profiler_EGO_CC.csv Fri Apr 09 14:39:05 2021 +0000
b
b'@@ -1,18 +1,41 @@\n ID\tDescription\tGeneRatio\tBgRatio\tpvalue\tp.adjust\tqvalue\tgeneID\tCount\n-GO:0034774\tsecretory granule lumen\t22/152\t111/2939\t2.07482731603193e-08\t3.16370874431657e-06\t2.781282412586e-06\tALB/ANXA2/JUP/LTF/SERPINB3/FABP5/CAT/EEF2/TUBB4B/LYZ/CTSD/GSTP1/ALDOA/VCL/SERPINA3/LCN2/GSN/AGA/PNP/S100A11/GDI2/NPC2\t22\n-GO:0031983\tvesicle lumen\t22/152\t114/2939\t3.4766030157325e-08\t3.16370874431657e-06\t2.781282412586e-06\tALB/ANXA2/JUP/LTF/SERPINB3/FABP5/CAT/EEF2/TUBB4B/LYZ/CTSD/GSTP1/ALDOA/VCL/SERPINA3/LCN2/GSN/AGA/PNP/S100A11/GDI2/NPC2\t22\n-GO:0060205\tcytoplasmic vesicle lumen\t22/152\t114/2939\t3.4766030157325e-08\t3.16370874431657e-06\t2.781282412586e-06\tALB/ANXA2/JUP/LTF/SERPINB3/FABP5/CAT/EEF2/TUBB4B/LYZ/CTSD/GSTP1/ALDOA/VCL/SERPINA3/LCN2/GSN/AGA/PNP/S100A11/GDI2/NPC2\t22\n-GO:0030141\tsecretory granule\t30/152\t232/2939\t1.22925605779538e-06\t8.38967259445349e-05\t7.3755363467723e-05\tDSP/ALB/DSG1/ANXA2/JUP/LTF/SERPINB3/FABP5/PIGR/CAT/EEF2/TUBB4B/LYZ/CTSD/DMBT1/SOD1/GSTP1/ALDOA/CAPN1/VCL/SERPINA3/LCN2/GSN/AGA/PNP/LAMP1/LAMP2/S100A11/GDI2/NPC2\t30\n-GO:0099503\tsecretory vesicle\t30/152\t251/2939\t6.60174269183974e-06\t0.00036045515097445\t0.000316883649208308\tDSP/ALB/DSG1/ANXA2/JUP/LTF/SERPINB3/FABP5/PIGR/CAT/EEF2/TUBB4B/LYZ/CTSD/DMBT1/SOD1/GSTP1/ALDOA/CAPN1/VCL/SERPINA3/LCN2/GSN/AGA/PNP/LAMP1/LAMP2/S100A11/GDI2/NPC2\t30\n-GO:0101002\tficolin-1-rich granule\t14/152\t72/2939\t1.18733421290438e-05\t0.000540237066871494\t0.000474933685161753\tDSP/DSG1/JUP/CAT/EEF2/CTSD/GSTP1/ALDOA/CAPN1/VCL/GSN/PNP/LAMP1/LAMP2\t14\n-GO:0005766\tprimary lysosome\t12/152\t61/2939\t4.56978270565284e-05\t0.00143685132139962\t0.00126316599683483\tANXA2/SERPINB3/FABP5/PIGR/TUBB4B/LYZ/SERPINA3/AGA/LAMP1/LAMP2/GDI2/NPC2\t12\n-GO:0042582\tazurophil granule\t12/152\t61/2939\t4.56978270565284e-05\t0.00143685132139962\t0.00126316599683483\tANXA2/SERPINB3/FABP5/PIGR/TUBB4B/LYZ/SERPINA3/AGA/LAMP1/LAMP2/GDI2/NPC2\t12\n-GO:0031012\textracellular matrix\t17/152\t113/2939\t4.73687248813062e-05\t0.00143685132139962\t0.00126316599683483\tDSP/DSG1/ANXA2/JUP/PLEC/LMNA/HSPA5/CSTA/GAPDH/EEF2/MYH9/TUBB4B/CTSD/FLNB/SOD1/HSPB1/ATP5A1\t17\n-GO:0005882\tintermediate filament\t7/152\t21/2939\t5.43339859285434e-05\t0.00148331781584923\t0.00130401566228504\tDSP/KRT6A/JUP/KRT17/KRT6B/LMNA/KRT15\t7\n-GO:0035578\tazurophil granule lumen\t9/152\t39/2939\t0.000116381481601412\t0.00288837677065322\t0.00253923232584899\tANXA2/SERPINB3/FABP5/TUBB4B/LYZ/SERPINA3/AGA/GDI2/NPC2\t9\n-GO:0045111\tintermediate filament cytoskeleton\t8/152\t32/2939\t0.000154925405587284\t0.00352455297711071\t0.00309850811174568\tDSP/KRT6A/JUP/KRT17/PLEC/KRT6B/LMNA/KRT15\t8\n-GO:1904813\tficolin-1-rich granule lumen\t10/152\t53/2939\t0.000289825905131926\t0.00573615147717977\t0.00504277052938881\tJUP/CAT/EEF2/CTSD/GSTP1/ALDOA/CAPN1/VCL/GSN/PNP\t10\n-GO:0005775\tvacuolar lumen\t11/152\t63/2939\t0.000294161614214347\t0.00573615147717977\t0.00504277052938881\tANXA2/SERPINB3/FABP5/TUBB4B/LYZ/CTSD/SERPINA3/AGA/LAMP2/GDI2/NPC2\t11\n-GO:0001533\tcornified envelope\t5/152\t13/2939\t0.000318245371505049\t0.00579206576139188\t0.00509192594408078\tDSP/DSG1/JUP/ANXA1/CSTA\t5\n-GO:0044433\tcytoplasmic vesicle part\t32/152\t338/2939\t0.000357212587465447\t0.00590003159894176\t0.00518684096610265\tDSP/ALB/DSG1/ANXA2/JUP/LTF/SERPINB3/FABP5/PIGR/ANXA1/CAT/SFN/EEF2/TUBB4B/LYZ/CTSD/UBA52/DMBT1/GSTP1/ALDOA/CAPN1/VCL/SERPINA3/LCN2/GSN/AGA/PNP/LAMP1/LAMP2/S100A11/GDI2/NPC2\t32\n-GO:0035580\tspecific granule lumen\t6/152\t20/2939\t0.000367401235098937\t0.00590003159894176\t0.00518684096610265\tJUP/LTF/LYZ/CTSD/VCL/LCN2\t6\n+GO:0034774\tsecretory granule lumen\t40/151\t322/19559\t4.698082e-37\t8.644911e-35\t5.879940e-35\tALB/ANXA2/JUP/LTF/SERPINB3/FABP5/HRNR/TF/CAT/S100A7/PKM/ARG1/EEF2/TUBB4B/LYZ/SERPINA1/HSP90AA1/ACTN4/CTSD/HSPA8/PPIA/GGH/GSTP1/ALDOA/VCL/HP/SERPINA3/ORM1/SERPINB1/LCN2/GSN/AGA/PNP/CSTB/ALDOC/S100A11/GDI2/ACTR2/NPC2/DEFA3\t40\n+GO:0060205\tcytoplasmic vesicle lumen\t40/151\t326/19559\t7.774260e-37\t8.644911e-35\t5.879940e-35\tALB/ANXA2/JUP/LTF/SERPINB3/FABP5/HRNR/TF/CAT/S100A7/PKM/ARG1/EEF2/TUBB4B/LYZ/SERPINA1/HSP90AA1/ACTN4/CTSD/HSPA8/PPIA/GGH/GSTP1/ALDOA/V'..b'TR2\t25\n+GO:0045111\tintermediate filament cytoskeleton\t20/151\t251/19559\t6.453595e-15\t1.290719e-13\t8.778979e-14\tDSP/KRT6A/KRT16/JUP/KRT78/KRT17/CASP14/PLEC/KRT80/KRT13/KRT6B/LMNA/EPPK1/KRT23/KRT15/FLG/KRT1/KRT2/KRT10/KRT85\t20\n+GO:0005925\tfocal adhesion\t24/151\t415/19559\t1.398172e-14\t2.596606e-13\t1.766112e-13\tJUP/ACTG1/PLEC/ANXA1/HSPA5/CAT/S100A7/HSPA1A/HSPA1B/MYH9/ACTN4/FLNB/HSPB1/HSPA8/PPIA/YWHAZ/CAPN1/VCL/YWHAE/GSN/PPIB/RPS3/GDI2/ACTR2\t24\n+GO:0070820\ttertiary granule\t16/151\t164/19559\t1.643373e-13\t2.848514e-12\t1.937451e-12\tDSP/DSG1/LTF/SERPINB12/LYZ/CTSD/GGH/ALDOA/HBB/HP/ORM1/CSTB/ALDOC/LAMP1/LAMP2/FLG2\t16\n+GO:1904724\ttertiary granule lumen\t11/151\t55/19559\t3.591112e-13\t5.835556e-12\t3.969123e-12\tLTF/LYZ/CTSD/GGH/ALDOA/HBB/HP/ORM1/CSTB/ALDOC/FLG2\t11\n+GO:0042470\tmelanosome\t13/151\t105/19559\t1.556349e-12\t2.248059e-11\t1.529044e-11\tANXA2/HSPA5/PRDX1/HSP90AA1/CTSD/HSPA8/YWHAZ/GGH/YWHAE/CTSB/LAMP1/PPIB/CAPG\t13\n+GO:0048770\tpigment granule\t13/151\t105/19559\t1.556349e-12\t2.248059e-11\t1.529044e-11\tANXA2/HSPA5/PRDX1/HSP90AA1/CTSD/HSPA8/YWHAZ/GGH/YWHAE/CTSB/LAMP1/PPIB/CAPG\t13\n+GO:0035580\tspecific granule lumen\t10/151\t62/19559\t4.246476e-11\t5.810967e-10\t3.952398e-10\tJUP/LTF/ARG1/LYZ/CTSD/GGH/VCL/HP/ORM1/LCN2\t10\n+GO:0072562\tblood microparticle\t13/151\t148/19559\t1.281364e-10\t1.665773e-09\t1.132995e-09\tALB/ACTG1/TF/HSPA1A/HSPA1B/HSPA8/YWHAZ/HBB/HP/SERPINA3/ORM1/GSN/KRT1\t13\n+GO:0045095\tkeratin filament\t10/151\t95/19559\t3.212635e-09\t3.977548e-08\t2.705377e-08\tKRT6A/KRT78/CASP14/KRT80/KRT13/KRT6B/EPPK1/KRT1/KRT2/KRT85\t10\n+GO:0030057\tdesmosome\t6/151\t25/19559\t3.006653e-08\t3.553317e-07\t2.416831e-07\tDSP/DSG1/JUP/POF1B/DSC3/PERP\t 6\n+GO:0062023\tcollagen-containing extracellular matrix\t16/151\t427/19559\t2.089490e-07\t2.362033e-06\t1.606565e-06\tANXA2/AZGP1/HRNR/ANXA1/S100A7/SERPINB12/PKM/SERPINA1/CTSD/SERPINA3/ORM1/SERPINB1/CSTB/FLG/CTSB/KRT1\t16\n+GO:0042581\tspecific granule\t10/151\t160/19559\t4.717165e-07\t5.110262e-06\t3.475806e-06\tJUP/LTF/ARG1/LYZ/CTSD/GGH/VCL/HP/ORM1/LCN2\t10\n+GO:0043202\tlysosomal lumen\t8/151\t96/19559\t7.824361e-07\t8.137336e-06\t5.534706e-06\tHSP90AA1/CTSD/HSPA8/CTSV/SERPINB13/CTSB/LAMP2/NPC2\t 8\n+GO:0030139\tendocytic vesicle\t12/151\t313/19559\t5.891879e-06\t5.891879e-05\t4.007432e-05\tLTF/ACTG1/TF/HSP90AA1/UBA52/DMBT1/FLNB/HBB/HP/GSN/LAMP1/LAMP2\t12\n+GO:0008180\tCOP9 signalosome\t5/151\t36/19559\t7.976238e-06\t7.680822e-05\t5.224203e-05\tHSPA5/HSPA1A/HSPA1B/MYH9/ATP5F1A\t 5\n+GO:0030016\tmyofibril\t10/151\t227/19559\t1.094294e-05\t1.016130e-04\t6.911330e-05\tJUP/ACTG1/ENO1/PLEC/ACTN4/FLNB/HSPB1/ALDOA/VCL/CAPZB\t10\n+GO:0031093\tplatelet alpha granule lumen\t6/151\t67/19559\t1.297451e-05\t1.163232e-04\t7.911861e-05\tALB/SERPINA1/ACTN4/ALDOA/SERPINA3/ORM1\t 6\n+GO:0071682\tendocytic vesicle lumen\t4/151\t20/19559\t1.502135e-05\t1.301850e-04\t8.854689e-05\tLTF/HSP90AA1/HBB/HP\t 4\n+GO:0043292\tcontractile fiber\t10/151\t238/19559\t1.649747e-05\t1.383658e-04\t9.411118e-05\tJUP/ACTG1/ENO1/PLEC/ACTN4/FLNB/HSPB1/ALDOA/VCL/CAPZB\t10\n+GO:0005911\tcell-cell junction\t14/151\t493/19559\t2.934284e-05\t2.384106e-04\t1.621578e-04\tDSP/DSG1/ANXA2/JUP/ACTG1/ANXA1/MYH9/POF1B/ACTN4/EPPK1/DSC3/VCL/PERP/S100A11\t14\n+GO:0005916\tfascia adherens\t3/151\t10/19559\t5.202062e-05\t4.098595e-04\t2.787708e-04\tDSP/JUP/VCL\t 3\n+GO:0031091\tplatelet alpha granule\t6/151\t91/19559\t7.444206e-05\t5.692628e-04\t3.871909e-04\tALB/SERPINA1/ACTN4/ALDOA/SERPINA3/ORM1\t 6\n+GO:0101003\tficolin-1-rich granule membrane\t5/151\t61/19559\t1.077869e-04\t7.828748e-04\t5.324816e-04\tDSP/DSG1/SERPINB12/LAMP1/LAMP2\t 5\n+GO:0045335\tphagocytic vesicle\t7/151\t140/19559\t1.083980e-04\t7.828748e-04\t5.324816e-04\tLTF/ACTG1/DMBT1/FLNB/GSN/LAMP1/LAMP2\t 7\n+GO:0005912\tadherens junction\t7/151\t166/19559\t3.098190e-04\t2.177106e-03\t1.480785e-03\tANXA2/JUP/ANXA1/MYH9/POF1B/VCL/S100A11\t 7\n+GO:0030017\tsarcomere\t7/151\t207/19559\t1.147177e-03\t7.849107e-03\t5.338664e-03\tJUP/ENO1/ACTN4/FLNB/HSPB1/ALDOA/CAPZB\t 7\n+GO:0002102\tpodosome\t3/151\t29/19559\t1.422502e-03\t9.280979e-03\t6.312568e-03\tVCL/GSN/ACTR2\t 3\n+GO:0000502\tproteasome complex\t4/151\t63/19559\t1.427843e-03\t9.280979e-03\t6.312568e-03\tHSPB1/IDE/PSMA3/PSMB3\t 4\n'
b
diff -r 85f039f53414 -r f6107b8ae8f8 test-data/cluster_profiler_EGO_MF.csv
--- a/test-data/cluster_profiler_EGO_MF.csv Fri Jan 24 05:12:09 2020 -0500
+++ b/test-data/cluster_profiler_EGO_MF.csv Fri Apr 09 14:39:05 2021 +0000
b
@@ -1,2 +1,33 @@
-x
-No Go terms enriched (EGO) found for  MF ontology
+ID Description GeneRatio BgRatio pvalue p.adjust qvalue geneID Count
+GO:0004866 endopeptidase inhibitor activity 21/152 183/18352 2.879794e-18 8.805006e-16 6.813398e-16 ANXA2/LTF/SERPINB3/SERPINB12/CSTA/GAPDH/SERPINB7/SERPINA1/LCN1/SERPINB4/A2ML1/SERPINA3/SERPINB1/CST6/SERPINB5/CSTB/SERPINB13/CST4/CST1/CST2/SERPINA12 21
+GO:0030414 peptidase inhibitor activity 21/152 189/18352 5.658871e-18 8.805006e-16 6.813398e-16 ANXA2/LTF/SERPINB3/SERPINB12/CSTA/GAPDH/SERPINB7/SERPINA1/LCN1/SERPINB4/A2ML1/SERPINA3/SERPINB1/CST6/SERPINB5/CSTB/SERPINB13/CST4/CST1/CST2/SERPINA12 21
+GO:0061135 endopeptidase regulator activity 21/152 192/18352 7.861613e-18 8.805006e-16 6.813398e-16 ANXA2/LTF/SERPINB3/SERPINB12/CSTA/GAPDH/SERPINB7/SERPINA1/LCN1/SERPINB4/A2ML1/SERPINA3/SERPINB1/CST6/SERPINB5/CSTB/SERPINB13/CST4/CST1/CST2/SERPINA12 21
+GO:0061134 peptidase regulator activity 21/152 229/18352 2.979448e-16 2.502737e-14 1.936642e-14 ANXA2/LTF/SERPINB3/SERPINB12/CSTA/GAPDH/SERPINB7/SERPINA1/LCN1/SERPINB4/A2ML1/SERPINA3/SERPINB1/CST6/SERPINB5/CSTB/SERPINB13/CST4/CST1/CST2/SERPINA12 21
+GO:0045296 cadherin binding 23/152 332/18352 4.823959e-15 3.241700e-13 2.508459e-13 ANXA2/JUP/ENO1/PLEC/ANXA1/HSPA5/SFN/PKM/PRDX1/HSPA1A/EEF2/MYH9/LDHA/FLNB/HSPA8/YWHAZ/ALDOA/VCL/YWHAE/EEF1G/S100A11/CAPG/CAPZB 23
+GO:0004857 enzyme inhibitor activity 24/152 383/18352 1.090413e-14 6.106312e-13 4.725122e-13 ANXA2/LTF/SERPINB3/ANXA1/SFN/SERPINB12/CSTA/GAPDH/SERPINB7/SERPINA1/HSPB1/LCN1/SERPINB4/A2ML1/SERPINA3/SERPINB1/CST6/SERPINB5/CSTB/SERPINB13/CST4/CST1/CST2/SERPINA12 24
+GO:0004867 serine-type endopeptidase inhibitor activity 12/152 98/18352 2.961461e-11 1.421501e-09 1.099971e-09 ANXA2/SERPINB3/SERPINB12/SERPINB7/SERPINA1/SERPINB4/A2ML1/SERPINA3/SERPINB1/SERPINB5/SERPINB13/SERPINA12 12
+GO:0004869 cysteine-type endopeptidase inhibitor activity 10/152 59/18352 5.002870e-11 2.101205e-09 1.625933e-09 LTF/SERPINB3/CSTA/LCN1/CST6/CSTB/SERPINB13/CST4/CST1/CST2 10
+GO:0005200 structural constituent of cytoskeleton 12/152 104/18352 6.039944e-11 2.254912e-09 1.744873e-09 DSP/KRT6A/KRT16/ACTG1/PLEC/KRT6B/TUBB4B/TUBA1B/KRT15/ARPC4/ACTR2/KRT2 12
+GO:0030280 structural constituent of skin epidermis 5/152 14/18352 6.878186e-08 2.311071e-06 1.788328e-06 FLG/KRT1/KRT2/KRT10/SPRR2E  5
+GO:0016209 antioxidant activity 8/152 86/18352 5.656494e-07 1.727802e-05 1.336990e-05 ALB/CAT/PRDX1/TXN/SOD1/GSTP1/HBB/HP  8
+GO:0031625 ubiquitin protein ligase binding 13/152 297/18352 1.180500e-06 3.305399e-05 2.557749e-05 ACTG1/HSPA5/TPI1/HSPA1A/HSPA1B/TUBA1B/HSP90AA1/UBA52/HSPA8/YWHAZ/VCL/YWHAE/PSMA3 13
+GO:0002020 protease binding 9/152 137/18352 2.103106e-06 5.435719e-05 4.206211e-05 ANXA2/SERPINB3/CSTA/SERPINA1/SERPINB4/A2ML1/LCN2/CSTB/SERPINB13  9
+GO:0044389 ubiquitin-like protein ligase binding 13/152 316/18352 2.348473e-06 5.636336e-05 4.361450e-05 ACTG1/HSPA5/TPI1/HSPA1A/HSPA1B/TUBA1B/HSP90AA1/UBA52/HSPA8/YWHAZ/VCL/YWHAE/PSMA3 13
+GO:0044183 protein folding chaperone 5/152 27/18352 2.542764e-06 5.695792e-05 4.407458e-05 HSPA5/HSPA1A/HSPA1B/HSPB1/HSPA8  5
+GO:0051082 unfolded protein binding 8/152 118/18352 6.238763e-06 1.310140e-04 1.013799e-04 HSPA5/HSPA1A/HSPA1B/TUBB4B/HSP90AA1/HSPA8/PPIA/PPIB  8
+GO:0023026 MHC class II protein complex binding 4/152 16/18352 7.618701e-06 1.505814e-04 1.165213e-04 PKM/HSP90AA1/HSPA8/YWHAE  4
+GO:0098631 cell adhesion mediator activity 6/152 60/18352 1.012418e-05 1.889847e-04 1.462382e-04 DSP/ANXA2/JUP/ANXA1/RPSA/S100A11  6
+GO:0003779 actin binding 14/152 437/18352 1.676301e-05 2.964406e-04 2.293885e-04 PLEC/EEF2/MYH9/POF1B/ACTN4/FLNB/ALDOA/VCL/GSN/CAPG/CAPZB/ARPC4/ACTR2/PIP 14
+GO:0001618 virus receptor activity 6/152 74/18352 3.405941e-05 5.449506e-04 4.216880e-04 SERPINB3/HSPA1A/HSPA1B/IDE/RPSA/LAMP1  6
+GO:0140272 exogenous protein binding 6/152 74/18352 3.405941e-05 5.449506e-04 4.216880e-04 SERPINB3/HSPA1A/HSPA1B/IDE/RPSA/LAMP1  6
+GO:0023023 MHC protein complex binding 4/152 25/18352 4.996762e-05 7.631418e-04 5.905264e-04 PKM/HSP90AA1/HSPA8/YWHAE  4
+GO:0051015 actin filament binding 9/152 206/18352 5.582177e-05 8.154832e-04 6.310287e-04 EEF2/MYH9/POF1B/ACTN4/GSN/CAPG/CAPZB/ARPC4/ACTR2  9
+GO:0098632 cell-cell adhesion mediator activity 5/152 51/18352 6.305102e-05 8.827143e-04 6.830528e-04 DSP/ANXA2/JUP/ANXA1/S100A11  5
+GO:0051787 misfolded protein binding 4/152 27/18352 6.843526e-05 9.197699e-04 7.117267e-04 HSPA5/HSPA1A/HSPA1B/HSPA8  4
+GO:0048306 calcium-dependent protein binding 6/152 85/18352 7.462065e-05 9.643284e-04 7.462065e-04 ANXA2/ANXA1/S100A7/DMBT1/S100A14/S100A11  6
+GO:0004175 endopeptidase activity 13/152 440/18352 7.750723e-05 9.645344e-04 7.463659e-04 LTF/CASP14/CTSD/BLMH/CTSV/CAPN1/HP/IDE/PSMA3/KLK1/CTSB/PSMB3/PIP 13
+GO:0016829 lyase activity 8/152 189/18352 1.808982e-04 2.170778e-03 1.679769e-03 ENO1/TPI1/GGCT/ALOX12B/ALDOA/ALDOC/RPS3/HAL  8
+GO:0008144 drug binding 6/152 104/18352 2.275970e-04 2.636986e-03 2.040525e-03 ALB/PPIA/GSTP1/LCN2/PNP/PPIB  6
+GO:0043531 ADP binding 4/152 38/18352 2.681766e-04 3.003578e-03 2.324197e-03 PKM/MYH9/PGK1/ATP5F1A  4
+GO:0098641 cadherin binding involved in cell-cell adhesion 3/152 18/18352 4.148869e-04 4.496839e-03 3.479697e-03 ANXA2/ANXA1/S100A11  3
+GO:0004601 peroxidase activity 4/152 52/18352 8.991179e-04 9.440738e-03 7.305333e-03 CAT/PRDX1/GSTP1/HBB  4
b
diff -r 85f039f53414 -r f6107b8ae8f8 test-data/cluster_profiler_GGO_BP.csv
--- a/test-data/cluster_profiler_GGO_BP.csv Fri Jan 24 05:12:09 2020 -0500
+++ b/test-data/cluster_profiler_GGO_BP.csv Fri Apr 09 14:39:05 2021 +0000
b
b'@@ -1,586 +1,136 @@\n-ID\tDescription\tCount\tGeneRatio\tgeneID\n-GO:0019953\tsexual reproduction\t3\t3/153\tSOD1/CTSV/ALDOA\n-GO:0019954\tasexual reproduction\t0\t0/153\t\n-GO:0022414\treproductive process\t10\t10/153\tDSG1/ANXA1/ARG1/MYH9/SOD1/CTSV/ALDOA/SERPINB5/CTSB/ACTR2\n-GO:0032504\tmulticellular organism reproduction\t6\t6/153\tDSG1/ANXA1/ARG1/SOD1/CTSV/CTSB\n-GO:0032505\treproduction of a single-celled organism\t0\t0/153\t\n-GO:0061887\treproduction of symbiont in host\t0\t0/153\t\n-GO:0055114\toxidation-reduction process\t16\t16/153\tENO1/CAT/PKM/TPI1/PRDX1/GAPDH/LDHA/UBA52/TXN/SOD1/ALOX12B/PGK1/ALDOA/MDH2/ALDOC/APOD\n-GO:0006807\tnitrogen compound metabolic process\t105\t105/153\tDSP/ALB/ANXA2/JUP/LTF/MUC5B/SERPINB3/KRT17/FABP5/CASP14/ENO1/AZGP1/TGM3/ANXA1/HSPA5/TF/CAT/S100A7/SFN/SERPINB12/PKM/TPI1/PRDX1/CSTA/ARG1/GAPDH/HSPA1A/HSPA1B/EEF2/MYH9/SERPINB7/LYZ/SERPINA1/HSP90AA1/ACTN4/GGCT/LDHA/CTSD/UBA52/TXN/DMBT1/CPA4/BLMH/PLBD1/SOD1/HSPB1/HSPA8/EIF4A1/PPIA/YWHAZ/GGH/ALOX12B/GSTP1/LCN1/SERPINB4/C1orf68/CTSV/PGK1/ALDOA/CAPN1/YWHAE/HBB/A2ML1/SERPINA3/SPRR1B/SERPINB1/CST6/GSN/IDE/AGA/PSMA3/EEF1G/SERPINB5/MDH2/LYPD3/PNP/CSTB/ALDOC/FLG/PERP/SERPINB13/APOD/KLK1/CTSB/RPSA/LAMP2/TYMP/PPIB/RPS3/ATP5A1/S100A11/HAL/GSS/PSMB3/PIP/CST4/MUC7/CST1/CST2/KRT1/KRT2/KRT10/SERPINA12/DCD/SPRR2E\n-GO:0009056\tcatabolic process\t41\t41/153\tANXA2/FABP5/ENO1/HSPA5/CAT/SERPINB12/PKM/TPI1/PRDX1/ARG1/GAPDH/HSPA1A/HSPA1B/LYZ/HSP90AA1/LDHA/CTSD/UBA52/BLMH/PLBD1/HSPB1/HSPA8/EIF4A1/YWHAZ/CTSV/PGK1/ALDOA/CAPN1/HBB/HP/IDE/PSMA3/PNP/ALDOC/CTSB/RPSA/LAMP2/TYMP/RPS3/HAL/PSMB3\n-GO:0009058\tbiosynthetic process\t47\t47/153\tJUP/LTF/MUC5B/KRT17/FABP5/ENO1/ANXA1/HSPA5/CAT/PKM/TPI1/ARG1/GAPDH/HSPA1A/HSPA1B/EEF2/SERPINB7/HSP90AA1/ACTN4/GGCT/UBA52/TXN/SOD1/HSPB1/HSPA8/EIF4A1/PPIA/ALOX12B/GSTP1/PGK1/ALDOA/HBB/PSMA3/EEF1G/MDH2/LYPD3/PNP/ALDOC/RPSA/TYMP/RPS3/ATP5A1/S100A11/GSS/PSMB3/MUC7/SERPINA12\n-GO:0009892\tnegative regulation of metabolic process\t42\t42/153\tANXA2/LTF/SERPINB3/ENO1/SFN/SERPINB12/CSTA/GAPDH/HSPA1A/HSPA1B/SERPINB7/SERPINA1/UBA52/TXN/SOD1/HSPB1/HSPA8/EIF4A1/YWHAZ/GSTP1/LCN1/SERPINB4/YWHAE/A2ML1/HP/SERPINA3/SERPINB1/CST6/IDE/PSMA3/SERPINB5/CSTB/SERPINB13/APOD/RPSA/RPS3/S100A11/PSMB3/CST4/CST1/CST2/SERPINA12\n-GO:0009893\tpositive regulation of metabolic process\t31\t31/153\tANXA2/LTF/SERPINB3/KRT17/ENO1/LMNA/ANXA1/HSPA5/S100A7/HSPA1A/HSPA1B/EEF2/MYH9/SERPINB7/HSP90AA1/UBA52/TXN/SOD1/HSPB1/HSPA8/ALOX12B/GSTP1/HBB/LCN2/GSN/IDE/PSMA3/PERP/RPS3/PSMB3/PIP\n-GO:0018933\tnicotine metabolic process\t0\t0/153\t\n-GO:0019222\tregulation of metabolic process\t62\t62/153\tANXA2/JUP/LTF/SERPINB3/KRT17/ENO1/LMNA/ANXA1/HSPA5/CAT/S100A7/SFN/SERPINB12/PRDX1/CSTA/GAPDH/HSPA1A/HSPA1B/EEF2/MYH9/SERPINB7/SERPINA1/HSP90AA1/ACTN4/UBA52/TXN/SOD1/HSPB1/HSPA8/EIF4A1/YWHAZ/ALOX12B/GSTP1/LCN1/SERPINB4/CAPN1/YWHAE/HBB/A2ML1/HP/SERPINA3/SERPINB1/LCN2/CST6/GSN/IDE/PSMA3/SERPINB5/CSTB/PERP/SERPINB13/APOD/RPSA/RPS3/S100A11/PSMB3/NPC2/PIP/CST4/CST1/CST2/SERPINA12\n-GO:0019694\talkanesulfonate metabolic process\t0\t0/153\t\n-GO:0019748\tsecondary metabolic process\t0\t0/153\t\n-GO:0032259\tmethylation\t2\t2/153\tEEF2/HSPA8\n-GO:0042440\tpigment metabolic process\t0\t0/153\t\n-GO:0042445\thormone metabolic process\t1\t1/153\tIDE\n-GO:0044033\tmulti-organism metabolic process\t1\t1/153\tANXA2\n-GO:0044236\tmulticellular organism metabolic process\t4\t4/153\tARG1/SERPINB7/CTSD/CTSB\n-GO:0044237\tcellular metabolic process\t103\t103/153\tDSP/ALB/ANXA2/JUP/LTF/MUC5B/SERPINB3/KRT17/FABP5/ENO1/AZGP1/TGM3/ANXA1/HSPA5/TF/CAT/S100A7/SFN/SERPINB12/PKM/TPI1/PRDX1/CSTA/ARG1/GAPDH/HSPA1A/HSPA1B/EEF2/MYH9/SERPINB7/LYZ/SERPINA1/HSP90AA1/ACTN4/GGCT/LDHA/CTSD/UBA52/TXN/DMBT1/CPA4/BLMH/PLBD1/SOD1/HSPB1/HSPA8/EIF4A1/PPIA/YWHAZ/GGH/ALOX12B/GSTP1/LCN1/SERPINB4/C1orf68/CTSV/PGK1/ALDOA/CAPN1/YWHAE/HBB/A2ML1/HP/SERPINA3/SPRR1B/SERPINB1/CST6/GSN/IDE/AGA/PSMA3/EEF1G/SERPINB5/MDH2/LYPD3/PNP/CSTB/ALDOC/FLG/PERP/SERPINB13/APOD/CTSB/RPSA/LAMP2/TYMP/PPIB/RPS3/ATP5A1/S100A11/HAL/GSS/PSMB3/NPC2/CST4/MUC7/CST1/CST2/KRT1/KRT2/KRT10/SERPINA12/SPRR2E\n-GO:0044238\tprimary metabolic process\t108\t108/153\tDSP/ALB/ANXA2/JUP/LTF/MUC5B/'..b"6686\tresponse to cadmium ion\t5/150\t64/18866\t1.553312e-04\t3.641491e-03\t2.825887e-03\tCAT/ARG1/SOD1/GSN/GSS\t 5\n+GO:0051709\tregulation of killing of cells of other organism\t3/150\t14/18866\t1.681573e-04\t3.905336e-03\t3.030636e-03\tKRT6A/ARG1/GAPDH\t 3\n+GO:0016052\tcarbohydrate catabolic process\t8/150\t200/18866\t2.018295e-04\t4.643948e-03\t3.603818e-03\tENO1/PKM/TPI1/GAPDH/LDHA/PGK1/ALDOA/ALDOC\t 8\n+GO:0051084\t'de novo' posttranslational protein folding\t4/150\t37/18866\t2.067314e-04\t4.713096e-03\t3.657478e-03\tHSPA5/HSPA1A/HSPA1B/HSPA8\t 4\n+GO:0001909\tleukocyte mediated cytotoxicity\t6/150\t108/18866\t2.245249e-04\t5.072222e-03\t3.936169e-03\tAZGP1/PRDX1/ARG1/TUBB4B/SERPINB4/LAMP1\t 6\n+GO:0051014\tactin filament severing\t3/150\t16/18866\t2.557004e-04\t5.623147e-03\t4.363700e-03\tMYH9/GSN/CAPG\t 3\n+GO:0061684\tchaperone-mediated autophagy\t3/150\t16/18866\t2.557004e-04\t5.623147e-03\t4.363700e-03\tHSP90AA1/HSPA8/LAMP2\t 3\n+GO:0090136\tepithelial cell-cell adhesion\t3/150\t16/18866\t2.557004e-04\t5.623147e-03\t4.363700e-03\tDSP/JUP/VCL\t 3\n+GO:0044282\tsmall molecule catabolic process\t12/150\t452/18866\t2.701810e-04\t5.889471e-03\t4.570375e-03\tENO1/PKM/TPI1/ARG1/GAPDH/BLMH/PGK1/ALDOA/PNP/ALDOC/TYMP/HAL\t12\n+GO:0045216\tcell-cell junction organization\t8/150\t210/18866\t2.809166e-04\t6.070241e-03\t4.710656e-03\tDSP/DSG1/JUP/ACTG1/POF1B/ACTN4/VCL/PERP\t 8\n+GO:0035821\tmodulation of process of other organism\t6/150\t113/18866\t2.869769e-04\t6.147737e-03\t4.770795e-03\tANXA2/LTF/GAPDH/HSPA8/PPIB/DEFA3\t 6\n+GO:0016051\tcarbohydrate biosynthetic process\t8/150\t213/18866\t3.090522e-04\t6.513044e-03\t5.054282e-03\tENO1/TPI1/GAPDH/PGK1/ALDOA/MDH2/ALDOC/SERPINA12\t 8\n+GO:0006458\t'de novo' protein folding\t4/150\t41/18866\t3.092713e-04\t6.513044e-03\t5.054282e-03\tHSPA5/HSPA1A/HSPA1B/HSPA8\t 4\n+GO:0045684\tpositive regulation of epidermis development\t4/150\t44/18866\t4.069843e-04\t8.498789e-03\t6.595269e-03\tKRT17/SFN/KRT2/KRT10\t 4\n+GO:0042246\ttissue regeneration\t5/150\t79/18866\t4.173442e-04\t8.571077e-03\t6.651366e-03\tANXA1/PKM/EPPK1/GSN/APOD\t 5\n+GO:1900034\tregulation of cellular response to heat\t5/150\t79/18866\t4.173442e-04\t8.571077e-03\t6.651366e-03\tHSPA1A/HSPA1B/HSP90AA1/HSPA8/YWHAE\t 5\n+GO:0034614\tcellular response to reactive oxygen species\t7/150\t170/18866\t4.259528e-04\t8.635019e-03\t6.700987e-03\tANXA1/PRDX1/ARG1/TXN/SOD1/LCN2/RPS3\t 7\n+GO:0007596\tblood coagulation\t10/150\t343/18866\t4.274074e-04\t8.635019e-03\t6.700987e-03\tANXA2/ACTG1/MYH9/SERPINA1/HSPB1/YWHAZ/VCL/HBB/CAPZB/KRT1\t10\n+GO:0051546\tkeratinocyte migration\t3/150\t19/18866\t4.347782e-04\t8.686713e-03\t6.741103e-03\tKRT16/EPPK1/KRT2\t 3\n+GO:0007584\tresponse to nutrient\t7/150\t171/18866\t4.412214e-04\t8.686713e-03\t6.741103e-03\tCAT/PKM/ARG1/EEF2/LDHA/GSTP1/GSN\t 7\n+GO:0051204\tprotein insertion into mitochondrial membrane\t4/150\t45/18866\t4.439487e-04\t8.686713e-03\t6.741103e-03\tSFN/HSP90AA1/YWHAZ/YWHAE\t 4\n+GO:1901028\tregulation of mitochondrial outer membrane permeab\t4/150\t45/18866\t4.439487e-04\t8.686713e-03\t6.741103e-03\tSFN/HSPA1A/YWHAZ/YWHAE\t 4\n+GO:0050829\tdefense response to Gram-negative bacterium\t5/150\t81/18866\t4.684619e-04\t9.094749e-03\t7.057749e-03\tLTF/S100A7/LYZ/DMBT1/DEFA3\t 5\n+GO:0007599\themostasis\t10/150\t348/18866\t4.785446e-04\t9.218475e-03\t7.153763e-03\tANXA2/ACTG1/MYH9/SERPINA1/HSPB1/YWHAZ/VCL/HBB/CAPZB/KRT1\t10\n+GO:0050817\tcoagulation\t10/150\t349/18866\t4.893589e-04\t9.349316e-03\t7.255299e-03\tANXA2/ACTG1/MYH9/SERPINA1/HSPB1/YWHAZ/VCL/HBB/CAPZB/KRT1\t10\n+GO:0008637\tapoptotic mitochondrial changes\t6/150\t125/18866\t4.928613e-04\t9.349316e-03\t7.255299e-03\tLMNA/SFN/HSPA1A/GGCT/YWHAZ/YWHAE\t 6\n+GO:0006457\tprotein folding\t8/150\t230/18866\t5.153163e-04\t9.701220e-03\t7.528385e-03\tHSPA5/HSPA1A/HSPA1B/HSP90AA1/HSPB1/HSPA8/PPIA/PPIB\t 8\n+GO:0006953\tacute-phase response\t4/150\t47/18866\t5.249594e-04\t9.735254e-03\t7.554796e-03\tSERPINA1/HP/SERPINA3/ORM1\t 4\n+GO:0046677\tresponse to antibiotic\t4/150\t47/18866\t5.249594e-04\t9.735254e-03\t7.554796e-03\tHSPA5/HSP90AA1/SOD1/ACTR2\t 4\n+GO:0043903\tregulation of symbiotic process\t8/150\t231/18866\t5.302696e-04\t9.760888e-03\t7.574689e-03\tKRT6A/LTF/ARG1/GAPDH/HSPA8/PPIA/GSN/PPIB\t 8\n"
b
diff -r 85f039f53414 -r f6107b8ae8f8 test-data/cluster_profiler_GGO_CC.csv
--- a/test-data/cluster_profiler_GGO_CC.csv Fri Jan 24 05:12:09 2020 -0500
+++ b/test-data/cluster_profiler_GGO_CC.csv Fri Apr 09 14:39:05 2021 +0000
b
b'@@ -1,381 +1,980 @@\n ID\tDescription\tCount\tGeneRatio\tgeneID\n-GO:0005886\tplasma membrane\t56\t56/153\tDSP/DSG1/ANXA2/JUP/MUC5B/ACTG1/FABP5/PIGR/ENO1/AZGP1/PLEC/TGM3/HRNR/ANXA1/HSPA5/TF/CAT/SERPINB12/CSTA/GAPDH/EEF2/MYH9/HSP90AA1/UBA52/FLNB/SOD1/HSPB1/HSPA8/EPPK1/GSTP1/DSC3/C1orf68/CTSV/CAPN1/VCL/YWHAE/IL1RN/SPRR1B/CST6/GSN/IDE/LYPD3/FLG/PERP/RPSA/LAMP1/LAMP2/RPS3/ATP5A1/PIP/MUC7/KRT1/KRT2/KRT10/SERPINA12/SPRR2E\n-GO:0005628\tprospore membrane\t0\t0/153\t\n-GO:0005789\tendoplasmic reticulum membrane\t2\t2/153\tHSPA5/UBA52\n-GO:0019867\touter membrane\t2\t2/153\tARG1/UBA52\n-GO:0031090\torganelle membrane\t24\t24/153\tDSP/DSG1/ANXA2/FABP5/PIGR/LMNA/ANXA1/TF/CAT/SFN/SERPINB12/ARG1/GAPDH/SERPINA1/UBA52/DMBT1/HSPA8/YWHAZ/YWHAE/MDH2/LAMP1/LAMP2/RPS3/ATP5A1\n-GO:0034357\tphotosynthetic membrane\t0\t0/153\t\n-GO:0036362\tascus membrane\t0\t0/153\t\n-GO:0042175\tnuclear outer membrane-endoplasmic reticulum membrane network\t2\t2/153\tHSPA5/UBA52\n-GO:0044425\tmembrane part\t29\t29/153\tDSP/DSG1/ANXA2/JUP/PIGR/TGM3/ANXA1/HSPA5/TF/EEF2/MYH9/TUBA1B/HSP90AA1/CTSD/UBA52/DMBT1/FLNB/HSPA8/EPPK1/DSC3/CTSV/PGK1/LYPD3/PERP/LAMP1/LAMP2/RPS3/ATP5A1/PIP\n-GO:0048475\tcoated membrane\t0\t0/153\t\n-GO:0055036\tvirion membrane\t0\t0/153\t\n-GO:0098589\tmembrane region\t7\t7/153\tANXA2/TF/EEF2/TUBA1B/CTSD/PGK1/LAMP2\n-GO:0098590\tplasma membrane region\t10\t10/153\tDSP/DSG1/ANXA2/JUP/ANXA1/TF/HSP90AA1/EPPK1/RPS3/PIP\n-GO:0098805\twhole membrane\t19\t19/153\tDSP/DSG1/ANXA2/FABP5/PIGR/ANXA1/TF/CAT/SERPINB12/ARG1/EEF2/TUBA1B/CTSD/UBA52/DMBT1/HSPA8/PGK1/LAMP1/LAMP2\n-GO:1990578\tperinuclear endoplasmic reticulum membrane\t0\t0/153\t\n-GO:0043083\tsynaptic cleft\t0\t0/153\t\n-GO:0044421\textracellular region part\t141\t141/153\tDSP/KRT6A/ALB/KRT16/DSG1/ANXA2/JUP/LTF/MUC5B/SERPINB3/ACTG1/KRT78/KRT17/FABP5/CASP14/PIGR/ENO1/AZGP1/PLEC/TGM3/KRT13/HRNR/KRT6B/LMNA/ANXA1/HSPA5/TF/CAT/S100A7/SFN/SERPINB12/PKM/TPI1/PRDX1/CSTA/ARG1/GAPDH/HSPA1A/HSPA1B/EEF2/MYH9/TUBB4B/SERPINB7/LYZ/TUBA1B/SERPINA1/HSP90AA1/IL36G/ACTN4/GGCT/LDHA/CTSD/UBA52/TXN/DMBT1/CPA4/LGALS7B/BLMH/PLBD1/FLNB/SOD1/HSPB1/HSPA8/EIF4A1/PPIA/YWHAZ/GGH/GSTP1/LCN1/SERPINB4/C1orf68/SBSN/CTSV/PGK1/ALDOA/CAPN1/VCL/YWHAE/HBB/A2ML1/HP/SERPINA3/ORM1/IL1RN/SPRR1B/SERPINB1/LCN2/CST6/S100A14/GSN/IDE/AGA/PSMA3/EEF1G/SERPINB5/MDH2/FCGBP/LYPD3/PNP/CSTB/ALDOC/KRT15/SERPINB13/APOD/KLK1/CTSB/RPSA/LAMP1/LAMP2/PPIB/RPS3/ATP5A1/CALML3/S100A11/CAPG/CAPZB/GSS/PSMB3/GDI2/ARPC4/ACTR2/NPC2/AMY1A/AMY1B/AMY1C/CALML5/PIP/ZG16B/CST4/MUC7/CST1/CST2/KRT1/KRT2/KRT10/FLG2/KPRP/SERPINA12/DCD/DEFA3/KRT85\n-GO:0048046\tapoplast\t0\t0/153\t\n-GO:0098595\tperivitelline space\t0\t0/153\t\n-GO:0099544\tperisynaptic space\t0\t0/153\t\n-GO:0044464\tcell part\t137\t137/153\tDSP/KRT6A/ALB/KRT16/DSG1/ANXA2/JUP/LTF/MUC5B/SERPINB3/ACTG1/KRT78/KRT17/FABP5/CASP14/PIGR/ENO1/AZGP1/PLEC/KRT80/TGM3/KRT13/HRNR/KRT6B/LMNA/ANXA1/HSPA5/TF/CAT/S100A7/SFN/SERPINB12/PKM/TPI1/PRDX1/CSTA/ARG1/GAPDH/HSPA1A/HSPA1B/EEF2/MYH9/TUBB4B/POF1B/SERPINB7/LYZ/TUBA1B/SERPINA1/HSP90AA1/ACTN4/GGCT/LDHA/CTSD/UBA52/TXN/DMBT1/LGALS7B/BLMH/PLBD1/FLNB/SOD1/HSPB1/HSPA8/EPPK1/EIF4A1/PPIA/YWHAZ/GGH/ALOX12B/GSTP1/SERPINB4/DSC3/C1orf68/CTSV/PGK1/ALDOA/CAPN1/VCL/YWHAE/HBB/KRT23/HP/SERPINA3/ORM1/IL1RN/SPRR1B/SERPINB1/LCN2/CST6/S100A14/GSN/IDE/AGA/PSMA3/EEF1G/SERPINB5/MDH2/LYPD3/PNP/CSTB/ALDOC/KRT15/FLG/PERP/SERPINB13/APOD/KLK1/CTSB/RPSA/LAMP1/LAMP2/TYMP/PPIB/RPS3/ATP5A1/S100A11/CAPG/HAL/CAPZB/GSS/PSMB3/GDI2/ARPC4/ACTR2/NPC2/CALML5/PIP/MUC7/KRT1/KRT2/KRT10/FLG2/KPRP/SERPINA12/SPRR2E/DEFA3/KRT85\n-GO:0039642\tvirion nucleoid\t0\t0/153\t\n-GO:0042645\tmitochondrial nucleoid\t0\t0/153\t\n-GO:0042646\tplastid nucleoid\t0\t0/153\t\n-GO:0043590\tbacterial nucleoid\t0\t0/153\t\n-GO:0044777\tsingle-stranded DNA-binding protein complex\t0\t0/153\t\n-GO:0044423\tvirion part\t0\t0/153\t\n-GO:0005911\tcell-cell junction\t13\t13/153\tDSP/DSG1/ANXA2/JUP/ANXA1/MYH9/POF1B/ACTN4/EPPK1/DSC3/VCL/PERP/S100A11\n-GO:0030055\tcell-substrate junction\t25\t25/153\tJUP/ACTG1/PLEC/ANXA1/HSPA5/CAT/S100A7/HSPA1A/HSPA1B/MYH9/ACTN4/FLNB/HSPB1/HSPA8/EPPK1/PPIA/YWHAZ/CAPN1/VCL/YWHAE/GSN/PPIB/RPS3/GDI2/ACTR2\n-GO:0061466\tplasma membrane part of cell junction\t0\t0/153\t\n'..b'3\tdinoflagellate apex\t  0\t0/153\tNA\n+GO:0097684\tdinoflagellate antapex\t  0\t0/153\tNA\n+GO:0097735\tDIM/DIP cell wall layer\t  0\t0/153\tNA\n+GO:0098552\tside of membrane\t 11\t11/153\tDSG1/JUP/AZGP1/TGM3/ANXA1/TF/HSPA8/CTSV/IDE/CTSB/LAMP1\n+GO:0098687\tchromosomal region\t  0\t0/153\tNA\n+GO:0098793\tpresynapse\t  3\t3/153\tACTG1/HSPA8/LAMP1\n+GO:0098794\tpostsynapse\t  4\t4/153\tFABP5/HSPA8/RPS3/ACTR2\n+GO:0098833\tpresynaptic endocytic zone\t  0\t0/153\tNA\n+GO:0098843\tpostsynaptic endocytic zone\t  0\t0/153\tNA\n+GO:0098862\tcluster of actin-based cell projections\t  4\t4/153\tPLEC/MYH9/ACTN4/FLNB\n+GO:0099079\tactin body\t  0\t0/153\tNA\n+GO:0099080\tsupramolecular complex\t 34\t34/153\tDSP/KRT6A/KRT16/JUP/ACTG1/KRT78/KRT17/CASP14/ENO1/PLEC/KRT80/KRT13/KRT6B/LMNA/ANXA1/MYH9/TUBB4B/POF1B/TUBA1B/ACTN4/FLNB/HSPB1/EPPK1/ALDOA/VCL/KRT23/SERPINB1/KRT15/FLG/CAPZB/KRT1/KRT2/KRT10/KRT85\n+GO:0099086\tsynaptonemal structure\t  0\t0/153\tNA\n+GO:0106124\treservosome lumen\t  0\t0/153\tNA\n+GO:0106125\treservosome matrix\t  0\t0/153\tNA\n+GO:0106126\treservosome membrane\t  0\t0/153\tNA\n+GO:0110071\tcellularization cleavage furrow invagination front\t  0\t0/153\tNA\n+GO:0110092\tnucleus leading edge\t  0\t0/153\tNA\n+GO:0110093\tnucleus lagging edge\t  0\t0/153\tNA\n+GO:0120043\tstereocilium shaft\t  0\t0/153\tNA\n+GO:0120044\tstereocilium base\t  0\t0/153\tNA\n+GO:0120082\tsmooth endoplasmic reticulum cisterna\t  0\t0/153\tNA\n+GO:0120083\trough endoplasmic reticulum cisterna\t  0\t0/153\tNA\n+GO:0120098\tprocentriole\t  0\t0/153\tNA\n+GO:0120100\tbacterial-type flagellum motor\t  0\t0/153\tNA\n+GO:0120102\tbacterial-type flagellum secretion apparatus\t  0\t0/153\tNA\n+GO:0120104\tmitotic actomyosin contractile ring, proximal laye\t  0\t0/153\tNA\n+GO:0120105\tmitotic actomyosin contractile ring, intermediate \t  0\t0/153\tNA\n+GO:0120106\tmitotic actomyosin contractile ring, distal actin \t  0\t0/153\tNA\n+GO:0120107\tbacterial-type flagellum rotor complex\t  0\t0/153\tNA\n+GO:0120120\tbilobe structure\t  0\t0/153\tNA\n+GO:0120121\ttripartite attachment complex\t  0\t0/153\tNA\n+GO:0120134\tproximal portion of axoneme\t  0\t0/153\tNA\n+GO:0120135\tdistal portion of axoneme\t  0\t0/153\tNA\n+GO:0120205\tphotoreceptor proximal connecting cilium\t  0\t0/153\tNA\n+GO:0120206\tphotoreceptor distal connecting cilium\t  0\t0/153\tNA\n+GO:0120212\tsperm head-tail coupling apparatus\t  0\t0/153\tNA\n+GO:0120219\tsubapical part of cell\t  0\t0/153\tNA\n+GO:0120220\tbasal body patch\t  0\t0/153\tNA\n+GO:0140022\tcnida\t  0\t0/153\tNA\n+GO:0140510\tmitotic nuclear bridge\t  0\t0/153\tNA\n+GO:0140511\tmitotic nuclear bridge stalk\t  0\t0/153\tNA\n+GO:0140512\tmitotic nuclear bridge midzone\t  0\t0/153\tNA\n+GO:0150004\tdendritic spine origin\t  0\t0/153\tNA\n+GO:0150034\tdistal axon\t  4\t4/153\tACTG1/HSP90AA1/HSPA8/YWHAE\n+GO:1990013\tpresynaptic grid\t  0\t0/153\tNA\n+GO:1990014\torthogonal array\t  0\t0/153\tNA\n+GO:1990015\tensheathing process\t  0\t0/153\tNA\n+GO:1990016\tneck portion of tanycyte\t  0\t0/153\tNA\n+GO:1990018\ttail portion of tanycyte\t  0\t0/153\tNA\n+GO:1990030\tpericellular basket\t  0\t0/153\tNA\n+GO:1990031\tpinceau fiber\t  0\t0/153\tNA\n+GO:1990037\tLewy body core\t  0\t0/153\tNA\n+GO:1990038\tLewy body corona\t  0\t0/153\tNA\n+GO:1990047\tspindle matrix\t  0\t0/153\tNA\n+GO:1990073\tperforation plate\t  0\t0/153\tNA\n+GO:1990225\trhoptry neck\t  0\t0/153\tNA\n+GO:1990295\tpost-anaphase microtubule array\t  0\t0/153\tNA\n+GO:1990427\tstereocilia tip-link density\t  0\t0/153\tNA\n+GO:1990716\taxonemal central apparatus\t  0\t0/153\tNA\n+GO:1990717\taxonemal central bridge\t  0\t0/153\tNA\n+GO:1990718\taxonemal central pair projection\t  0\t0/153\tNA\n+GO:1990752\tmicrotubule end\t  0\t0/153\tNA\n+GO:1990783\tperiphagosomal region of cytoplasm\t  0\t0/153\tNA\n+GO:1990794\tbasolateral part of cell\t  0\t0/153\tNA\n+GO:1990805\tcentral cylinder\t  0\t0/153\tNA\n+GO:1990819\tactin fusion focus\t  0\t0/153\tNA\n+GO:1990826\tnucleoplasmic periphery of the nuclear pore comple\t  0\t0/153\tNA\n+GO:1990836\tlysosomal matrix\t  1\t1/153\tLAMP2\n+GO:1990875\tnucleoplasmic side of nuclear pore\t  0\t0/153\tNA\n+GO:1990876\tcytoplasmic side of nuclear pore\t  0\t0/153\tNA\n+GO:1990900\tciliary pocket collar\t  0\t0/153\tNA\n+GO:1990916\tIsp3 layer of spore wall\t  0\t0/153\tNA\n'
b
diff -r 85f039f53414 -r f6107b8ae8f8 test-data/cluster_profiler_GGO_MF.csv
--- a/test-data/cluster_profiler_GGO_MF.csv Fri Jan 24 05:12:09 2020 -0500
+++ b/test-data/cluster_profiler_GGO_MF.csv Fri Apr 09 14:39:05 2021 +0000
b
b'@@ -1,155 +1,151 @@\n ID\tDescription\tCount\tGeneRatio\tgeneID\n-GO:0004133\tglycogen debranching enzyme activity\t0\t0/153\t\n-GO:0016491\toxidoreductase activity\t11\t11/153\tCAT/PRDX1/GAPDH/LDHA/TXN/SOD1/ALOX12B/GSTP1/PGK1/HBB/MDH2\n-GO:0008987\tquinolinate synthetase A activity\t0\t0/153\t\n-GO:0009975\tcyclase activity\t0\t0/153\t\n-GO:0010280\tUDP-L-rhamnose synthase activity\t0\t0/153\t\n-GO:0016740\ttransferase activity\t10\t10/153\tTGM3/PKM/GAPDH/HSP90AA1/GGCT/GSTP1/PGK1/EEF1G/PNP/TYMP\n-GO:0016787\thydrolase activity\t37\t37/153\tLTF/CASP14/AZGP1/ANXA1/HSPA5/CAT/ARG1/HSPA1A/HSPA1B/EEF2/MYH9/TUBB4B/LYZ/TUBA1B/HSP90AA1/CTSD/CPA4/BLMH/PLBD1/HSPA8/EIF4A1/GGH/CTSV/CAPN1/IDE/AGA/PSMA3/KLK1/CTSB/RPS3/ATP5A1/PSMB3/AMY1A/AMY1B/AMY1C/PIP/DCD\n-GO:0016829\tlyase activity\t5\t5/153\tENO1/ALDOA/ALDOC/RPS3/HAL\n-GO:0016853\tisomerase activity\t3\t3/153\tTPI1/PPIA/PPIB\n-GO:0016874\tligase activity\t1\t1/153\tGSS\n-GO:0032451\tdemethylase activity\t0\t0/153\t\n-GO:0046572\tversicolorin B synthase activity\t0\t0/153\t\n-GO:0046905\tphytoene synthase activity\t0\t0/153\t\n-GO:0061783\tpeptidoglycan muralytic activity\t1\t1/153\tLYZ\n-GO:0070283\tradical SAM enzyme activity\t0\t0/153\t\n-GO:0140096\tcatalytic activity, acting on a protein\t22\t22/153\tLTF/CASP14/TGM3/GAPDH/HSP90AA1/GGCT/CTSD/CPA4/BLMH/PPIA/GGH/CTSV/CAPN1/IDE/AGA/PSMA3/KLK1/CTSB/PPIB/PSMB3/PIP/DCD\n-GO:0140097\tcatalytic activity, acting on DNA\t2\t2/153\tANXA1/RPS3\n-GO:0140098\tcatalytic activity, acting on RNA\t2\t2/153\tAZGP1/EIF4A1\n-GO:1990055\tphenylacetaldehyde synthase activity\t0\t0/153\t\n-GO:0000156\tphosphorelay response regulator activity\t0\t0/153\t\n-GO:0004879\tnuclear receptor activity\t0\t0/153\t\n-GO:0004708\tMAP kinase kinase activity\t0\t0/153\t\n-GO:0005057\tsignal transducer activity, downstream of receptor\t0\t0/153\t\n-GO:0005068\ttransmembrane receptor protein tyrosine kinase adaptor activity\t0\t0/153\t\n-GO:0030297\ttransmembrane receptor protein tyrosine kinase activator activity\t0\t0/153\t\n-GO:0008086\tlight-activated voltage-gated calcium channel activity\t0\t0/153\t\n-GO:0008384\tIkappaB kinase activity\t0\t0/153\t\n-GO:0009927\thistidine phosphotransfer kinase activity\t0\t0/153\t\n-GO:0038023\tsignaling receptor activity\t3\t3/153\tKRT17/PIGR/DMBT1\n-GO:0038078\tMAP kinase phosphatase activity involved in regulation of innate immune response\t0\t0/153\t\n-GO:0097199\tcysteine-type endopeptidase activity involved in apoptotic signaling pathway\t0\t0/153\t\n-GO:0099107\tion channel regulator activity involved in G-protein coupled receptor signaling pathway\t0\t0/153\t\n-GO:1990890\tnetrin receptor binding\t0\t0/153\t\n-GO:0003735\tstructural constituent of ribosome\t3\t3/153\tUBA52/RPSA/RPS3\n-GO:0005199\tstructural constituent of cell wall\t1\t1/153\tJUP\n-GO:0005200\tstructural constituent of cytoskeleton\t11\t11/153\tDSP/KRT16/ACTG1/KRT17/KRT6B/TUBB4B/TUBA1B/KRT15/ARPC4/ACTR2/KRT2\n-GO:0005201\textracellular matrix structural constituent\t0\t0/153\t\n-GO:0005212\tstructural constituent of eye lens\t0\t0/153\t\n-GO:0005213\tstructural constituent of chorion\t0\t0/153\t\n-GO:0008147\tstructural constituent of bone\t0\t0/153\t\n-GO:0008307\tstructural constituent of muscle\t1\t1/153\tPLEC\n-GO:0016490\tstructural constituent of peritrophic membrane\t0\t0/153\t\n-GO:0017056\tstructural constituent of nuclear pore\t0\t0/153\t\n-GO:0019911\tstructural constituent of myelin sheath\t0\t0/153\t\n-GO:0030280\tstructural constituent of epidermis\t5\t5/153\tFLG/KRT1/KRT2/KRT10/SPRR2E\n-GO:0030527\tstructural constituent of chromatin\t0\t0/153\t\n-GO:0032947\tprotein complex scaffold activity\t0\t0/153\t\n-GO:0035804\tstructural constituent of egg coat\t0\t0/153\t\n-GO:0039660\tstructural constituent of virion\t0\t0/153\t\n-GO:0042302\tstructural constituent of cuticle\t0\t0/153\t\n-GO:0043886\tstructural constituent of carboxysome\t0\t0/153\t\n-GO:0097099\tstructural constituent of albumen\t0\t0/153\t\n-GO:0097493\tstructural molecule activity conferring elasticity\t0\t0/153\t\n-GO:0098918\tstructural constituent of synapse\t0\t0/153\t\n-GO:0005344\toxygen carrier activity\t1\t1/153\tHBB\n-GO:0022857\ttransmembrane transporter activity\t3\t3/153\tAZGP1/TF/ATP5A1\n-GO:0005326\tneurotransmitter transporter activity\t0\t0/153\t\n'..b'ty acid derivative binding\t  0\t0/153\tNA\n+GO:1901681\tsulfur compound binding\t  3\t3/153\tLTF/GSTP1/GSS\n+GO:1902670\tcarbon dioxide binding\t  0\t0/153\tNA\n+GO:1904483\tsynthetic cannabinoid binding\t  0\t0/153\tNA\n+GO:1904493\ttetrahydrofolyl-poly(glutamate) polymer binding\t  0\t0/153\tNA\n+GO:1904517\tMgATP(2-) binding\t  0\t0/153\tNA\n+GO:1990300\tcellulosome binding\t  0\t0/153\tNA\n+GO:0004362\tglutathione-disulfide reductase activity\t  0\t0/153\tNA\n+GO:0004601\tperoxidase activity\t  4\t4/153\tCAT/PRDX1/GSTP1/HBB\n+GO:0004784\tsuperoxide dismutase activity\t  1\t1/153\tSOD1\n+GO:0004791\tthioredoxin-disulfide reductase activity\t  1\t1/153\tTXN\n+GO:0032542\tsulfiredoxin activity\t  0\t0/153\tNA\n+GO:0045174\tglutathione dehydrogenase (ascorbate) activity\t  0\t0/153\tNA\n+GO:0050605\tsuperoxide reductase activity\t  0\t0/153\tNA\n+GO:0051920\tperoxiredoxin activity\t  1\t1/153\tPRDX1\n+GO:0004873\tasialoglycoprotein receptor activity\t  0\t0/153\tNA\n+GO:0004998\ttransferrin receptor activity\t  0\t0/153\tNA\n+GO:0005044\tscavenger receptor activity\t  1\t1/153\tDMBT1\n+GO:0008196\tvitellogenin receptor activity\t  0\t0/153\tNA\n+GO:0016964\talpha-2 macroglobulin receptor activity\t  0\t0/153\tNA\n+GO:0030226\tapolipoprotein receptor activity\t  0\t0/153\tNA\n+GO:0030228\tlipoprotein particle receptor activity\t  0\t0/153\tNA\n+GO:0033568\tlactoferrin receptor activity\t  0\t0/153\tNA\n+GO:0061714\tfolic acid receptor activity\t  0\t0/153\tNA\n+GO:0070287\tferritin receptor activity\t  0\t0/153\tNA\n+GO:0140488\theme receptor activity\t  0\t0/153\tNA\n+GO:0004694\teukaryotic translation initiation factor 2alpha ki\t  0\t0/153\tNA\n+GO:0030371\ttranslation repressor activity\t  0\t0/153\tNA\n+GO:0045183\ttranslation factor activity, non-nucleic acid bind\t  0\t0/153\tNA\n+GO:0090079\ttranslation regulator activity, nucleic acid bindi\t  3\t3/153\tEEF2/EIF4A1/EEF1G\n+GO:0000156\tphosphorelay response regulator activity\t  0\t0/153\tNA\n+GO:0009927\thistidine phosphotransfer kinase activity\t  0\t0/153\tNA\n+GO:0031992\tenergy transducer activity\t  0\t0/153\tNA\n+GO:0038023\tsignaling receptor activity\t  3\t3/153\tPIGR/DMBT1/KRT1\n+GO:0030533\ttriplet codon-amino acid adaptor activity\t  0\t0/153\tNA\n+GO:0030674\tprotein-macromolecule adaptor activity\t  4\t4/153\tJUP/MYH9/HSPA8/ARPC4\n+GO:0005085\tguanyl-nucleotide exchange factor activity\t  0\t0/153\tNA\n+GO:0016247\tchannel regulator activity\t  1\t1/153\tYWHAE\n+GO:0030234\tenzyme regulator activity\t 29\t29/153\tANXA2/LTF/SERPINB3/ANXA1/SFN/SERPINB12/CSTA/GAPDH/SERPINB7/SERPINA1/HSP90AA1/HSPB1/GSTP1/LCN1/SERPINB4/A2ML1/SERPINA3/SERPINB1/CST6/SERPINB5/CSTB/SERPINB13/CALML3/GDI2/CALML5/CST4/CST1/CST2/SERPINA12\n+GO:0030545\treceptor regulator activity\t  3\t3/153\tIL36G/IL1RN/TYMP\n+GO:0097690\tiron ion transmembrane transporter inhibitor activ\t  0\t0/153\tNA\n+GO:0140110\ttranscription regulator activity\t  4\t4/153\tJUP/ENO1/HSPA1A/ACTN4\n+GO:0140416\tDNA-binding transcription factor inhibitor activit\t  0\t0/153\tNA\n+GO:0016530\tmetallochaperone activity\t  1\t1/153\tTF\n+GO:0032977\tmembrane insertase activity\t  0\t0/153\tNA\n+GO:0097163\tsulfur carrier activity\t  0\t0/153\tNA\n+GO:0140132\tiron-sulfur cluster carrier activity\t  0\t0/153\tNA\n+GO:0140414\tphosphopantetheine-dependent carrier activity\t  0\t0/153\tNA\n+GO:0000155\tphosphorelay sensor kinase activity\t  0\t0/153\tNA\n+GO:0005034\tosmosensor activity\t  0\t0/153\tNA\n+GO:0019826\toxygen sensor activity\t  0\t0/153\tNA\n+GO:0035991\tnitric oxide sensor activity\t  0\t0/153\tNA\n+GO:0061891\tcalcium ion sensor activity\t  0\t0/153\tNA\n+GO:0070027\tcarbon monoxide sensor activity\t  0\t0/153\tNA\n+GO:0097063\tcadmium ion sensor activity\t  0\t0/153\tNA\n+GO:0097077\tcopper ion sensor activity\t  0\t0/153\tNA\n+GO:0106219\tzinc ion sensor activity\t  0\t0/153\tNA\n+GO:0106254\tlipid sensor activity\t  0\t0/153\tNA\n+GO:0140442\tperoxide sensor activity\t  0\t0/153\tNA\n+GO:0140482\tiron sensor activity\t  0\t0/153\tNA\n+GO:0140311\tprotein sequestering activity\t  0\t0/153\tNA\n+GO:0140319\treceptor decoy activity\t  0\t0/153\tNA\n+GO:0140487\tmetal ion sequestering activity\t  0\t0/153\tNA\n+GO:0000497\tDNA template activity\t  0\t0/153\tNA\n+GO:0140490\tmicrotubule nucleator activity\t  0\t0/153\tNA\n'