# HG changeset patch # User bgruening # Date 1377517051 14400 # Node ID e1bc8415f875c1c791740bc65d4e9d87dc4d9299 Uploaded diff -r 000000000000 -r e1bc8415f875 chemicaltoolbox_merging_chemical_databases_workflow.ga --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/chemicaltoolbox_merging_chemical_databases_workflow.ga Mon Aug 26 07:37:31 2013 -0400 @@ -0,0 +1,1190 @@ +{ + "a_galaxy_workflow": "true", + "annotation": "Runs the chemicaltoolbox to merge chemical libraries.
\n
\nThis workflow is available on the Galaxy Tool Shed with a README file giving more information, and full citation details (Gruening et al. 2013).", + "format-version": "0.1", + "name": "Preparation of a large compound library by merging of chemical databases.", + "steps": { + "0": { + "annotation": "", + "id": 0, + "input_connections": {}, + "inputs": [], + "name": "Online data", + "outputs": [ + { + "name": "output", + "type": "txt" + } + ], + "position": { + "left": 291, + "top": 391 + }, + "post_job_actions": { + "ChangeDatatypeActionoutput": { + "action_arguments": { + "newtype": "sdf" + }, + "action_type": "ChangeDatatypeAction", + "output_name": "output" + }, + "HideDatasetActionoutput": { + "action_arguments": {}, + "action_type": "HideDatasetAction", + "output_name": "output" + } + }, + "tool_errors": null, + "tool_id": "ctb_online_data_fetch", + "tool_state": "{\"__page__\": 0, \"whitelist\": \"\\\"\\\"\", \"url_paste\": \"\\\"http://www.drugbank.ca/system/downloads/current/structures/all.sdf.zip\\\"\"}", + "tool_version": "0.2", + "type": "tool", + "user_outputs": [] + }, + "1": { + "annotation": "", + "id": 1, + "input_connections": {}, + "inputs": [], + "name": "Online data", + "outputs": [ + { + "name": "output", + "type": "txt" + } + ], + "position": { + "left": 304, + "top": 733 + }, + "post_job_actions": { + "ChangeDatatypeActionoutput": { + "action_arguments": { + "newtype": "tabular" + }, + "action_type": "ChangeDatatypeAction", + "output_name": "output" + }, + "HideDatasetActionoutput": { + "action_arguments": {}, + "action_type": "HideDatasetAction", + "output_name": "output" + } + }, + "tool_errors": null, + "tool_id": "ctb_online_data_fetch", + "tool_state": "{\"__page__\": 0, \"whitelist\": \"\\\"\\\"\", \"url_paste\": \"\\\"http://zinc.docking.org/db/bysubset/6/6_p0.smi.gz\\\\nhttp://zinc.docking.org/db/bysubset/46/46_p0.smi.gz\\\"\"}", + "tool_version": "0.2", + "type": "tool", + "user_outputs": [] + }, + "2": { + "annotation": "", + "id": 
2, + "input_connections": {}, + "inputs": [], + "name": "Online data", + "outputs": [ + { + "name": "output", + "type": "txt" + } + ], + "position": { + "left": 305, + "top": 1048 + }, + "post_job_actions": { + "ChangeDatatypeActionoutput": { + "action_arguments": { + "newtype": "sdf" + }, + "action_type": "ChangeDatatypeAction", + "output_name": "output" + }, + "HideDatasetActionoutput": { + "action_arguments": {}, + "action_type": "HideDatasetAction", + "output_name": "output" + } + }, + "tool_errors": null, + "tool_id": "ctb_online_data_fetch", + "tool_state": "{\"__page__\": 0, \"whitelist\": \"\\\"\\\"\", \"url_paste\": \"\\\"ftp://ftp.ebi.ac.uk/pub/databases/chembl/ChEMBLdb/latest/chembl_16.sdf.gz\\\"\"}", + "tool_version": "0.2", + "type": "tool", + "user_outputs": [] + }, + "3": { + "annotation": "", + "id": 3, + "input_connections": {}, + "inputs": [], + "name": "PubChem Download", + "outputs": [ + { + "name": "pubchem_smi", + "type": "smi" + } + ], + "position": { + "left": 312, + "top": 1448 + }, + "post_job_actions": { + "ChangeDatatypeActionpubchem_smi": { + "action_arguments": { + "newtype": "tabular" + }, + "action_type": "ChangeDatatypeAction", + "output_name": "pubchem_smi" + }, + "HideDatasetActionpubchem_smi": { + "action_arguments": {}, + "action_type": "HideDatasetAction", + "output_name": "pubchem_smi" + } + }, + "tool_errors": null, + "tool_id": "ctb_pubchem_download_as_smiles", + "tool_state": "{\"__page__\": 0, \"infile\": \"null\"}", + "tool_version": "1.0.0", + "type": "tool", + "user_outputs": [] + }, + "4": { + "annotation": "", + "id": 4, + "input_connections": { + "infile": { + "id": 0, + "output_name": "output" + } + }, + "inputs": [], + "name": "Change Title", + "outputs": [ + { + "name": "outfile", + "type": "sdf" + } + ], + "position": { + "left": 584, + "top": 297 + }, + "post_job_actions": { + "HideDatasetActionoutfile": { + "action_arguments": {}, + "action_type": "HideDatasetAction", + "output_name": "outfile" + } + }, + 
"tool_errors": null, + "tool_id": "ctb_change_title", + "tool_state": "{\"__page__\": 0, \"infile\": \"null\", \"key\": \"\\\"DRUGBANK_ID\\\"\"}", + "tool_version": "0.0.1", + "type": "tool", + "user_outputs": [] + }, + "5": { + "annotation": "", + "id": 5, + "input_connections": { + "input": { + "id": 1, + "output_name": "output" + } + }, + "inputs": [], + "name": "Filter", + "outputs": [ + { + "name": "out_file1", + "type": "input" + } + ], + "position": { + "left": 593, + "top": 624 + }, + "post_job_actions": { + "ChangeDatatypeActionout_file1": { + "action_arguments": { + "newtype": "smi" + }, + "action_type": "ChangeDatatypeAction", + "output_name": "out_file1" + }, + "HideDatasetActionout_file1": { + "action_arguments": {}, + "action_type": "HideDatasetAction", + "output_name": "out_file1" + } + }, + "tool_errors": null, + "tool_id": "Filter1", + "tool_state": "{\"input\": \"null\", \"header_lines\": \"\\\"0\\\"\", \"cond\": \"\\\"c1.strip()!='' and c1.strip()!='.'\\\"\", \"__page__\": 0}", + "tool_version": "1.1.0", + "type": "tool", + "user_outputs": [] + }, + "6": { + "annotation": "", + "id": 6, + "input_connections": { + "infile": { + "id": 2, + "output_name": "output" + } + }, + "inputs": [], + "name": "Change Title", + "outputs": [ + { + "name": "outfile", + "type": "sdf" + } + ], + "position": { + "left": 592, + "top": 988 + }, + "post_job_actions": { + "HideDatasetActionoutfile": { + "action_arguments": {}, + "action_type": "HideDatasetAction", + "output_name": "outfile" + } + }, + "tool_errors": null, + "tool_id": "ctb_change_title", + "tool_state": "{\"__page__\": 0, \"infile\": \"null\", \"key\": \"\\\"chembl_id\\\"\"}", + "tool_version": "0.0.1", + "type": "tool", + "user_outputs": [] + }, + "7": { + "annotation": "", + "id": 7, + "input_connections": { + "input": { + "id": 3, + "output_name": "pubchem_smi" + } + }, + "inputs": [], + "name": "Filter", + "outputs": [ + { + "name": "out_file1", + "type": "input" + } + ], + "position": { + "left": 
623, + "top": 1365 + }, + "post_job_actions": { + "ChangeDatatypeActionout_file1": { + "action_arguments": { + "newtype": "smi" + }, + "action_type": "ChangeDatatypeAction", + "output_name": "out_file1" + }, + "HideDatasetActionout_file1": { + "action_arguments": {}, + "action_type": "HideDatasetAction", + "output_name": "out_file1" + } + }, + "tool_errors": null, + "tool_id": "Filter1", + "tool_state": "{\"input\": \"null\", \"header_lines\": \"\\\"0\\\"\", \"cond\": \"\\\"c1.strip()!='' and c1.strip()!='.'\\\"\", \"__page__\": 0}", + "tool_version": "1.1.0", + "type": "tool", + "user_outputs": [] + }, + "8": { + "annotation": "", + "id": 8, + "input_connections": { + "infile": { + "id": 4, + "output_name": "outfile" + } + }, + "inputs": [], + "name": "Compound Convert", + "outputs": [ + { + "name": "outfile", + "type": "text" + } + ], + "position": { + "left": 537, + "top": 410 + }, + "post_job_actions": { + "ChangeDatatypeActionoutfile": { + "action_arguments": { + "newtype": "tabular" + }, + "action_type": "ChangeDatatypeAction", + "output_name": "outfile" + }, + "HideDatasetActionoutfile": { + "action_arguments": {}, + "action_type": "HideDatasetAction", + "output_name": "outfile" + } + }, + "tool_errors": null, + "tool_id": "ctb_compound_convert", + "tool_state": "{\"__page__\": 0, \"dative_bonds\": \"\\\"True\\\"\", \"appendtotitle\": \"\\\"\\\"\", \"remove_h\": \"\\\"False\\\"\", \"oformat\": \"{\\\"can_iso_chi\\\": \\\"False\\\", \\\"can_atomclass_out\\\": \\\"False\\\", \\\"can_rad\\\": \\\"False\\\", \\\"can_exp_h\\\": \\\"False\\\", \\\"oformat_opts_selector\\\": \\\"can\\\", \\\"__current_case__\\\": 10}\", \"ph\": \"\\\"7.0\\\"\", \"unique\": \"{\\\"unique_opts_selector\\\": \\\"\\\", \\\"__current_case__\\\": 0}\", \"infile\": \"null\"}", + "tool_version": "1.0.0", + "type": "tool", + "user_outputs": [] + }, + "9": { + "annotation": "", + "id": 9, + "input_connections": { + "infile": { + "id": 5, + "output_name": "out_file1" + } + }, + "inputs": [], 
+ "name": "Compound Convert", + "outputs": [ + { + "name": "outfile", + "type": "text" + } + ], + "position": { + "left": 537, + "top": 741 + }, + "post_job_actions": { + "ChangeDatatypeActionoutfile": { + "action_arguments": { + "newtype": "tabular" + }, + "action_type": "ChangeDatatypeAction", + "output_name": "outfile" + }, + "HideDatasetActionoutfile": { + "action_arguments": {}, + "action_type": "HideDatasetAction", + "output_name": "outfile" + } + }, + "tool_errors": null, + "tool_id": "ctb_compound_convert", + "tool_state": "{\"__page__\": 0, \"dative_bonds\": \"\\\"True\\\"\", \"appendtotitle\": \"\\\"\\\"\", \"remove_h\": \"\\\"False\\\"\", \"oformat\": \"{\\\"can_iso_chi\\\": \\\"False\\\", \\\"can_atomclass_out\\\": \\\"False\\\", \\\"can_rad\\\": \\\"False\\\", \\\"can_exp_h\\\": \\\"False\\\", \\\"oformat_opts_selector\\\": \\\"can\\\", \\\"__current_case__\\\": 10}\", \"ph\": \"\\\"7.0\\\"\", \"unique\": \"{\\\"unique_opts_selector\\\": \\\"\\\", \\\"__current_case__\\\": 0}\", \"infile\": \"null\"}", + "tool_version": "1.0.0", + "type": "tool", + "user_outputs": [] + }, + "10": { + "annotation": "", + "id": 10, + "input_connections": { + "infile": { + "id": 6, + "output_name": "outfile" + } + }, + "inputs": [], + "name": "Compound Convert", + "outputs": [ + { + "name": "outfile", + "type": "text" + } + ], + "position": { + "left": 557, + "top": 1115 + }, + "post_job_actions": { + "ChangeDatatypeActionoutfile": { + "action_arguments": { + "newtype": "tabular" + }, + "action_type": "ChangeDatatypeAction", + "output_name": "outfile" + }, + "HideDatasetActionoutfile": { + "action_arguments": {}, + "action_type": "HideDatasetAction", + "output_name": "outfile" + } + }, + "tool_errors": null, + "tool_id": "ctb_compound_convert", + "tool_state": "{\"__page__\": 0, \"dative_bonds\": \"\\\"True\\\"\", \"appendtotitle\": \"\\\"\\\"\", \"remove_h\": \"\\\"False\\\"\", \"oformat\": \"{\\\"can_iso_chi\\\": \\\"False\\\", \\\"can_atomclass_out\\\": \\\"False\\\", 
\\\"can_rad\\\": \\\"False\\\", \\\"can_exp_h\\\": \\\"False\\\", \\\"oformat_opts_selector\\\": \\\"can\\\", \\\"__current_case__\\\": 10}\", \"ph\": \"\\\"7.0\\\"\", \"unique\": \"{\\\"unique_opts_selector\\\": \\\"\\\", \\\"__current_case__\\\": 0}\", \"infile\": \"null\"}", + "tool_version": "1.0.0", + "type": "tool", + "user_outputs": [] + }, + "11": { + "annotation": "", + "id": 11, + "input_connections": { + "infile": { + "id": 7, + "output_name": "out_file1" + } + }, + "inputs": [], + "name": "Compound Convert", + "outputs": [ + { + "name": "outfile", + "type": "text" + } + ], + "position": { + "left": 576, + "top": 1480 + }, + "post_job_actions": { + "ChangeDatatypeActionoutfile": { + "action_arguments": { + "newtype": "tabular" + }, + "action_type": "ChangeDatatypeAction", + "output_name": "outfile" + }, + "HideDatasetActionoutfile": { + "action_arguments": {}, + "action_type": "HideDatasetAction", + "output_name": "outfile" + } + }, + "tool_errors": null, + "tool_id": "ctb_compound_convert", + "tool_state": "{\"__page__\": 0, \"dative_bonds\": \"\\\"True\\\"\", \"appendtotitle\": \"\\\"\\\"\", \"remove_h\": \"\\\"False\\\"\", \"oformat\": \"{\\\"can_iso_chi\\\": \\\"False\\\", \\\"can_atomclass_out\\\": \\\"False\\\", \\\"can_rad\\\": \\\"False\\\", \\\"can_exp_h\\\": \\\"False\\\", \\\"oformat_opts_selector\\\": \\\"can\\\", \\\"__current_case__\\\": 10}\", \"ph\": \"\\\"7.0\\\"\", \"unique\": \"{\\\"unique_opts_selector\\\": \\\"\\\", \\\"__current_case__\\\": 0}\", \"infile\": \"null\"}", + "tool_version": "1.0.0", + "type": "tool", + "user_outputs": [] + }, + "12": { + "annotation": "", + "id": 12, + "input_connections": { + "input": { + "id": 8, + "output_name": "outfile" + } + }, + "inputs": [], + "name": "Add column", + "outputs": [ + { + "name": "out_file1", + "type": "input" + } + ], + "position": { + "left": 951, + "top": 295 + }, + "post_job_actions": { + "HideDatasetActionout_file1": { + "action_arguments": {}, + "action_type": 
"HideDatasetAction", + "output_name": "out_file1" + } + }, + "tool_errors": null, + "tool_id": "addValue", + "tool_state": "{\"__page__\": 0, \"input\": \"null\", \"exp\": \"\\\"_drugbank\\\"\", \"iterate\": \"\\\"no\\\"\"}", + "tool_version": "1.0.0", + "type": "tool", + "user_outputs": [] + }, + "13": { + "annotation": "", + "id": 13, + "input_connections": { + "input": { + "id": 9, + "output_name": "outfile" + } + }, + "inputs": [], + "name": "Add column", + "outputs": [ + { + "name": "out_file1", + "type": "input" + } + ], + "position": { + "left": 963, + "top": 635 + }, + "post_job_actions": { + "HideDatasetActionout_file1": { + "action_arguments": {}, + "action_type": "HideDatasetAction", + "output_name": "out_file1" + } + }, + "tool_errors": null, + "tool_id": "addValue", + "tool_state": "{\"__page__\": 0, \"input\": \"null\", \"exp\": \"\\\"_zinc\\\"\", \"iterate\": \"\\\"no\\\"\"}", + "tool_version": "1.0.0", + "type": "tool", + "user_outputs": [] + }, + "14": { + "annotation": "", + "id": 14, + "input_connections": { + "input": { + "id": 10, + "output_name": "outfile" + } + }, + "inputs": [], + "name": "Add column", + "outputs": [ + { + "name": "out_file1", + "type": "input" + } + ], + "position": { + "left": 981, + "top": 987 + }, + "post_job_actions": { + "HideDatasetActionout_file1": { + "action_arguments": {}, + "action_type": "HideDatasetAction", + "output_name": "out_file1" + } + }, + "tool_errors": null, + "tool_id": "addValue", + "tool_state": "{\"__page__\": 0, \"input\": \"null\", \"exp\": \"\\\"_chembldb\\\"\", \"iterate\": \"\\\"no\\\"\"}", + "tool_version": "1.0.0", + "type": "tool", + "user_outputs": [] + }, + "15": { + "annotation": "", + "id": 15, + "input_connections": { + "input": { + "id": 11, + "output_name": "outfile" + } + }, + "inputs": [], + "name": "Add column", + "outputs": [ + { + "name": "out_file1", + "type": "input" + } + ], + "position": { + "left": 995, + "top": 1358 + }, + "post_job_actions": { + 
"HideDatasetActionout_file1": { + "action_arguments": {}, + "action_type": "HideDatasetAction", + "output_name": "out_file1" + } + }, + "tool_errors": null, + "tool_id": "addValue", + "tool_state": "{\"__page__\": 0, \"input\": \"null\", \"exp\": \"\\\"_pubchem\\\"\", \"iterate\": \"\\\"no\\\"\"}", + "tool_version": "1.0.0", + "type": "tool", + "user_outputs": [] + }, + "16": { + "annotation": "", + "id": 16, + "input_connections": { + "input": { + "id": 12, + "output_name": "out_file1" + } + }, + "inputs": [], + "name": "Unique", + "outputs": [ + { + "name": "outfile", + "type": "input" + } + ], + "position": { + "left": 960, + "top": 420 + }, + "post_job_actions": { + "ChangeDatatypeActionoutfile": { + "action_arguments": { + "newtype": "smi" + }, + "action_type": "ChangeDatatypeAction", + "output_name": "outfile" + }, + "RenameDatasetActionoutfile": { + "action_arguments": { + "newname": "Non-redundant DrugBank" + }, + "action_type": "RenameDatasetAction", + "output_name": "outfile" + } + }, + "tool_errors": null, + "tool_id": "bg_uniq", + "tool_state": "{\"adv_opts\": \"{\\\"column_end\\\": {\\\"__class__\\\": \\\"UnvalidatedValue\\\", \\\"value\\\": \\\"1\\\"}, \\\"column_start\\\": {\\\"__class__\\\": \\\"UnvalidatedValue\\\", \\\"value\\\": \\\"1\\\"}, \\\"adv_opts_selector\\\": \\\"advanced\\\", \\\"__current_case__\\\": 1}\", \"input\": \"null\", \"ignore_case\": \"\\\"False\\\"\", \"is_numeric\": \"\\\"False\\\"\", \"__page__\": 0}", + "tool_version": "0.3", + "type": "tool", + "user_outputs": [] + }, + "17": { + "annotation": "", + "id": 17, + "input_connections": { + "input": { + "id": 13, + "output_name": "out_file1" + } + }, + "inputs": [], + "name": "Unique", + "outputs": [ + { + "name": "outfile", + "type": "input" + } + ], + "position": { + "left": 955, + "top": 757 + }, + "post_job_actions": { + "ChangeDatatypeActionoutfile": { + "action_arguments": { + "newtype": "smi" + }, + "action_type": "ChangeDatatypeAction", + "output_name": "outfile" + }, 
+ "RenameDatasetActionoutfile": { + "action_arguments": { + "newname": "Non-redundant ZINC" + }, + "action_type": "RenameDatasetAction", + "output_name": "outfile" + } + }, + "tool_errors": null, + "tool_id": "bg_uniq", + "tool_state": "{\"adv_opts\": \"{\\\"column_end\\\": {\\\"__class__\\\": \\\"UnvalidatedValue\\\", \\\"value\\\": \\\"1\\\"}, \\\"column_start\\\": {\\\"__class__\\\": \\\"UnvalidatedValue\\\", \\\"value\\\": \\\"1\\\"}, \\\"adv_opts_selector\\\": \\\"advanced\\\", \\\"__current_case__\\\": 1}\", \"input\": \"null\", \"ignore_case\": \"\\\"False\\\"\", \"is_numeric\": \"\\\"False\\\"\", \"__page__\": 0}", + "tool_version": "0.3", + "type": "tool", + "user_outputs": [] + }, + "18": { + "annotation": "", + "id": 18, + "input_connections": { + "input": { + "id": 14, + "output_name": "out_file1" + } + }, + "inputs": [], + "name": "Unique", + "outputs": [ + { + "name": "outfile", + "type": "input" + } + ], + "position": { + "left": 981, + "top": 1122 + }, + "post_job_actions": { + "ChangeDatatypeActionoutfile": { + "action_arguments": { + "newtype": "smi" + }, + "action_type": "ChangeDatatypeAction", + "output_name": "outfile" + }, + "RenameDatasetActionoutfile": { + "action_arguments": { + "newname": "Non-redundant ChEMBLdb" + }, + "action_type": "RenameDatasetAction", + "output_name": "outfile" + } + }, + "tool_errors": null, + "tool_id": "bg_uniq", + "tool_state": "{\"adv_opts\": \"{\\\"column_end\\\": {\\\"__class__\\\": \\\"UnvalidatedValue\\\", \\\"value\\\": \\\"1\\\"}, \\\"column_start\\\": {\\\"__class__\\\": \\\"UnvalidatedValue\\\", \\\"value\\\": \\\"1\\\"}, \\\"adv_opts_selector\\\": \\\"advanced\\\", \\\"__current_case__\\\": 1}\", \"input\": \"null\", \"ignore_case\": \"\\\"False\\\"\", \"is_numeric\": \"\\\"False\\\"\", \"__page__\": 0}", + "tool_version": "0.3", + "type": "tool", + "user_outputs": [] + }, + "19": { + "annotation": "", + "id": 19, + "input_connections": { + "input1": { + "id": 12, + "output_name": "out_file1" + }, + 
"queries_0|input2": { + "id": 13, + "output_name": "out_file1" + }, + "queries_1|input2": { + "id": 14, + "output_name": "out_file1" + }, + "queries_2|input2": { + "id": 15, + "output_name": "out_file1" + } + }, + "inputs": [], + "name": "Concatenate datasets", + "outputs": [ + { + "name": "out_file1", + "type": "input" + } + ], + "position": { + "left": 1419, + "top": 824 + }, + "post_job_actions": { + "ChangeDatatypeActionout_file1": { + "action_arguments": { + "newtype": "tabular" + }, + "action_type": "ChangeDatatypeAction", + "output_name": "out_file1" + }, + "HideDatasetActionout_file1": { + "action_arguments": {}, + "action_type": "HideDatasetAction", + "output_name": "out_file1" + } + }, + "tool_errors": null, + "tool_id": "cat1", + "tool_state": "{\"__page__\": 0, \"input1\": \"null\", \"queries\": \"[{\\\"input2\\\": null, \\\"__index__\\\": 0}, {\\\"input2\\\": null, \\\"__index__\\\": 1}, {\\\"input2\\\": null, \\\"__index__\\\": 2}]\"}", + "tool_version": "1.0.0", + "type": "tool", + "user_outputs": [] + }, + "20": { + "annotation": "", + "id": 20, + "input_connections": { + "input": { + "id": 15, + "output_name": "out_file1" + } + }, + "inputs": [], + "name": "Unique", + "outputs": [ + { + "name": "outfile", + "type": "input" + } + ], + "position": { + "left": 1001, + "top": 1476 + }, + "post_job_actions": { + "ChangeDatatypeActionoutfile": { + "action_arguments": { + "newtype": "smi" + }, + "action_type": "ChangeDatatypeAction", + "output_name": "outfile" + }, + "RenameDatasetActionoutfile": { + "action_arguments": { + "newname": "Non-redundant PubChem" + }, + "action_type": "RenameDatasetAction", + "output_name": "outfile" + } + }, + "tool_errors": null, + "tool_id": "bg_uniq", + "tool_state": "{\"adv_opts\": \"{\\\"column_end\\\": {\\\"__class__\\\": \\\"UnvalidatedValue\\\", \\\"value\\\": \\\"1\\\"}, \\\"column_start\\\": {\\\"__class__\\\": \\\"UnvalidatedValue\\\", \\\"value\\\": \\\"1\\\"}, \\\"adv_opts_selector\\\": \\\"advanced\\\", 
\\\"__current_case__\\\": 1}\", \"input\": \"null\", \"ignore_case\": \"\\\"False\\\"\", \"is_numeric\": \"\\\"False\\\"\", \"__page__\": 0}", + "tool_version": "0.3", + "type": "tool", + "user_outputs": [] + }, + "21": { + "annotation": "", + "id": 21, + "input_connections": { + "input1": { + "id": 19, + "output_name": "out_file1" + } + }, + "inputs": [], + "name": "Merge Columns", + "outputs": [ + { + "name": "out_file1", + "type": "tabular" + } + ], + "position": { + "left": 1763, + "top": 907 + }, + "post_job_actions": { + "HideDatasetActionout_file1": { + "action_arguments": {}, + "action_type": "HideDatasetAction", + "output_name": "out_file1" + } + }, + "tool_errors": null, + "tool_id": "mergeCols1", + "tool_state": "{\"__page__\": 0, \"input1\": \"null\", \"col2\": \"{\\\"__class__\\\": \\\"UnvalidatedValue\\\", \\\"value\\\": \\\"3\\\"}\", \"columns\": \"[]\", \"col1\": \"{\\\"__class__\\\": \\\"UnvalidatedValue\\\", \\\"value\\\": \\\"2\\\"}\"}", + "tool_version": "1.0.1", + "type": "tool", + "user_outputs": [] + }, + "22": { + "annotation": "", + "id": 22, + "input_connections": { + "input": { + "id": 21, + "output_name": "out_file1" + } + }, + "inputs": [], + "name": "Cut", + "outputs": [ + { + "name": "out_file1", + "type": "tabular" + } + ], + "position": { + "left": 1763, + "top": 797 + }, + "post_job_actions": { + "HideDatasetActionout_file1": { + "action_arguments": {}, + "action_type": "HideDatasetAction", + "output_name": "out_file1" + } + }, + "tool_errors": null, + "tool_id": "Cut1", + "tool_state": "{\"columnList\": \"\\\"c1,c4\\\"\", \"input\": \"null\", \"delimiter\": \"\\\"T\\\"\", \"__page__\": 0}", + "tool_version": "1.0.2", + "type": "tool", + "user_outputs": [] + }, + "23": { + "annotation": "", + "id": 23, + "input_connections": { + "input": { + "id": 22, + "output_name": "out_file1" + } + }, + "inputs": [], + "name": "Filter", + "outputs": [ + { + "name": "out_file1", + "type": "input" + } + ], + "position": { + "left": 2094, + "top": 
912 + }, + "post_job_actions": { + "HideDatasetActionout_file1": { + "action_arguments": {}, + "action_type": "HideDatasetAction", + "output_name": "out_file1" + } + }, + "tool_errors": null, + "tool_id": "Filter1", + "tool_state": "{\"input\": \"null\", \"header_lines\": \"\\\"0\\\"\", \"cond\": \"\\\"c1.strip()!='' and c1.strip()!='.'\\\"\", \"__page__\": 0}", + "tool_version": "1.1.0", + "type": "tool", + "user_outputs": [] + }, + "24": { + "annotation": "", + "id": 24, + "input_connections": { + "input": { + "id": 23, + "output_name": "out_file1" + } + }, + "inputs": [], + "name": "Manipulation", + "outputs": [ + { + "name": "outfile", + "type": "input" + } + ], + "position": { + "left": 2099, + "top": 804 + }, + "post_job_actions": { + "HideDatasetActionoutfile": { + "action_arguments": {}, + "action_type": "HideDatasetAction", + "output_name": "outfile" + } + }, + "tool_errors": null, + "tool_id": "sed_stream_editor", + "tool_state": "{\"__page__\": 0, \"input\": \"null\", \"pattern\": \"\\\"s/ /_/g\\\"\"}", + "tool_version": "0.0.1", + "type": "tool", + "user_outputs": [] + }, + "25": { + "annotation": "", + "id": 25, + "input_connections": { + "input": { + "id": 24, + "output_name": "outfile" + } + }, + "inputs": [], + "name": "Unique", + "outputs": [ + { + "name": "outfile", + "type": "input" + } + ], + "position": { + "left": 2098, + "top": 681 + }, + "post_job_actions": { + "ChangeDatatypeActionoutfile": { + "action_arguments": { + "newtype": "smi" + }, + "action_type": "ChangeDatatypeAction", + "output_name": "outfile" + }, + "RenameDatasetActionoutfile": { + "action_arguments": { + "newname": "Non-redundant merged libraries" + }, + "action_type": "RenameDatasetAction", + "output_name": "outfile" + } + }, + "tool_errors": null, + "tool_id": "bg_uniq", + "tool_state": "{\"adv_opts\": \"{\\\"column_end\\\": {\\\"__class__\\\": \\\"UnvalidatedValue\\\", \\\"value\\\": \\\"1\\\"}, \\\"column_start\\\": {\\\"__class__\\\": \\\"UnvalidatedValue\\\", 
\\\"value\\\": \\\"1\\\"}, \\\"adv_opts_selector\\\": \\\"advanced\\\", \\\"__current_case__\\\": 1}\", \"input\": \"null\", \"ignore_case\": \"\\\"False\\\"\", \"is_numeric\": \"\\\"False\\\"\", \"__page__\": 0}", + "tool_version": "0.3", + "type": "tool", + "user_outputs": [] + }, + "26": { + "annotation": "", + "id": 26, + "input_connections": { + "infile": { + "id": 25, + "output_name": "outfile" + } + }, + "inputs": [], + "name": "Remove counterions and fragments", + "outputs": [ + { + "name": "outfile", + "type": "sdf" + } + ], + "position": { + "left": 2392, + "top": 907 + }, + "post_job_actions": { + "HideDatasetActionoutfile": { + "action_arguments": {}, + "action_type": "HideDatasetAction", + "output_name": "outfile" + } + }, + "tool_errors": null, + "tool_id": "ctb_remIons", + "tool_state": "{\"__page__\": 0, \"infile\": \"null\"}", + "tool_version": "1.0", + "type": "tool", + "user_outputs": [] + }, + "27": { + "annotation": "", + "id": 27, + "input_connections": { + "input": { + "id": 26, + "output_name": "outfile" + } + }, + "inputs": [], + "name": "Select", + "outputs": [ + { + "name": "out_file1", + "type": "input" + } + ], + "position": { + "left": 2447, + "top": 795 + }, + "post_job_actions": { + "HideDatasetActionout_file1": { + "action_arguments": {}, + "action_type": "HideDatasetAction", + "output_name": "out_file1" + } + }, + "tool_errors": null, + "tool_id": "Grep1", + "tool_state": "{\"__page__\": 0, \"input\": \"null\", \"invert\": \"\\\"true\\\"\", \"pattern\": \"\\\"\\\\\\\\*\\\"\"}", + "tool_version": "1.0.1", + "type": "tool", + "user_outputs": [] + }, + "28": { + "annotation": "", + "id": 28, + "input_connections": { + "input": { + "id": 27, + "output_name": "out_file1" + } + }, + "inputs": [], + "name": "Unique", + "outputs": [ + { + "name": "outfile", + "type": "input" + } + ], + "position": { + "left": 2444, + "top": 678 + }, + "post_job_actions": { + "ChangeDatatypeActionoutfile": { + "action_arguments": { + "newtype": "tabular" + 
}, + "action_type": "ChangeDatatypeAction", + "output_name": "outfile" + }, + "RenameDatasetActionoutfile": { + "action_arguments": { + "newname": "Filtered merged libraries" + }, + "action_type": "RenameDatasetAction", + "output_name": "outfile" + } + }, + "tool_errors": null, + "tool_id": "bg_uniq", + "tool_state": "{\"adv_opts\": \"{\\\"adv_opts_selector\\\": \\\"basic\\\", \\\"__current_case__\\\": 0}\", \"input\": \"null\", \"ignore_case\": \"\\\"False\\\"\", \"is_numeric\": \"\\\"False\\\"\", \"__page__\": 0}", + "tool_version": "0.3", + "type": "tool", + "user_outputs": [] + }, + "29": { + "annotation": "", + "id": 29, + "input_connections": { + "input": { + "id": 28, + "output_name": "outfile" + } + }, + "inputs": [], + "name": "Unique", + "outputs": [ + { + "name": "outfile", + "type": "input" + } + ], + "position": { + "left": 2444, + "top": 562 + }, + "post_job_actions": { + "ChangeDatatypeActionoutfile": { + "action_arguments": { + "newtype": "smi" + }, + "action_type": "ChangeDatatypeAction", + "output_name": "outfile" + }, + "RenameDatasetActionoutfile": { + "action_arguments": { + "newname": "Non-redundant filtered merged libraries" + }, + "action_type": "RenameDatasetAction", + "output_name": "outfile" + } + }, + "tool_errors": null, + "tool_id": "bg_uniq", + "tool_state": "{\"adv_opts\": \"{\\\"column_end\\\": {\\\"__class__\\\": \\\"UnvalidatedValue\\\", \\\"value\\\": \\\"1\\\"}, \\\"column_start\\\": {\\\"__class__\\\": \\\"UnvalidatedValue\\\", \\\"value\\\": \\\"1\\\"}, \\\"adv_opts_selector\\\": \\\"advanced\\\", \\\"__current_case__\\\": 1}\", \"input\": \"null\", \"ignore_case\": \"\\\"False\\\"\", \"is_numeric\": \"\\\"False\\\"\", \"__page__\": 0}", + "tool_version": "0.3", + "type": "tool", + "user_outputs": [] + } + } +} diff -r 000000000000 -r e1bc8415f875 readme.rst --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/readme.rst Mon Aug 26 07:37:31 2013 -0400 @@ -0,0 +1,44 @@ +This package is a Galaxy workflow for merging of chemical 
libraries using the chemicaltoolbox. + +To learn more about the chemicaltoolbox and all the integrated tools, +please have a look at https://github.com/bgruening/galaxytools/tree/master/chemicaltoolbox. + + +Sample Data +=========== + +The workflow will fetch the sample data from online resources, like PubChem, DrugBank. + + +Citation +======== + +If you use this workflow directly, or a derivative of it, or the associated +chemicaltoolbox wrappers for Galaxy, in work leading to a scientific publication, +please cite: + +Grüning, B. et al. (2013) +ChemicalToolBoX, a new Galaxy for cheminformatics (Submitted). + + +Availability +============ + +This workflow is available on the main Galaxy Tool Shed: + + http://toolshed.g2.bx.psu.edu/view/bgruening/chemicaltoolbox_merging_chemical_databases_workflow + +Development is being done on github: + +https://github.com/bgruening/galaxytools/workflows/chemicaltoolbox + + +Dependencies +============ + +These dependencies should be resolved automatically via the Galaxy Tool Shed: + +* http://toolshed.g2.bx.psu.edu/view/bgruening/unique +* http://toolshed.g2.bx.psu.edu/view/bjoern-gruening/sed_wrapper +* http://toolshed.g2.bx.psu.edu/view/bgruening/chemicaltoolbox + diff -r 000000000000 -r e1bc8415f875 repository_dependencies.xml --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/repository_dependencies.xml Mon Aug 26 07:37:31 2013 -0400 @@ -0,0 +1,6 @@ + + + + + +