# HG changeset patch # User bgruening # Date 1531161135 14400 # Node ID 6352834b1c999500451a45a7cbe3dafdac87a9a2 # Parent a78f96f64939cdd17dd369c8ff9b431ff6fe07f6 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 5d71c93a3dd804b1469852240a86021ab9130364 diff -r a78f96f64939 -r 6352834b1c99 ensemble.xml --- a/ensemble.xml Sun Jul 01 03:19:54 2018 -0400 +++ b/ensemble.xml Mon Jul 09 14:32:15 2018 -0400 @@ -23,6 +23,7 @@ from scipy.io import mmread @COLUMNS_FUNCTION@ +@GET_X_y_FUNCTION@ input_json_path = sys.argv[1] params = json.load(open(input_json_path, "r")) @@ -46,40 +47,8 @@ options["min_samples_leaf"] = 1 if "min_samples_split" in options and options["min_samples_split"] > 1.0: options["min_samples_split"] = int(options["min_samples_split"]) -input_type = params["selected_tasks"]["selected_algorithms"]["input_options"]["selected_input"] -if input_type=="tabular": - header = 'infer' if params["selected_tasks"]["selected_algorithms"]["input_options"]["header1"] else None - column_option = params["selected_tasks"]["selected_algorithms"]["input_options"]["column_selector_options_1"]["selected_column_selector_option"] - if column_option in ["by_index_number", "all_but_by_index_number", "by_header_name", "all_but_by_header_name"]: - c = params["selected_tasks"]["selected_algorithms"]["input_options"]["column_selector_options_1"]["col1"] - else: - c = None - X = read_columns( - "$selected_tasks.selected_algorithms.input_options.infile1", - c = c, - c_option = column_option, - sep='\t', - header=header, - parse_dates=True - ) -else: - X = mmread(open("$selected_tasks.selected_algorithms.input_options.infile1", 'r')) -header = 'infer' if params["selected_tasks"]["selected_algorithms"]["input_options"]["header2"] else None -column_option = params["selected_tasks"]["selected_algorithms"]["input_options"]["column_selector_options_2"]["selected_column_selector_option2"] -if column_option in ["by_index_number", "all_but_by_index_number", "by_header_name", "all_but_by_header_name"]: - c = params["selected_tasks"]["selected_algorithms"]["input_options"]["column_selector_options_2"]["col2"] -else: - c = None -y = read_columns( - "$selected_tasks.selected_algorithms.input_options.infile2", - c = c, - c_option = column_option, - sep='\t', - header=header, - parse_dates=True -) -y=y.ravel() +X, y = get_X_y(params, "$selected_tasks.selected_algorithms.input_options.infile1" ,"$selected_tasks.selected_algorithms.input_options.infile2") my_class = getattr(sklearn.ensemble, algorithm) estimator = my_class(**options) diff -r a78f96f64939 -r 6352834b1c99 main_macros.xml --- a/main_macros.xml Sun Jul 01 03:19:54 2018 -0400 +++ b/main_macros.xml Mon Jul 09 14:32:15 2018 -0400 @@ -64,6 +64,45 @@ return new_selector + +def get_X_y(params, file1, file2): + input_type = params["selected_tasks"]["selected_algorithms"]["input_options"]["selected_input"] + if input_type=="tabular": + header = 'infer' if params["selected_tasks"]["selected_algorithms"]["input_options"]["header1"] else None + column_option = params["selected_tasks"]["selected_algorithms"]["input_options"]["column_selector_options_1"]["selected_column_selector_option"] + if column_option in ["by_index_number", "all_but_by_index_number", "by_header_name", "all_but_by_header_name"]: + c = params["selected_tasks"]["selected_algorithms"]["input_options"]["column_selector_options_1"]["col1"] + else: + c = None + X = read_columns( + file1, + c = c, + c_option = column_option, + sep='\t', + header=header, + parse_dates=True + ) + else: + X = mmread(open(file1, 'r')) + + header = 'infer' if params["selected_tasks"]["selected_algorithms"]["input_options"]["header2"] else None + column_option = params["selected_tasks"]["selected_algorithms"]["input_options"]["column_selector_options_2"]["selected_column_selector_option2"] + if column_option in ["by_index_number", "all_but_by_index_number", "by_header_name", "all_but_by_header_name"]: + c = params["selected_tasks"]["selected_algorithms"]["input_options"]["column_selector_options_2"]["col2"] + else: + c = None + y = read_columns( + file2, + c = c, + c_option = column_option, + sep='\t', + header=header, + parse_dates=True + ) + y=y.ravel() + return X, y + + python @@ -81,34 +120,6 @@ - - - - - - - - - - - - - - - - - - - - - - - - - - - -