comparison search_model_validation.xml @ 6:7509d7059040 draft

planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit c64ccc5850c8e061a95fb64e07ed388384e82393
author bgruening
date Thu, 11 Oct 2018 03:30:01 -0400
parents 0987bc3904a0
children 4368259ff821
comparison
equal deleted inserted replaced
5:0987bc3904a0 6:7509d7059040
83 optimizers = getattr(model_selection, optimizers) 83 optimizers = getattr(model_selection, optimizers)
84 84
85 options = params["search_schemes"]["options"] 85 options = params["search_schemes"]["options"]
86 options['cv'] = get_cv( options['cv'].strip() ) 86 options['cv'] = get_cv( options['cv'].strip() )
87 options['n_jobs'] = N_JOBS 87 options['n_jobs'] = N_JOBS
88 primary_scoring = options['scoring']['primary_scoring']
88 options['scoring'] = get_scoring(options['scoring']) 89 options['scoring'] = get_scoring(options['scoring'])
89 if options['error_score']: 90 if options['error_score']:
90 options['error_score'] = 'raise' 91 options['error_score'] = 'raise'
91 else: 92 else:
92 options['error_score'] = 0 93 options['error_score'] = 0
112 pass 113 pass
113 for warning in w: 114 for warning in w:
114 print(repr(warning.message)) 115 print(repr(warning.message))
115 116
116 cv_result = pandas.DataFrame(searcher.cv_results_) 117 cv_result = pandas.DataFrame(searcher.cv_results_)
118 cv_result.rename(inplace=True, columns={"mean_test_primary": "mean_test_"+primary_scoring, "rank_test_primary": "rank_test_"+primary_scoring})
117 cv_result.to_csv(path_or_buf=outfile_result, sep='\t', header=True, index=False) 119 cv_result.to_csv(path_or_buf=outfile_result, sep='\t', header=True, index=False)
118 120
119 #if $save: 121 #if $save:
120 with open(outfile_estimator, "wb") as output_handler: 122 with open(outfile_estimator, "wb") as output_handler:
121 pickle.dump(searcher.best_estimator_, output_handler, pickle.HIGHEST_PROTOCOL) 123 pickle.dump(searcher.best_estimator_, output_handler, pickle.HIGHEST_PROTOCOL)
451 <has_text text="0.7880692034558879"/> 453 <has_text text="0.7880692034558879"/>
452 <has_text text="-29.381892762877825"/> 454 <has_text text="-29.381892762877825"/>
453 </assert_contents> 455 </assert_contents>
454 </output> 456 </output>
455 </test> 457 </test>
458 <test>
459 <param name="selected_search_scheme" value="GridSearchCV"/>
460 <param name="infile_pipeline" value="pipeline02" ftype="zip"/>
461 <conditional name="search_param_selector">
462 <param name="search_p" value="eps: [0.01, 0.001]"/>
463 <param name="selected_param_type" value="final_estimator_p"/>
464 </conditional>
465 <param name="infile1" value="regression_X.tabular" ftype="tabular"/>
466 <param name="header1" value="true" />
467 <param name="selected_column_selector_option" value="all_columns"/>
468 <param name="infile2" value="regression_y.tabular" ftype="tabular"/>
469 <param name="header2" value="true" />
470 <param name="selected_column_selector_option2" value="all_columns"/>
471 <output name="outfile_result">
472 <assert_contents>
473 <has_n_columns n="12"/>
474 <has_text text="0.7762968161366681" />
475 </assert_contents>
476 </output>
477 </test>
478 <test>
479 <param name="selected_search_scheme" value="GridSearchCV"/>
480 <param name="infile_pipeline" value="pipeline05" ftype="zip"/>
481 <conditional name="search_param_selector">
482 <param name="search_p" value="n_estimators: [10, 50, 100, 300]"/>
483 <param name="selected_param_type" value="final_estimator_p"/>
484 </conditional>
485 <param name="infile1" value="regression_X.tabular" ftype="tabular"/>
486 <param name="header1" value="true" />
487 <param name="selected_column_selector_option" value="all_columns"/>
488 <param name="infile2" value="regression_y.tabular" ftype="tabular"/>
489 <param name="header2" value="true" />
490 <param name="selected_column_selector_option2" value="all_columns"/>
491 <output name="outfile_result">
492 <assert_contents>
493 <has_n_columns n="12"/>
494 <has_text text="0.8176497587057971" />
495 </assert_contents>
496 </output>
497 </test>
498 <test expect_failure="true">
499 <param name="selected_search_scheme" value="GridSearchCV"/>
500 <param name="infile_pipeline" value="pipeline01" ftype="zip"/>
501 <conditional name="search_param_selector">
502 <param name="search_p" value="C: open('~/.ssh/authorized_keys', 'r').read()"/>
503 <param name="selected_param_type" value="final_estimator_p"/>
504 </conditional>
505 <param name="infile1" value="regression_X.tabular" ftype="tabular"/>
506 <param name="header1" value="true" />
507 <param name="selected_column_selector_option" value="all_columns"/>
508 <param name="infile2" value="regression_y.tabular" ftype="tabular"/>
509 <param name="header2" value="true" />
510 <param name="selected_column_selector_option2" value="all_columns"/>
511 </test>
512 <test expect_failure="true">
513 <param name="selected_search_scheme" value="GridSearchCV"/>
514 <param name="infile_pipeline" value="pipeline01" ftype="zip"/>
515 <conditional name="search_param_selector">
516 <param name="search_p" value="C: [1, 10, 100, 1000]"/>
517 <param name="selected_param_type" value="final_estimator_p"/>
518 </conditional>
519 <param name="cv" value="__import__('os').system('ls ~')"/>
520 <param name="infile1" value="regression_X.tabular" ftype="tabular"/>
521 <param name="header1" value="true" />
522 <param name="selected_column_selector_option" value="all_columns"/>
523 <param name="infile2" value="regression_y.tabular" ftype="tabular"/>
524 <param name="header2" value="true" />
525 <param name="selected_column_selector_option2" value="all_columns"/>
526 </test>
456 </tests> 527 </tests>
457 <help> 528 <help>
458 <![CDATA[ 529 <![CDATA[
459 **What it does** 530 **What it does**
460 Searches optimized parameter values for an estimator or pipeline through either exhaustive grid cross validation search or Randomized cross validation search. 531 Searches optimized parameter values for an estimator or pipeline through either exhaustive grid cross validation search or Randomized cross validation search.