Mercurial > repos > bgruening > sklearn_searchcv
comparison search_model_validation.xml @ 6:7509d7059040 draft
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit c64ccc5850c8e061a95fb64e07ed388384e82393
author | bgruening |
---|---|
date | Thu, 11 Oct 2018 03:30:01 -0400 |
parents | 0987bc3904a0 |
children | 4368259ff821 |
comparison
equal
deleted
inserted
replaced
5:0987bc3904a0 | 6:7509d7059040 |
---|---|
83 optimizers = getattr(model_selection, optimizers) | 83 optimizers = getattr(model_selection, optimizers) |
84 | 84 |
85 options = params["search_schemes"]["options"] | 85 options = params["search_schemes"]["options"] |
86 options['cv'] = get_cv( options['cv'].strip() ) | 86 options['cv'] = get_cv( options['cv'].strip() ) |
87 options['n_jobs'] = N_JOBS | 87 options['n_jobs'] = N_JOBS |
88 primary_scoring = options['scoring']['primary_scoring'] | |
88 options['scoring'] = get_scoring(options['scoring']) | 89 options['scoring'] = get_scoring(options['scoring']) |
89 if options['error_score']: | 90 if options['error_score']: |
90 options['error_score'] = 'raise' | 91 options['error_score'] = 'raise' |
91 else: | 92 else: |
92 options['error_score'] = 0 | 93 options['error_score'] = 0 |
112 pass | 113 pass |
113 for warning in w: | 114 for warning in w: |
114 print(repr(warning.message)) | 115 print(repr(warning.message)) |
115 | 116 |
116 cv_result = pandas.DataFrame(searcher.cv_results_) | 117 cv_result = pandas.DataFrame(searcher.cv_results_) |
118 cv_result.rename(inplace=True, columns={"mean_test_primary": "mean_test_"+primary_scoring, "rank_test_primary": "rank_test_"+primary_scoring}) | |
117 cv_result.to_csv(path_or_buf=outfile_result, sep='\t', header=True, index=False) | 119 cv_result.to_csv(path_or_buf=outfile_result, sep='\t', header=True, index=False) |
118 | 120 |
119 #if $save: | 121 #if $save: |
120 with open(outfile_estimator, "wb") as output_handler: | 122 with open(outfile_estimator, "wb") as output_handler: |
121 pickle.dump(searcher.best_estimator_, output_handler, pickle.HIGHEST_PROTOCOL) | 123 pickle.dump(searcher.best_estimator_, output_handler, pickle.HIGHEST_PROTOCOL) |
451 <has_text text="0.7880692034558879"/> | 453 <has_text text="0.7880692034558879"/> |
452 <has_text text="-29.381892762877825"/> | 454 <has_text text="-29.381892762877825"/> |
453 </assert_contents> | 455 </assert_contents> |
454 </output> | 456 </output> |
455 </test> | 457 </test> |
458 <test> | |
459 <param name="selected_search_scheme" value="GridSearchCV"/> | |
460 <param name="infile_pipeline" value="pipeline02" ftype="zip"/> | |
461 <conditional name="search_param_selector"> | |
462 <param name="search_p" value="eps: [0.01, 0.001]"/> | |
463 <param name="selected_param_type" value="final_estimator_p"/> | |
464 </conditional> | |
465 <param name="infile1" value="regression_X.tabular" ftype="tabular"/> | |
466 <param name="header1" value="true" /> | |
467 <param name="selected_column_selector_option" value="all_columns"/> | |
468 <param name="infile2" value="regression_y.tabular" ftype="tabular"/> | |
469 <param name="header2" value="true" /> | |
470 <param name="selected_column_selector_option2" value="all_columns"/> | |
471 <output name="outfile_result"> | |
472 <assert_contents> | |
473 <has_n_columns n="12"/> | |
474 <has_text text="0.7762968161366681" /> | |
475 </assert_contents> | |
476 </output> | |
477 </test> | |
478 <test> | |
479 <param name="selected_search_scheme" value="GridSearchCV"/> | |
480 <param name="infile_pipeline" value="pipeline05" ftype="zip"/> | |
481 <conditional name="search_param_selector"> | |
482 <param name="search_p" value="n_estimators: [10, 50, 100, 300]"/> | |
483 <param name="selected_param_type" value="final_estimator_p"/> | |
484 </conditional> | |
485 <param name="infile1" value="regression_X.tabular" ftype="tabular"/> | |
486 <param name="header1" value="true" /> | |
487 <param name="selected_column_selector_option" value="all_columns"/> | |
488 <param name="infile2" value="regression_y.tabular" ftype="tabular"/> | |
489 <param name="header2" value="true" /> | |
490 <param name="selected_column_selector_option2" value="all_columns"/> | |
491 <output name="outfile_result"> | |
492 <assert_contents> | |
493 <has_n_columns n="12"/> | |
494 <has_text text="0.8176497587057971" /> | |
495 </assert_contents> | |
496 </output> | |
497 </test> | |
498 <test expect_failure="true"> | |
499 <param name="selected_search_scheme" value="GridSearchCV"/> | |
500 <param name="infile_pipeline" value="pipeline01" ftype="zip"/> | |
501 <conditional name="search_param_selector"> | |
502 <param name="search_p" value="C: open('~/.ssh/authorized_keys', 'r').read()"/> | |
503 <param name="selected_param_type" value="final_estimator_p"/> | |
504 </conditional> | |
505 <param name="infile1" value="regression_X.tabular" ftype="tabular"/> | |
506 <param name="header1" value="true" /> | |
507 <param name="selected_column_selector_option" value="all_columns"/> | |
508 <param name="infile2" value="regression_y.tabular" ftype="tabular"/> | |
509 <param name="header2" value="true" /> | |
510 <param name="selected_column_selector_option2" value="all_columns"/> | |
511 </test> | |
512 <test expect_failure="true"> | |
513 <param name="selected_search_scheme" value="GridSearchCV"/> | |
514 <param name="infile_pipeline" value="pipeline01" ftype="zip"/> | |
515 <conditional name="search_param_selector"> | |
516 <param name="search_p" value="C: [1, 10, 100, 1000]"/> | |
517 <param name="selected_param_type" value="final_estimator_p"/> | |
518 </conditional> | |
519 <param name="cv" value="__import__('os').system('ls ~')"/> | |
520 <param name="infile1" value="regression_X.tabular" ftype="tabular"/> | |
521 <param name="header1" value="true" /> | |
522 <param name="selected_column_selector_option" value="all_columns"/> | |
523 <param name="infile2" value="regression_y.tabular" ftype="tabular"/> | |
524 <param name="header2" value="true" /> | |
525 <param name="selected_column_selector_option2" value="all_columns"/> | |
526 </test> | |
456 </tests> | 527 </tests> |
457 <help> | 528 <help> |
458 <![CDATA[ | 529 <![CDATA[ |
459 **What it does** | 530 **What it does** |
460 Searches optimized parameter values for an estimator or pipeline through either exhaustive grid cross validation search or Randomized cross validation search. | 531 Searches optimized parameter values for an estimator or pipeline through either exhaustive grid cross validation search or Randomized cross validation search. |