zoukankan html css js c++ java

封装GridSearchCV的训练包

import xgboost as xgb
from sklearn.model_selection import GridSearchCV
from sklearn.metrics import make_scorer
from sklearn.metrics import accuracy_score
from sklearn.datasets import load_breast_cancer  
from sklearn.model_selection import train_test_split
from sklearn.model_selection import ParameterGrid
from sklearn.model_selection import ParameterSampler
from scipy.stats.distributions import expon
import numpy as np



#从给定分布中生成采样参数
np.random.seed(0)
param = {"a":[1,2],"b":expon()}
param = list(ParameterSampler(param,n_iter=4))



##################################################################################


def get_model_GridSearchCV(estimator,parameters,X_train,y_train,scoring,cv=5): 
    """
    return:返回训练过的最好模型
    """
    
    #refit:Refit an estimator using the best found parameters on the whole dataset.
    model = GridSearchCV(estimator=estimator,param_grid=parameters,scoring=scoring,cv=5,refit=True)    
    
    model.fit(X_train, y_train)
    
    #打印结果
    print("best score in GridSearchCV:
",model.best_score_)
    print("best param in GridSearchCV:
",model.best_params_)     
    
    return model.best_estimator_


#########################################测试########################################

X,y = load_breast_cancer(return_X_y=True)  

#分隔训练集和测试集
X_train,X_test,y_train,y_test = train_test_split(X,y,test_size=0.3,random_state=0,stratify=y)

#配置参数
param = [{
         "learning_rate":[0.1,0.3,0.6],
         "max_depth":[5,6,7],
         "n_estimators":[100,200,300], 
        }]


#scoring = make_scorer(accuracy_score, greater_is_better=True)

estimator = xgb.XGBClassifier(objective="reg:logistic")

#训练模型
model = get_model_GridSearchCV(estimator=estimator,
                               parameters=param,
                               cv=5,
                               X_train=X_train,
                               y_train=y_train,
                               scoring="roc_auc")

#采用训练得模型做测试
"""
decision_function(*args, **kwargs)    Call decision_function on the estimator with the best found parameters.
fit(X[, y, groups])    Run fit with all sets of parameters.
get_params([deep])    Get parameters for this estimator.
inverse_transform(*args, **kwargs)    Call inverse_transform on the estimator with the best found params.
predict(*args, **kwargs)    Call predict on the estimator with the best found parameters.
predict_log_proba(*args, **kwargs)    Call predict_log_proba on the estimator with the best found parameters.
predict_proba(*args, **kwargs)    Call predict_proba on the estimator with the best found parameters.
score(X[, y])    Returns the score on the given data, if the estimator has been refit.
set_params(**params)    Set the parameters of this estimator.
transform(*args, **kwargs)    Call transform on the estimator with the best found parameters.
"""
y_pred = model.predict(X_test)

#模型评价
print(accuracy_score(y_test,y_pred))

查看全文

相关阅读:
一个想法开发与业务，我们互相依赖
 vs2005中文包，和sqlserver2005中文开发版
 C中的指针
 建立一个新的web Site
Visual Studio 2005 中的新增安全性功能
 htm和html的区别
 完美实现导航滑动功能
 如何避免AJAX的缓存问题
 两个常用的稳定的远端CDN jquery
推荐一个CSS排错的网址

原文地址：https://www.cnblogs.com/wzdLY/p/9840192.html