zoukankan      html  css  js  c++  java
  • 决策树

    # Train a decision-tree classifier on the sales data set and print its
    # accuracy, precision, recall and confusion matrix.
    import os

    import pandas as pd
    from sklearn import metrics
    from sklearn import tree

    try:
        # `sklearn.cross_validation` was removed in scikit-learn 0.20; the
        # splitter has lived in `model_selection` since 0.18.
        from sklearn.model_selection import train_test_split
    except ImportError:
        # Fallback for very old scikit-learn installs.
        from sklearn.cross_validation import train_test_split

    infile = 'sales_data.xls'
    # NOTE(review): the published listing read 'E:pycharmmachine learning',
    # i.e. the path separators appear to have been stripped. Restored here as
    # a raw string -- confirm against the real directory layout.
    os.chdir(r'E:\pycharm\machine learning')
    data = pd.read_excel(infile, index_col=u'序号')

    # Encode every cell as +1 (positive category) or -1 (anything else).
    # NOTE(review): the three comparison literals were empty strings in the
    # published listing, which matches nothing and turns the whole table into
    # -1. The values below are the positive categories used by the standard
    # `sales_data.xls` example (good weather / yes / high sales) -- confirm
    # against the actual workbook.
    positive_labels = (u'好', u'是', u'高')
    for label in positive_labels:
        data[data == label] = 1
    data[data != 1] = -1
    print(data.dtypes)
    print('----------------------------------------')
    # `.as_matrix()` was removed in pandas 1.0; `.values` works on every
    # pandas version. The last column is the target, the rest are features.
    x = data.iloc[:, :-1].values.astype(int)
    y = data.iloc[:, -1].values.astype(int)

    x_train, x_test, y_train, y_test = train_test_split(
        x, y, test_size=0.4, random_state=12345)
    print('-----------------------------')
    print('划分数据集:')
    print(y_train)
    print('-----------------------------')
    print(y_train.dtype)

    print('训练模型:')
    clt = tree.DecisionTreeClassifier()
    clt.fit(x_train, y_train)

    # Predict once and reuse the result instead of re-running the model for
    # every metric.
    train_pred = clt.predict(x_train)

    print('-----------------------------')
    print('准确率:{}'.format(metrics.accuracy_score(y_train, train_pred)))

    print('精确率:{}'.format(metrics.precision_score(y_train, train_pred)))

    print('召回率:{}'.format(metrics.recall_score(y_train, train_pred)))

    print(metrics.confusion_matrix(y_train, train_pred))  # confusion matrix

    print(train_pred)
    print('-------预测---------实际-------------')
    print(y_train)

    # The figures above are measured on the data the tree was fitted on, so
    # they say nothing about generalisation. Also score the 40% hold-out split
    # that was created above but previously never used.
    test_pred = clt.predict(x_test)
    print('-----------------------------')
    print('测试集准确率:{}'.format(metrics.accuracy_score(y_test, test_pred)))
    print('测试集精确率:{}'.format(metrics.precision_score(y_test, test_pred)))
    print('测试集召回率:{}'.format(metrics.recall_score(y_test, test_pred)))
    print(metrics.confusion_matrix(y_test, test_pred))
  • 相关阅读:
    贝叶斯定理
    用matplotlib统计数据并画图
    词云图
    一行python代码能写出啥?
    用python生成二维码
    18个python的高效编程技巧
    django简介
    vue点击变色
    selenium破解人人登陆验证码
    selenium请求豆瓣网
  • 原文地址:https://www.cnblogs.com/zft710/p/8898097.html
Copyright © 2011-2022 走看看