• Python随机森林算法的使用


    #coding:utf-8
    
    # from python.Lib.packages.sklearn.tree import DecisionTreeClassifier
    # from python.Lib.packages.matplotlib.pyplot import *
    # from python.Lib.packages.sklearn.cross_validation import train_test_split
    # from python.Lib.packages.sklearn.ensemble import RandomForestClassifier
    # from python.Lib.packages.sklearn.externals.joblib import Parallel,delayed
    # from python.Lib.packages.sklearn.tree import export_graphviz
    # from python.Lib.packages.sklearn.datasets import load_iris
    # import python.Lib.packages.pandas as pd
    
    
    from sklearn.tree import DecisionTreeClassifier
    from matplotlib.pyplot import *
    from sklearn.cross_validation import train_test_split
    from sklearn.ensemble import RandomForestClassifier
    from sklearn.externals.joblib import Parallel,delayed
    from sklearn.tree import export_graphviz
    from sklearn.datasets import load_iris
    import pandas as pd
    
    def RandomForest(dir):
        # final = open('F:/test/final.dat' , 'r')
        data=pd.read_csv(dir)
        # data = [line.strip().split('	') for line in final]
        feature=data[[i for i in range(8)]].values
        target=data[[8]].values
        # target1=[target[0][i] for i in range(len(target[0]))]
        # print feature
        # print target
        # feature = [[float(x) for x in row[3:]] for row in data]
        # target = [int(row[0]) for row in data]
    
        #拆分训练集和测试集
        # iris=load_iris()
        #
        # feature=iris.data
        # target=iris.target
        # print iris['target'].shape
        feature_train, feature_test, target_train, target_test = train_test_split(feature, target, test_size=0.1, random_state=42)
    
        #分类型决策树
        clf = RandomForestClassifier()
    
        #训练模型
        s = clf.fit(feature_train,target_train)
        print s
    
        #评估模型准确率
        r = clf.score(feature_test , target_test)
        print r
    
        print u'判定结果:%s' % clf.predict(feature_test[0])
        #print clf.predict_proba(feature_test[0])
    
        print u'所有的树:%s' % clf.estimators_
    
        print clf.classes_
        print clf.n_classes_
    
        print u'各feature的重要性:%s' % clf.feature_importances_
    if __name__=="__main__":
        dir="Carseats.csv"
        RandomForest(dir)
  • 相关阅读:
    验证码
    SQL给字段加上统一的某个字符
    科讯CMS V9标签清单
    需要重新启动计算机.必须重新启动计算机才能安装 SQL Server
    父页面iframe自动适应子页面的宽高度
    div随另一个div自动增高
    让图片在DIV中垂直居中
    nginx default server
    zabbix proxy 分布式监控
    openjdk tomcat 安装
  • 原文地址:https://www.cnblogs.com/wuchuanying/p/6228675.html
Copyright © 2020-2023  润新知