DT

751 ワード

    # Train and evaluate a decision-tree classifier on two features of the
    # data set stored in 'iris.data'.
    #
    # The file is read as a header-less CSV, so columns are addressed by
    # integer position.
    # NOTE(review): presumably the UCI Iris file (measurements in columns
    # 0-3, species name in column 4) -- confirm against the actual data.
    path = 'iris.data'
    data = pd.read_csv(path, header=None)

    # Only the first two columns are used as features.
    x = data[[0, 1]]
    # Encode the class labels in column 4 as integers
    # (pd.Categorical(data[4]).codes is an alternative way to obtain codes).
    y = LabelEncoder().fit_transform(data[4])

    # Keep 70% of the rows for training and the rest for testing; the fixed
    # seed makes the split reproducible.
    x_train, x_test, y_train, y_test = train_test_split(
        x, y, train_size=0.7, random_state=1)

    # Decision tree using entropy (information gain) as the split criterion.
    # Pruning-related parameters:
    #   min_samples_split: minimum number of samples a node must contain
    #       before it may be split further.
    #   min_samples_leaf: minimum number of samples required in a leaf; a
    #       candidate split is only considered if it leaves at least this
    #       many training samples in each branch.
    # random_state is fixed because scikit-learn permutes the features at
    # every split, so ties between equally good splits could otherwise be
    # broken differently from run to run.
    model = DecisionTreeClassifier(
        criterion='entropy', min_samples_leaf=3, random_state=1)
    model.fit(x_train, y_train)

    # Predict on the held-out rows and report the fraction classified
    # correctly.
    y_test_hat = model.predict(x_test)
    print('accuracy_score:', accuracy_score(y_test, y_test_hat))