# DT (decision tree)
# 751 words
# Train a decision-tree classifier on the first two columns of the data file
# and print its accuracy on a held-out test split.
# NOTE(review): 'iris.data' is presumably the UCI Iris file (columns 0-3 are
# measurements, column 4 is the species label) -- confirm against the data.
path = 'iris.data'  # resolved relative to the current working directory
# header=None: the first row is data, so columns get integer labels 0..n-1.
data = pd.read_csv(path, header=None)

# Features: only the first two columns are used for training.
x = data[[0, 1]]
# Target: map the labels in column 4 to integer class ids.
y = LabelEncoder().fit_transform(data[4])

# Keep 70% of the rows for training; the fixed seed makes the split repeatable.
x_train, x_test, y_train, y_test = train_test_split(
    x, y, train_size=0.7, random_state=1
)

# Pre-pruning parameters of the tree:
#   min_samples_split: a node is only considered for splitting if it holds
#       at least this many samples (left at its default here).
#   min_samples_leaf: a split is only considered if every resulting child
#       keeps at least this many training samples.
# random_state is fixed as well: scikit-learn permutes the features at every
# split, so without a seed ties between equally good splits can be broken
# differently from run to run and the reported accuracy may vary.
model = DecisionTreeClassifier(
    criterion='entropy', min_samples_leaf=3, random_state=1
)
model.fit(x_train, y_train)

# Predict on the held-out rows and report the fraction classified correctly.
y_test_hat = model.predict(x_test)
print('accuracy_score:', accuracy_score(y_test, y_test_hat))