import numpy as np
import matplotlib.pyplot as plt
import pandas as pd
import seaborn as sns
from sklearn.model_selection import train_test_split
from sklearn.metrics import accuracy_score
from sklearn.neighbors import KNeighborsClassifier
%matplotlib inlinedom
# 加载数据集
fruits_df = pd.read_table('fruit_data_with_colors.txt')ui
X = fruits_df[['mass', 'width', 'height', 'color_score']]
y = fruits_df['fruit_label']spa
# 分割数据集
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=1/4, random_state=0)pandas
# 创建模型
knn = KNeighborsClassifier(n_neighbors=5)it
# 训练模型
knn.fit(X_train, y_train)io
# 验证模型
y_pred = knn.predict(X_test)table
acc = accuracy_score(y_test, y_pred)
print('准确率:', acc)test
===================================import
准确率: 0.533333333333