"""Learn the scikit-learn k-nearest-neighbours classifier API on the iris data.

The script loads the iris dataset, splits it into training and test sets,
standardises the features, fits a ``KNeighborsClassifier`` with its default
settings, and prints the test accuracy together with a per-class
classification report.
"""

from sklearn.datasets import load_iris
from sklearn.metrics import classification_report
from sklearn.neighbors import KNeighborsClassifier
from sklearn.preprocessing import StandardScaler

try:
    from sklearn.model_selection import train_test_split
except ImportError:
    # Legacy location, kept only as a fallback for old scikit-learn installs
    # that do not provide ``sklearn.model_selection``.
    from sklearn.cross_validation import train_test_split

# ---------------------------------------------------------------------------
# 1. Prepare the data
# ---------------------------------------------------------------------------
# Load the iris dataset.
iris = load_iris()
# Optional inspection helpers (left disabled, as in the original script):
# print(iris.data.shape)  # (150, 4)
# print(iris.DESCR)       # dataset description

# ---------------------------------------------------------------------------
# 2. Split into training and test sets
# ---------------------------------------------------------------------------
# Both the features and the labels must be passed: the call returns two
# arrays per input, and four names are unpacked here. A 25% test split
# matches the 38 test samples shown in the recorded output below.
x_train, x_test, y_train, y_test = train_test_split(
    iris.data,
    iris.target,
    test_size=0.25,
    random_state=33,
)

# ---------------------------------------------------------------------------
# 3. k-nearest-neighbours classifier: fit and predict
# ---------------------------------------------------------------------------
# Standardise the features. The scaler is fitted on the training data only and
# then reused on the test data, so both sets share the same transformation.
ss = StandardScaler()
x_train = ss.fit_transform(x_train)
x_test = ss.transform(x_test)

# Build a k-nearest-neighbours model with default parameters.
knc = KNeighborsClassifier()
# Fit the model on the training data.
knc.fit(x_train, y_train)
# Predict labels for the test data.
y_predict = knc.predict(x_test)

# ---------------------------------------------------------------------------
# 4. Evaluate the model
# ---------------------------------------------------------------------------
print("准确率:", knc.score(x_test, y_test))
print("其他指标:\n", classification_report(y_test, y_predict, target_names=iris.target_names))

# Output recorded by the original author (the exact report layout may differ
# between scikit-learn versions):
#
# 准确率: 0.8947368421052632
#              precision    recall  f1-score   support
#
#      setosa       1.00      1.00      1.00         8
#  versicolor       0.73      1.00      0.85        11
#   virginica       1.00      0.79      0.88        19
#
# avg / total       0.92      0.89      0.90        38


