import numpy as np

import matplotlib.pyplot as plt

from matplotlib.colors import ListedColormap

from sklearn import neighbors,datasets

# Load the iris dataset provided by sklearn.datasets.
iris = datasets.load_iris()

# Show the first five rows of the feature matrix.
print(iris.data[:5])

[[ 5.1  3.5  1.4  0.2]
 [ 4.9  3.   1.4  0.2]
 [ 4.7  3.2  1.3  0.2]
 [ 4.6  3.1  1.5  0.2]
 [ 5.   3.6  1.4  0.2]]

# Print the class label stored for every sample.
print(iris.target)

[0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0
 0 0 0 0 0 0 0 0 0 0 0 0 0 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1
 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 2 2 2 2 2 2 2 2 2 2 2
 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2
 2 2]

# Keep only the first two feature columns of the iris data as X.
X = iris.data[:, :2]

# Show the first five rows of the reduced feature matrix.
print(X[:5])

[[ 5.1  3.5]
 [ 4.9  3. ]
 [ 4.7  3.2]
 [ 4.6  3.1]
 [ 5.   3.6]]

# The class-label column becomes the target vector Y.
Y = iris.target

# Build a k-nearest-neighbours classifier that looks at the 15 closest samples
# and gives each of them the same ('uniform') weight, then train it on X and Y.
clf = neighbors.KNeighborsClassifier(n_neighbors=15, weights='uniform')
clf = clf.fit(X, Y)

print(clf)

KNeighborsClassifier(algorithm='auto', leaf_size=30, metric='minkowski',
           metric_params=None, n_jobs=1, n_neighbors=15, p=2,
           weights='uniform')

# Plotting: lay a dense grid over the feature plane and classify every node.

# Grid spacing along both axes.
h = 0.02

# Extend the observed range of each feature by one unit on either side so the
# grid reaches beyond the outermost samples.
x_min = X[:, 0].min() - 1
x_max = X[:, 0].max() + 1
y_min = X[:, 1].min() - 1
y_max = X[:, 1].max() + 1

# np.arange(start, stop, h) produces evenly spaced values beginning at start
# and stopping before stop.  np.meshgrid expands the two 1-D axes into a pair
# of 2-D coordinate matrices: xx repeats the x axis along rows, yy repeats the
# y axis along columns.
xx, yy = np.meshgrid(
    np.arange(x_min, x_max, h),
    np.arange(y_min, y_max, h),
)

# ravel() flattens each matrix to 1-D; stacking the two as columns yields one
# (x, y) row per grid node, which is what clf.predict() classifies.
Z = clf.predict(np.column_stack((xx.ravel(), yy.ravel())))

# Inspection of the intermediate arrays.  Each bare expression below is
# followed by the value echoed for it in the recorded session.

# x-coordinate matrix from meshgrid: every row repeats the same x values.
xx

array([[ 3.3 ,  3.32,  3.34, ...,  8.84,  8.86,  8.88],
       [ 3.3 ,  3.32,  3.34, ...,  8.84,  8.86,  8.88],
       [ 3.3 ,  3.32,  3.34, ...,  8.84,  8.86,  8.88],
       ..., 
       [ 3.3 ,  3.32,  3.34, ...,  8.84,  8.86,  8.88],
       [ 3.3 ,  3.32,  3.34, ...,  8.84,  8.86,  8.88],
       [ 3.3 ,  3.32,  3.34, ...,  8.84,  8.86,  8.88]])

# y-coordinate matrix from meshgrid: each row holds one y value repeated.
yy

array([[ 1.  ,  1.  ,  1.  , ...,  1.  ,  1.  ,  1.  ],
       [ 1.02,  1.02,  1.02, ...,  1.02,  1.02,  1.02],
       [ 1.04,  1.04,  1.04, ...,  1.04,  1.04,  1.04],
       ..., 
       [ 5.34,  5.34,  5.34, ...,  5.34,  5.34,  5.34],
       [ 5.36,  5.36,  5.36, ...,  5.36,  5.36,  5.36],
       [ 5.38,  5.38,  5.38, ...,  5.38,  5.38,  5.38]])

# The x matrix flattened to one dimension.
xx.ravel()

array([ 3.3 ,  3.32,  3.34, ...,  8.84,  8.86,  8.88])

# The y matrix flattened to one dimension.
yy.ravel()

array([ 1.  ,  1.  ,  1.  , ...,  5.38,  5.38,  5.38])

# The two flattened arrays joined column-wise: one (x, y) pair per row.
np.c_[xx.ravel(),yy.ravel()]

array([[ 3.3 ,  1.  ],
       [ 3.32,  1.  ],
       [ 3.34,  1.  ],
       ..., 
       [ 8.84,  5.38],
       [ 8.86,  5.38],
       [ 8.88,  5.38]])

# Predicted class for each grid point (still one-dimensional at this stage).
Z

array([0, 0, 0, ..., 2, 2, 2])

# Colour the plane according to the predicted class.

# Two three-colour palettes: a pale one and a saturated one.
camp_light = ListedColormap(['#FFAAAA', '#AAFFAA', '#AAAAFF'])
camp_bold = ListedColormap(['#FF0000', '#00FF00', '#0000FF'])

# Give the flat prediction vector the same 2-D shape as the coordinate grid.
Z = np.reshape(Z, xx.shape)

# Fill the grid with the pale colour of each node's predicted class.
plt.pcolormesh(xx, yy, Z, cmap=camp_light)

<matplotlib.collections.QuadMesh at 0xa1846d8>

# Draw every sample as a point coloured by its original class label.
plt.scatter(X[:,0],X[:,1],c=Y,cmap=camp_bold,marker='o')

<matplotlib.collections.PathCollection at 0xa184f60>

# Limit the x axis to the extent of the grid; the tuple that follows is the
# value echoed for this call in the recorded session.
plt.xlim(xx.min(),xx.max())

(3.2999999999999998, 8.8800000000000061)

# Limit the y axis to the extent of the grid; the tuple that follows is the
# value echoed for this call in the recorded session.
plt.ylim(yy.min(),yy.max())

(1.0, 5.3800000000000043)

# Title call left disabled: it formats `k_neighbors`, a name the visible script
# never defines, and it labels the weights as 'distance' although the
# classifier in this script is created with weights='uniform'.
#plt.title("3-Class classfication(k= % i,weights='distance')" % k_neighbors)

# Display the figure.
plt.show()

# Accuracy of the classifier on the samples it was trained on.
#
# The predictions have to be made for the training samples X themselves so
# that entry i of the prediction corresponds to iris.target[i].  Predicting on
# the plotting grid (np.c_[xx.ravel(), yy.ravel()]) and comparing its first
# len(iris.data) entries with the labels pairs unrelated grid points with
# sample labels, so the resulting ratio is not an accuracy.
Z1 = clf.predict(X)

# Count the matching predictions with one vectorised comparison; the count is
# kept as a float, as in the original loop.
correct = float(np.sum(Z1 == iris.target))

correct / len(iris.data)  # fraction of training samples classified correctly

# NOTE: the value 0.4666666666666667 echoed in the recorded session was
# produced by the grid-based comparison and does not describe this computation.

Scikit-Learn實戰KNN

Scikit-Learn總結

1.Scikit-Learn基本知識的瞭解

2.Scikit-Learn的六大功能

3.Scikit-Learn實戰KNNDemo