import numpy as np

# Feature rows ([x0, x1, x2]) and their integer class labels, filled in
# parallel while the data file is read.
data_arr = []
label_arr = []
# `with` guarantees the file handle is closed, even if a row fails to parse.
with open('D:\\mlInAction\\data\\5.Logistic\\TestSet.txt', 'r') as f:
    # Iterate the file lazily instead of materialising it with readlines().
    for line in f:
        line_arr = line.strip().split()
        if not line_arr:
            # Skip blank lines (e.g. a trailing newline at the end of the file).
            continue
        # Prepend a constant 1.0 as x0 to every row to simplify the later
        # matrix computations.
        # The builtin float replaces np.float, an alias removed in NumPy 1.24.
        data_arr.append([1.0, float(line_arr[0]), float(line_arr[1])])
        label_arr.append(int(line_arr[2]))

# Bare expression: presumably a notebook cell echo of the loaded feature rows
# (it has no effect when the file is run as a script).
data_arr

[[1.0, -0.017612, 14.053064],
 [1.0, -1.395634, 4.662541],
 [1.0, -0.752157, 6.53862],
 [1.0, -1.322371, 7.152853],
 [1.0, 0.423363, 11.054677],
 [1.0, 0.406704, 7.067335],
 [1.0, 0.667394, 12.741452],
 [1.0, -2.46015, 6.866805],
 [1.0, 0.569411, 9.548755],
 [1.0, -0.026632, 10.427743],
 [1.0, 0.850433, 6.920334],
 [1.0, 1.347183, 13.1755],
 [1.0, 1.176813, 3.16702],
 [1.0, -1.781871, 9.097953],
 [1.0, -0.566606, 5.749003],
 [1.0, 0.931635, 1.589505],
 [1.0, -0.024205, 6.151823],
 [1.0, -0.036453, 2.690988],
 [1.0, -0.196949, 0.444165],
 [1.0, 1.014459, 5.754399],
 [1.0, 1.985298, 3.230619],
 [1.0, -1.693453, -0.55754],
 [1.0, -0.576525, 11.778922],
 [1.0, -0.346811, -1.67873],
 [1.0, -2.124484, 2.672471],
 [1.0, 1.217916, 9.597015],
 [1.0, -0.733928, 9.098687],
 [1.0, -3.642001, -1.618087],
 [1.0, 0.315985, 3.523953],
 [1.0, 1.416614, 9.619232],
 [1.0, -0.386323, 3.989286],
 [1.0, 0.556921, 8.294984],
 [1.0, 1.224863, 11.58736],
 [1.0, -1.347803, -2.406051],
 [1.0, 1.196604, 4.951851],
 [1.0, 0.275221, 9.543647],
 [1.0, 0.470575, 9.332488],
 [1.0, -1.889567, 9.542662],
 [1.0, -1.527893, 12.150579],
 [1.0, -1.185247, 11.309318],
 [1.0, -0.445678, 3.297303],
 [1.0, 1.042222, 6.105155],
 [1.0, -0.618787, 10.320986],
 [1.0, 1.152083, 0.548467],
 [1.0, 0.828534, 2.676045],
 [1.0, -1.237728, 10.549033],
 [1.0, -0.683565, -2.166125],
 [1.0, 0.229456, 5.921938],
 [1.0, -0.959885, 11.555336],
 [1.0, 0.492911, 10.993324],
 [1.0, 0.184992, 8.721488],
 [1.0, -0.355715, 10.325976],
 [1.0, -0.397822, 8.058397],
 [1.0, 0.824839, 13.730343],
 [1.0, 1.507278, 5.027866],
 [1.0, 0.099671, 6.835839],
 [1.0, -0.344008, 10.717485],
 [1.0, 1.785928, 7.718645],
 [1.0, -0.918801, 11.560217],
 [1.0, -0.364009, 4.7473],
 [1.0, -0.841722, 4.119083],
 [1.0, 0.490426, 1.960539],
 [1.0, -0.007194, 9.075792],
 [1.0, 0.356107, 12.447863],
 [1.0, 0.342578, 12.281162],
 [1.0, -0.810823, -1.466018],
 [1.0, 2.530777, 6.476801],
 [1.0, 1.296683, 11.607559],
 [1.0, 0.475487, 12.040035],
 [1.0, -0.783277, 11.009725],
 [1.0, 0.074798, 11.02365],
 [1.0, -1.337472, 0.468339],
 [1.0, -0.102781, 13.763651],
 [1.0, -0.147324, 2.874846],
 [1.0, 0.518389, 9.887035],
 [1.0, 1.015399, 7.571882],
 [1.0, -1.658086, -0.027255],
 [1.0, 1.319944, 2.171228],
 [1.0, 2.056216, 5.019981],
 [1.0, -0.851633, 4.375691],
 [1.0, -1.510047, 6.061992],
 [1.0, -1.076637, -3.181888],
 [1.0, 1.821096, 10.28399],
 [1.0, 3.01015, 8.401766],
 [1.0, -1.099458, 1.688274],
 [1.0, -0.834872, -1.733869],
 [1.0, -0.846637, 3.849075],
 [1.0, 1.400102, 12.628781],
 [1.0, 1.752842, 5.468166],
 [1.0, 0.078557, 0.059736],
 [1.0, 0.089392, -0.7153],
 [1.0, 1.825662, 12.693808],
 [1.0, 0.197445, 9.744638],
 [1.0, 0.126117, 0.922311],
 [1.0, -0.679797, 1.22053],
 [1.0, 0.677983, 2.556666],
 [1.0, 0.761349, 10.693862],
 [1.0, -2.168791, 0.143632],
 [1.0, 1.38861, 9.341997],
 [1.0, 0.317029, 14.739025]]

# Bare expression: presumably a notebook cell echo of the loaded class labels
# (it has no effect when the file is run as a script).
label_arr

[0,
 1,
 0,
 0,
 0,
 1,
 0,
 1,
 0,
 0,
 1,
 0,
 1,
 0,
 1,
 1,
 1,
 1,
 1,
 1,
 1,
 1,
 0,
 1,
 1,
 0,
 0,
 1,
 1,
 0,
 1,
 1,
 0,
 1,
 1,
 0,
 0,
 0,
 0,
 0,
 1,
 1,
 0,
 1,
 1,
 0,
 1,
 1,
 0,
 0,
 0,
 0,
 0,
 0,
 1,
 1,
 0,
 1,
 0,
 1,
 1,
 1,
 0,
 0,
 0,
 1,
 1,
 0,
 0,
 0,
 0,
 1,
 0,
 1,
 0,
 0,
 1,
 1,
 1,
 1,
 0,
 1,
 0,
 1,
 1,
 1,
 1,
 0,
 1,
 1,
 1,
 0,
 0,
 1,
 1,
 1,
 0,
 1,
 0,
 0]

def sigmoid(x):
    """
    Logistic function 1 / (1 + exp(-x)), evaluated without overflow.

    The textbook form computes np.exp(-x) directly; for a very negative x
    (e.g. -6000) that exponent overflows and NumPy emits
    "RuntimeWarning: overflow encountered in exp". Here the identity
    sigmoid(x) = exp(-log(1 + exp(-x))) is used instead, with
    np.logaddexp(0, -x) evaluating log(1 + exp(-x)) stably, so large
    magnitudes saturate to 0.0 / 1.0 without an overflow.

    :param x: a scalar, ndarray or np.matrix (anything supporting unary minus)
    :return: the element-wise sigmoid of x, in the same container type that
             NumPy ufuncs return for x
    """
    return np.exp(-np.logaddexp(0, -x))

def grad_ascent(data_arr, class_labels, alpha=0.001, max_cycles=500):
    """
    Batch gradient ascent for logistic regression.

    Every iteration uses the whole data set: it computes the sigmoid of the
    current linear scores, takes the residual against the labels and moves
    the weights along data^T * residual (the gradient of the log-likelihood;
    see the maximum-likelihood derivation for why this form is correct).

    :param data_arr: m x n samples, a nested list or a 2-D ndarray
    :param class_labels: the m class labels as a flat sequence; it is turned
                    into a 1 x m matrix and transposed into an m x 1 column
                    so it lines up with the predictions
    :param alpha: learning rate (step size of each update)
    :param max_cycles: number of full-batch iterations; there is no
                    convergence test, the loop always runs this many times
    :return: the n x 1 regression coefficients (an np.matrix once at least
             one iteration has run)
    """
    # np.asmatrix replaces np.mat, an alias that was removed in NumPy 2.0.
    data_mat = np.asmatrix(data_arr)
    label_mat = np.asmatrix(class_labels).transpose()
    # Only the feature count is needed to size the weight vector.
    _, n = np.shape(data_mat)
    # Start from all-ones coefficients, one per feature.
    weights = np.ones((n, 1))
    for _ in range(max_cycles):
        # Matrix product: (m x n) * (n x 1) -> m x 1 predicted probabilities.
        h = sigmoid(data_mat * weights)
        error = label_mat - h
        # Already-differentiated update rule: step along data^T * error.
        weights = weights + alpha * data_mat.transpose() * error
    return weights

# Fit the regression coefficients with batch gradient ascent on the loaded data.
weights = grad_ascent(data_arr, label_arr)
# Bare expression: presumably a notebook cell echo of the fitted weights.
weights

matrix([[ 4.12414349],
        [ 0.48007329],
        [-0.6168482 ]])

import matplotlib.pyplot as plt


def plot_best_fit(data_mat, label_mat, weights):
    """
    Scatter the samples by class and draw the fitted decision boundary.

    :param data_mat: samples whose rows are [x0, x1, x2]; columns 1 and 2
                     are used as the plot coordinates
    :param label_mat: one label per sample; samples whose label converts to
                      the integer 1 are drawn as black triangles, all others
                      as red squares
    :param weights: the three coefficients w0, w1, w2 of the boundary
    :return: None (the figure is shown with plt.show())
    """
    points = np.array(data_mat)
    sample_count = np.shape(data_mat)[0]
    # One (xs, ys) pair of coordinate lists per class.
    positives = ([], [])
    negatives = ([], [])
    for idx in range(sample_count):
        xs, ys = positives if int(label_mat[idx]) == 1 else negatives
        xs.append(points[idx, 1])
        ys.append(points[idx, 2])

    figure = plt.figure()
    axes = figure.add_subplot(111)
    axes.scatter(positives[0], positives[1], s=30, color='k', marker='^')
    axes.scatter(negatives[0], negatives[1], s=30, color='red', marker='s')

    # The boundary is where the linear score is zero. With x0 fixed at 1:
    #   w0 + w1 * x + w2 * y = 0   =>   y = (-w0 - w1 * x) / w2
    # where x is feature 1 (horizontal axis) and y is feature 2 (vertical).
    w0, w1, w2 = weights[0], weights[1], weights[2]
    x = np.arange(-3.0, 3.0, 0.1)
    boundary = (-w0 - w1 * x) / w2
    # The result may be two-dimensional (e.g. for matrix weights); flatten
    # it to 1-D so it can be plotted against x.
    boundary = np.ravel(boundary)
    axes.plot(x, boundary)

    plt.xlabel('x1')
    plt.ylabel('y1')
    plt.show()

# Plot the samples together with the boundary given by the batch-trained weights.
plot_best_fit(data_arr, label_arr, weights)

def stoc_grad_ascent0(data_mat, class_labels):
    """
    Stochastic gradient ascent: one pass over the data, updating the
    regression coefficients from a single sample at a time, in order.

    :param data_mat: the sample features (no label column), as an ndarray
    :param class_labels: the class label of each sample
    :return: the regression coefficients after the single pass
    """
    _, feature_count = np.shape(data_mat)
    step = 0.01
    coeffs = np.ones(feature_count)
    for row_idx, sample in enumerate(data_mat):
        # The linear score w1*x1 + ... + wn*xn for this one sample, so the
        # prediction is a single number rather than a matrix.
        score = sum(sample * coeffs)
        predicted = sigmoid(score)
        residual = class_labels[row_idx] - predicted
        # Same update rule as the batch version, applied to one sample.
        coeffs = coeffs + step * residual * sample
    return coeffs

def stoc_grad_ascent1(data_mat, class_labels, num_iter=150):
    """
    Improved stochastic gradient ascent: in every pass the samples are
    visited in random order without replacement, and the step size shrinks
    as training progresses.

    :param data_mat: the sample features (no label column), as an ndarray
    :param class_labels: the class label of each sample
    :param num_iter: number of passes over the data
    :return: the regression coefficients after all passes
    """
    sample_count, feature_count = np.shape(data_mat)
    coeffs = np.ones(feature_count)
    for epoch in range(num_iter):
        # Must be a real list (not a range) so that entries can be removed.
        remaining = list(range(sample_count))
        for step_no in range(sample_count):
            # The step size decays as epoch and step_no grow, but the +0.01
            # term keeps it from ever reaching zero.
            alpha = 4 / (1.0 + epoch + step_no) + 0.01
            # Draw a random position among the samples not yet used in this
            # pass by truncating a uniform float drawn from 0..len(remaining).
            pick = int(np.random.uniform(0, len(remaining)))
            # Removing the drawn entry makes the sampling without replacement.
            sample_idx = remaining.pop(pick)
            sample = data_mat[sample_idx]
            predicted = sigmoid(np.sum(sample * coeffs))
            residual = class_labels[sample_idx] - predicted
            coeffs = coeffs + alpha * residual * data_mat[sample_idx]
    return coeffs

# Fit the coefficients with the improved stochastic gradient ascent; the
# plain lists are converted to ndarrays first.
weights1 = stoc_grad_ascent1(np.array(data_arr), np.array(label_arr))
# Bare expression: presumably a notebook cell echo of the fitted weights.
weights1

array([13.97204276,  1.24615972, -1.9102347 ])

# Plot the samples together with the boundary given by the stochastic weights.
plot_best_fit(data_arr, label_arr, weights1)

05機器學習實戰之Logistic 迴歸

Logistic 迴歸概述

須知概念

Sigmoid 函數

迴歸概念

二值型輸出分類函數

基於最優化方法的迴歸係數確定

梯度上升法

梯度上升法的思想

Logistic 迴歸原理

Logistic 迴歸工作原理

Logistic 迴歸開發流程

Logistic 迴歸算法特點

附加方向導數與梯度

Logistic 迴歸項目案例

項目概述

開發流程

注意

05機器學習實戰之Logistic 迴歸

Logistic 迴歸 概述

須知概念

Sigmoid 函數

迴歸 概念

二值型輸出分類函數

基於最優化方法的迴歸係數確定

梯度上升法

梯度上升法的思想

Logistic 迴歸 原理

Logistic 迴歸 工作原理

Logistic 迴歸 開發流程

Logistic 迴歸 算法特點

附加 方向導數與梯度

Logistic 迴歸 項目案例

項目概述

開發流程

注意

Logistic 迴歸概述

迴歸概念

Logistic 迴歸原理

Logistic 迴歸工作原理

Logistic 迴歸開發流程

Logistic 迴歸算法特點

附加方向導數與梯度

Logistic 迴歸項目案例