codingLv
diff --git a/‎LogisticRegression/LogisticRegression_OneVsAll.py‎
Lines changed: 25 additions & 15 deletions b/‎LogisticRegression/LogisticRegression_OneVsAll.py‎
Lines changed: 25 additions & 15 deletions
diff --git a/‎LogisticRegression/LogisticRegression_OneVsAll_scikit-learn.py‎
Lines changed: 27 additions & 0 deletions b/‎LogisticRegression/LogisticRegression_OneVsAll_scikit-learn.py‎
Lines changed: 27 additions & 0 deletions
diff --git a/‎LogisticRegression/class_y.csv‎
Lines changed: 600 additions & 0 deletions b/‎LogisticRegression/class_y.csv‎
Lines changed: 600 additions & 0 deletions
diff --git a/‎images/LogisticRegression_08.png‎
153 KB b/‎images/LogisticRegression_08.png‎
153 KB
diff --git a/‎images/LogisticRegression_09.png‎
85 KB b/‎images/LogisticRegression_09.png‎
85 KB
diff --git a/‎images/LogisticRegression_10.png‎
17.5 KB b/‎images/LogisticRegression_10.png‎
17.5 KB
diff --git a/‎images/LogisticRegression_11.png‎
10.4 KB b/‎images/LogisticRegression_11.png‎
10.4 KB
diff --git a/‎images/LogisticRegression_12.png‎
32.4 KB b/‎images/LogisticRegression_12.png‎
32.4 KB
diff --git a/‎images/LogisticRegression_13.png‎
5.45 KB b/‎images/LogisticRegression_13.png‎
5.45 KB
diff --git a/‎readme.md‎
Lines changed: 138 additions & 2 deletions b/‎readme.md‎
Lines changed: 138 additions & 2 deletions
@@ -12,8 +12,9 @@ def logisticRegression_OneVsAll():
     X = data['X']   # 获取X数据，每一行对应一个数字20x20px
     y = data['y']
     m,n = X.shape
-    num_labels = 10
+    num_labels = 10 # 数字个数，0-9
 
+    ##　随机显示几行数据
     rand_indices = [t for t in [np.random.randint(x-x, m) for x in range(100)]]  # 生成100个0-m的随机数
     display_data(X[rand_indices,:])     # 显示100个数字
 
@@ -32,36 +33,45 @@ def logisticRegression_OneVsAll():
 def loadmat_data(fileName):
     return spio.loadmat(fileName)
 
-# 显示10个数字
+# 显示100个数字
 def display_data(imgData):
     sum = 0
-    display_array = np.ones((200,200))
+    '''
+    显示100个数（若是一个一个绘制将会非常慢，可以将要画的数字整理好，放到一个矩阵中，显示这个矩阵即可）
+    - 初始化一个二维数组
+    - 将每行的数据调整成图像的矩阵，放进二维数组
+    - 显示即可
+    '''
+    pad = 1
+    display_array = -np.ones((pad+10*(20+pad),pad+10*(20+pad)))
     for i in range(10):
         for j in range(10):
-            display_array[i*20:(i+1)*20,j*20:(j+1)*20] = imgData[sum,:].reshape(20,20)
+            display_array[pad+i*(20+pad):pad+i*(20+pad)+20,pad+j*(20+pad):pad+j*(20+pad)+20] = (imgData[sum,:].reshape(20,20,order="F"))    # order=F指定以列优先，在matlab中是这样的，python中需要指定，默认以行
             sum += 1
 
-    plt.imshow(display_array,cmap='gray')
+    plt.imshow(display_array,cmap='gray')   #显示灰度图像
     plt.axis('off')
     plt.show()
 
-# 求每个分类的theta    
+# 求每个分类的theta，最后返回所有的all_theta    
 def oneVsAll(X,y,num_labels,Lambda):
     # 初始化变量
     m,n = X.shape
-    all_theta = np.zeros((n+1,num_labels))
-    X = np.hstack((np.ones((m,1)),X))
-    class_y = np.zeros((m,num_labels))
-    initial_theta = np.zeros((n+1,1))
+    all_theta = np.zeros((n+1,num_labels))  # 每一列对应相应分类的theta,共10列
+    X = np.hstack((np.ones((m,1)),X))       # X前补上一列1的偏置bias
+    class_y = np.zeros((m,num_labels))      # 数据的y对应0-9，需要映射为0/1的关系
+    initial_theta = np.zeros((n+1,1))       # 初始化一个分类的theta
 
-    # 格式化y，将y两两分类
+    # 映射y
     for i in range(num_labels):
-        class_y[:,i] = np.int32(y==i).reshape(1,-1)
+        class_y[:,i] = np.int32(y==i).reshape(1,-1) # 注意reshape(1,-1)才可以赋值
+    
+    #np.savetxt("class_y.csv", class_y[0:600,:], delimiter=',')    
 
+    '''遍历每个分类，计算对应的theta值'''
     for i in range(num_labels):
-        #all_theta[:,i] = optimize.fmin(costFunction,initial_theta,args=(X,class_y[:,i].reshape(-1,1),Lambda),maxiter=50)
-        result = optimize.fmin_bfgs(costFunction, initial_theta, fprime=gradient, args=(X,class_y[:,i],Lambda))
-        all_theta[:,i] = result.reshape(1,-1)
+        result = optimize.fmin_bfgs(costFunction, initial_theta, fprime=gradient, args=(X,class_y[:,i],Lambda)) # 调用梯度下降的优化方法
+        all_theta[:,i] = result.reshape(1,-1)   # 放入all_theta中
 
     all_theta = np.transpose(all_theta) 
     return all_theta
 
@@ -0,0 +1,27 @@
+#-*- coding: utf-8 -*-
+from scipy import io as spio
+import numpy as np
+from sklearn import svm
+from sklearn.linear_model import LogisticRegression
+
+
+
+def logisticRegression_oneVsAll():
+    data = loadmat_data("data_digits.mat") 
+    X = data['X']   # 获取X数据，每一行对应一个数字20x20px
+    y = data['y']   # 这里读取mat文件y的shape=(5000, 1)
+    y = np.ravel(y) # 调用sklearn需要转化成一维的(5000,)
+    
+    model = LogisticRegression()
+    model.fit(X, y) # 拟合
+    
+    predict = model.predict(X) #预测
+    
+    print u"预测准确度为：%f%%"%np.mean(np.float64(predict == y)*100)
+
+# 加载mat文件
+def loadmat_data(fileName):
+    return spio.loadmat(fileName)
+
+if __name__ == "__main__":
+    logisticRegression_oneVsAll()
@@ -106,7 +106,7 @@ from sklearn.preprocessing import StandardScaler    #引入缩放的包
     result = model.predict(x_test)
 ```
 
-## 二、逻辑回归
+## 二、[逻辑回归](/LogisticRegression)
 - [全部代码](/LogisticRegression/LogisticRegression.py)
 
 ### 1、代价函数
@@ -256,11 +256,147 @@ import numpy as np
 ```
 
 
+-------------
+
+ ## [逻辑回归_手写数字识别_OneVsAll](/LogisticRegression)
+- [全部代码](/LogisticRegression/LogisticRegression_OneVsAll.py)
+
+### 1、随机显示100个数字
+- 我没有使用scikit-learn中的数据集，像素是20*20px，彩色图如下
+![enter description here][9]
+灰度图：
+![enter description here][10]
+- 实现代码：
+```
+# 显示100个数字
+def display_data(imgData):
+    sum = 0
+    '''
+    显示100个数（若是一个一个绘制将会非常慢，可以将要画的数字整理好，放到一个矩阵中，显示这个矩阵即可）
+    - 初始化一个二维数组
+    - 将每行的数据调整成图像的矩阵，放进二维数组
+    - 显示即可
+    '''
+    pad = 1
+    display_array = -np.ones((pad+10*(20+pad),pad+10*(20+pad)))
+    for i in range(10):
+        for j in range(10):
+            display_array[pad+i*(20+pad):pad+i*(20+pad)+20,pad+j*(20+pad):pad+j*(20+pad)+20] = (imgData[sum,:].reshape(20,20,order="F"))    # order=F指定以列优先，在matlab中是这样的，python中需要指定，默认以行
+            sum += 1
+            
+    plt.imshow(display_array,cmap='gray')   #显示灰度图像
+    plt.axis('off')
+    plt.show()
+```
+
+### 2、OneVsAll
+- 如何利用逻辑回归解决多分类的问题，OneVsAll就是把当前某一类看成一类，其他所有类别看作一类，这样有成了二分类的问题了
+- 如下图，把途中的数据分成三类，先把红色的看成一类，把其他的看作另外一类，进行逻辑回归，然后把蓝色的看成一类，其他的再看成一类，以此类推...
+![enter description here][11]
+- 可以看出大于2类的情况下，有多少类就要进行多少次的逻辑回归分类
+
+### 3、手写数字识别
+- 共有0-9，10个数字，需要10次分类
+- 由于**数据集y**给出的是`0,1,2...9`的数字，而进行逻辑回归需要`0/1`的label标记，所以需要对y处理
+- 说一下数据集，前`500`个是`0`,`500-1000`是`1`,`...`,所以如下图，处理后的`y`，**前500行的第一列是1，其余都是0,500-1000行第二列是1，其余都是0....**
+![enter description here][12]
+- 然后调用**梯度下降算法**求解`theta`
+- 实现代码：
+```
+# 求每个分类的theta，最后返回所有的all_theta    
+def oneVsAll(X,y,num_labels,Lambda):
+    # 初始化变量
+    m,n = X.shape
+    all_theta = np.zeros((n+1,num_labels))  # 每一列对应相应分类的theta,共10列
+    X = np.hstack((np.ones((m,1)),X))       # X前补上一列1的偏置bias
+    class_y = np.zeros((m,num_labels))      # 数据的y对应0-9，需要映射为0/1的关系
+    initial_theta = np.zeros((n+1,1))       # 初始化一个分类的theta
+    
+    # 映射y
+    for i in range(num_labels):
+        class_y[:,i] = np.int32(y==i).reshape(1,-1) # 注意reshape(1,-1)才可以赋值
+    
+    #np.savetxt("class_y.csv", class_y[0:600,:], delimiter=',')    
+    
+    '''遍历每个分类，计算对应的theta值'''
+    for i in range(num_labels):
+        result = optimize.fmin_bfgs(costFunction, initial_theta, fprime=gradient, args=(X,class_y[:,i],Lambda)) # 调用梯度下降的优化方法
+        all_theta[:,i] = result.reshape(1,-1)   # 放入all_theta中
+        
+    all_theta = np.transpose(all_theta) 
+    return all_theta
+```
+
+### 4、预测
+- 之前说过，预测的结果是一个**概率值**，利用学习出来的`theta`代入预测的**S型函数**中，每行的最大值就是是某个数字的最大概率，所在的**列号**就是预测的数字的真实值,因为在分类时，所有为`0`的将`y`映射在第一列，为1的映射在第二列，依次类推
+- 实现代码：
+```
+# 预测
+def predict_oneVsAll(all_theta,X):
+    m = X.shape[0]
+    num_labels = all_theta.shape[0]
+    p = np.zeros((m,1))
+    X = np.hstack((np.ones((m,1)),X))   #在X最前面加一列1
+    
+    h = sigmoid(np.dot(X,np.transpose(all_theta)))  #预测
+
+    '''
+    返回h中每一行最大值所在的列号
+    - np.max(h, axis=1)返回h中每一行的最大值（是某个数字的最大概率）
+    - 最后where找到的最大概率所在的列号（列号即是对应的数字）
+    '''
+    p = np.array(np.where(h[0,:] == np.max(h, axis=1)[0]))  
+    for i in np.arange(1, m):
+        t = np.array(np.where(h[i,:] == np.max(h, axis=1)[i]))
+        p = np.vstack((p,t))
+    return p
+```
+
+### 5、运行结果
+- 10次分类，在训练集上的准确度：
+![enter description here][13]
+
+### 6、[使用scikit-learn库中的逻辑回归模型实现](/LogisticRegression/LogisticRegression_OneVsAll_scikit-learn.py)
+- 1、导入包
+```
+from scipy import io as spio
+import numpy as np
+from sklearn import svm
+from sklearn.linear_model import LogisticRegression
+```
+- 2、加载数据
+```
+    data = loadmat_data("data_digits.mat") 
+    X = data['X']   # 获取X数据，每一行对应一个数字20x20px
+    y = data['y']   # 这里读取mat文件y的shape=(5000, 1)
+    y = np.ravel(y) # 调用sklearn需要转化成一维的(5000,)
+```
+- 3、拟合模型
+```
+    model = LogisticRegression()
+    model.fit(X, y) # 拟合
+```
+- 4、预测
+```
+    predict = model.predict(X) #预测
+    
+    print u"预测准确度为：%f%%"%np.mean(np.float64(predict == y)*100)
+```
+- 5、输出结果（在训练集上的准确度）
+![enter description here][14]
+
+
   [1]: ./images/LinearRegression_01.png "LinearRegression_01.png"
   [2]: ./images/LogisticRegression_01.png "LogisticRegression_01.png"
   [3]: ./images/LogisticRegression_02.png "LogisticRegression_02.png"
   [4]: ./images/LogisticRegression_03.jpg "LogisticRegression_03.jpg"
   [5]: ./images/LogisticRegression_04.png "LogisticRegression_04.png"
   [6]: ./images/LogisticRegression_05.png "LogisticRegression_05.png"
   [7]: ./images/LogisticRegression_06.png "LogisticRegression_06.png"
-  [8]: ./images/LogisticRegression_07.png "LogisticRegression_07.png"
+  [8]: ./images/LogisticRegression_07.png "LogisticRegression_07.png"
+  [9]: ./images/LogisticRegression_08.png "LogisticRegression_08.png"
+  [10]: ./images/LogisticRegression_09.png "LogisticRegression_09.png"
+  [11]: ./images/LogisticRegression_11.png "LogisticRegression_11.png"
+  [12]: ./images/LogisticRegression_10.png "LogisticRegression_10.png"
+  [13]: ./images/LogisticRegression_12.png "LogisticRegression_12.png"
+  [14]: ./images/LogisticRegression_13.png "LogisticRegression_13.png"