digits: Clean up code a bit

2015-11-06 00:59:03 +01:00 · 2015-11-06 00:59:03 +01:00 · 6f6d06ec91
commit 6f6d06ec91
parent 347f9edc8d
1 changed files with 46 additions and 32 deletions
--- a/digits.py
+++ b/digits.py
@ -1,11 +1,12 @@
 #!/usr/bin/env python
 # vim:tabstop=4 shiftwidth=4 tw=79:
 '''
 SVM, Random forest and KNearest digit recognition.
 Modified from the OpenCV example.
-Sample loads a dataset of handwritten digits from '../data/digits.png'.
+Sample loads a dataset of handwritten digits from '../data/digits.png'.  Then
-Then it trains a Random Forest, SVM and KNearest classifiers on it and evaluates
+it trains a Random Forest, SVM and KNearest classifiers on it and evaluates
 their accuracy.
 Following preprocessing is applied to the dataset:
@ -25,22 +26,20 @@ Usage:
     digits.py
 '''
 # built-in modules
 from multiprocessing.pool import ThreadPool
 import cv2
 import numpy as np
 from numpy.linalg import norm
 # local modules
-from common import clock, mosaic
+from common import mosaic
-
+SZ = 20  # size of each digit is SZ x SZ
 SZ = 20 # size of each digit is SZ x SZ
 CLASS_N = 10
 DIGITS_FN = 'digits.png'
 SIMPLE = True  # Use simple preprocessing or HOG features (for SVM)
 def split2d(img, cell_size, flatten=True):
    h, w = img.shape[:2]
@ -51,6 +50,7 @@ def split2d(img, cell_size, flatten=True):
        cells = cells.reshape(-1, sy, sx)
    return cells
 def load_digits(fn):
    print 'loading "%s" ...' % fn
    digits_img = cv2.imread(fn, 0)
@ -58,23 +58,28 @@ def load_digits(fn):
    labels = np.repeat(np.arange(CLASS_N), len(digits)/CLASS_N)
    return digits, labels
 def deskew(img):
    m = cv2.moments(img)
    if abs(m['mu02']) < 1e-2:
        return img.copy()
    skew = m['mu11']/m['mu02']
    M = np.float32([[1, skew, -0.5*SZ*skew], [0, 1, 0]])
-    img = cv2.warpAffine(img, M, (SZ, SZ), flags=cv2.WARP_INVERSE_MAP | cv2.INTER_LINEAR)
+    img = cv2.warpAffine(img, M, (SZ, SZ),
                         flags=cv2.WARP_INVERSE_MAP | cv2.INTER_LINEAR)
    return img
 class StatModel(object):
    def load(self, fn):
        self.model.load(fn)
    def save(self, fn):
        self.model.save(fn)
 class KNearest(StatModel):
-    def __init__(self, k = 3):
+    def __init__(self, k=3):
        self.k = k
        self.model = cv2.KNearest()
@ -83,42 +88,47 @@ class KNearest(StatModel):
        self.model.train(samples, responses)
    def predict(self, samples):
-        retval, results, neigh_resp, dists = self.model.find_nearest(samples, self.k)
+        retval, results, neigh_resp, dists = self.model.find_nearest(samples,
                                                                     self.k)
        return results.ravel()
 class SVM(StatModel):
    def __init__(self, kernel_type=cv2.SVM_RBF, C=1, gamma=0.5):
-        self.params = dict( kernel_type = kernel_type,
+        self.params = dict(kernel_type=kernel_type,
-                            svm_type = cv2.SVM_C_SVC,
+                           svm_type=cv2.SVM_C_SVC,
-                            C = C,
+                           C=C,
-                            gamma = gamma )
+                           gamma=gamma)
        self.model = cv2.SVM()
    def train(self, samples, responses):
        self.model = cv2.SVM()
-        self.model.train(samples, responses, params = self.params)
+        self.model.train(samples, responses, params=self.params)
    def train_auto(self, samples, responses):
        self.model = cv2.SVM()
-        self.model.train_auto(samples, responses, None, None, params = self.params)
+        self.model.train_auto(samples, responses, None, None,
                              params=self.params)
    def predict(self, samples):
        return self.model.predict_all(samples).ravel()
 class RForest(StatModel):
    def __init__(self):
-        self.params = dict( max_depth=20 )
+        self.params = dict(max_depth=20)
        self.model = cv2.RTrees()
    def train(self, samples, responses):
        self.model = cv2.RTrees()
        self.model.train(samples, cv2.CV_ROW_SAMPLE, responses,
-              params=self.params)
+                         params=self.params)
    def predict(self, samples):
        predictions = map(self.model.predict, samples)
        return predictions
 def evaluate_model(model, digits, samples, labels):
    resp = model.predict(samples)
    err = (labels != resp).mean()
@ -135,13 +145,15 @@ def evaluate_model(model, digits, samples, labels):
    for img, flag in zip(digits, resp == labels):
        img = cv2.cvtColor(img, cv2.COLOR_GRAY2BGR)
        if not flag:
-            img[...,:2] = 0
+            img[..., :2] = 0
        vis.append(img)
    return mosaic(25, vis)
 def preprocess_simple(digits):
    return np.float32(digits).reshape(-1, SZ*SZ) / 255.0
 def preprocess_hog(digits):
    samples = []
    for img in digits:
@ -150,9 +162,10 @@ def preprocess_hog(digits):
        mag, ang = cv2.cartToPolar(gx, gy)
        bin_n = 16
        bin = np.int32(bin_n*ang/(2*np.pi))
-        bin_cells = bin[:10,:10], bin[10:,:10], bin[:10,10:], bin[10:,10:]
+        bin_cells = bin[:10, :10], bin[10:, :10], bin[:10, 10:], bin[10:, 10:]
-        mag_cells = mag[:10,:10], mag[10:,:10], mag[:10,10:], mag[10:,10:]
+        mag_cells = mag[:10, :10], mag[10:, :10], mag[:10, 10:], mag[10:, 10:]
-        hists = [np.bincount(b.ravel(), m.ravel(), bin_n) for b, m in zip(bin_cells, mag_cells)]
+        hists = [np.bincount(b.ravel(), m.ravel(), bin_n)
                 for b, m in zip(bin_cells, mag_cells)]
        hist = np.hstack(hists)
        # transform to Hellinger kernel
@ -177,8 +190,10 @@ if __name__ == '__main__':
    digits, labels = digits[shuffle], labels[shuffle]
    digits2 = map(deskew, digits)
-    samples = preprocess_simple(digits2)
+    if SIMPLE:
-    #samples = preprocess_hog(digits2)
+        samples = preprocess_simple(digits2)
    else:
        samples = preprocess_hog(digits2)
    train_n = int(0.9*len(samples))
    cv2.imshow('test set', mosaic(25, digits[train_n:]))
@ -201,17 +216,16 @@ if __name__ == '__main__':
    print 'training SVM...'
-    # HOG (original digits.py)
+    if SIMPLE:
-    #model = SVM(kernel_type=cv2.SVM_RBF, C=2.67, gamma=5.383)
+        model = SVM(kernel_type=cv2.SVM_LINEAR, C=0.1)
-    #model.train(samples_train, labels_train)
+        model.train(samples_train, labels_train)
-    # Simple (cross-validation)
+    else:
-    model = SVM(kernel_type=cv2.SVM_LINEAR, C=0.1)
+        model = SVM(kernel_type=cv2.SVM_RBF, C=2.67, gamma=5.383)
-    model.train(samples_train, labels_train)
+        model.train(samples_train, labels_train)
    vis = evaluate_model(model, digits_test, samples_test, labels_test)
    cv2.imshow('SVM test', vis)
    print 'saving SVM as "digits_svm.dat"...'
    model.save('digits_svm.dat')
    cv2.waitKey(0)