14 anos atrás · f957089b14
--- a/.gitignore
+++ b/.gitignore
@@ -15,3 +15,4 @@ images/BBB
 
				 images/Images
			
 
				 images/Infos
			
 
				 images/licenseplates
			
 
				+images/faulty
			
--- a/src/Classifier.py
+++ b/src/Classifier.py
@@ -3,7 +3,8 @@ from svmutil import svm_train, svm_problem, svm_parameter, svm_predict, \
 
				 
			
 
				 
			
 
				 class Classifier:
			
 
				-    def __init__(self, c=None, gamma=None, filename=None, neighbours=3):
			
 
				+    def __init__(self, c=None, gamma=None, filename=None, neighbours=3, \
			
 
				+            verbose=0):
			
 
				         self.neighbours = neighbours
			
 
				 
			
 
				         if filename:
			
@@ -18,6 +19,8 @@ class Classifier:
 
				             self.param.gamma = gamma  # Parameter for radial kernel
			
 
				             self.model = None
			
 
				 
			
 
				+        self.verbose = verbose
			
 
				+
			
 
				     def save(self, filename):
			
 
				         """Save the SVM model in the given filename."""
			
 
				         svm_save_model(filename, self.model)
			
@@ -30,8 +33,9 @@ class Classifier:
 
				         l = len(learning_set)
			
 
				 
			
 
				         for i, char in enumerate(learning_set):
			
 
				-            print 'Found "%s"  --  %d of %d (%d%% done)' \
			
 
				-                  % (char.value, i + 1, l, int(100 * (i + 1) / l))
			
 
				+            if self.verbose:
			
 
				+                print 'Found "%s"  --  %d of %d (%d%% done)' \
			
 
				+                    % (char.value, i + 1, l, round(100 * (i + 1) / l))
			
 
				             classes.append(float(ord(char.value)))
			
 
				             #features.append(char.get_feature_vector())
			
 
				             char.get_single_cell_feature_vector(self.neighbours)
			
@@ -57,6 +61,7 @@ class Classifier:
 
				         true_value = 0 if true_value == None else ord(true_value)
			
 
				         #x = character.get_feature_vector(self.cell_size)
			
 
				         character.get_single_cell_feature_vector(self.neighbours)
			
 
				+        #p = svm_predict([true_value], [character.feature], self.model, '-b 1')
			
 
				         p = svm_predict([true_value], [character.feature], self.model)
			
 
				         prediction_class = int(p[0][0])
			
 
				 
			
--- a/src/GaussianFilter.py
+++ b/src/GaussianFilter.py
@@ -2,8 +2,10 @@ from GrayscaleImage import GrayscaleImage
 
				 from scipy.ndimage import gaussian_filter
			
 
				 
			
 
				 class GaussianFilter:
			
 
				+    """This class can apply a Gaussian blur on an image."""
			
 
				 
			
 
				     def __init__(self, scale):
			
 
				+        """Create a GaussianFilter object with a given scale."""
			
 
				         self.scale = scale
			
 
				 
			
 
				     def get_filtered_copy(self, image):
			
@@ -12,12 +14,15 @@ class GaussianFilter:
 
				         return GrayscaleImage(None, image)
			
 
				 
			
 
				     def filter(self, image):
			
 
				+        """Apply a Gaussian blur on the image data."""
			
 
				         image.data = gaussian_filter(image.data, self.scale)
			
 
				 
			
 
				     def get_scale(self):
			
 
				-      return self.scale
			
 
				+        """Return the scale of the Gaussian kernel."""
			
 
				+        return self.scale
			
 
				 
			
 
				     def set_scale(self, scale):
			
 
				+        """Set the scale of the Gaussian kernel."""
			
 
				         self.scale = float(scale)
			
 
				 
			
 
				     scale = property(get_scale, set_scale)
			
--- a/src/LocalBinaryPatternizer.py
+++ b/src/LocalBinaryPatternizer.py
@@ -57,7 +57,7 @@ class LocalBinaryPatternizer:
 
				              | (self.is_pixel_darker(y - 2, x - 1, value))
			
 
				 
			
 
				     def create_features_vector(self):
			
 
				-        '''Walk around the pixels in clokwise order, shifting 1 bit less at
			
 
				+        '''Walk around the pixels in clockwise order, shifting 1 bit less at
			
 
				         each neighbour starting at 7 in the top-left corner. This gives a 8-bit
			
 
				         feature number of a pixel'''
			
 
				         self.setup_histograms()
			
--- a/src/find_svm_params.py
+++ b/src/find_svm_params.py
@@ -86,7 +86,7 @@ i = 0
 
				 
			
 
				 for c in C:
			
 
				     for y in Y:
			
 
				-        classifier = Classifier(c=c, gamma=y, neighbours=neighbours)
			
 
				+        classifier = Classifier(c=c, gamma=y, neighbours=neighbours, verbose=1)
			
 
				         classifier.train(learning_set)
			
 
				         result = classifier.test(test_set)
			
 
				 
			
--- a/src/run_classifier.py
+++ b/src/run_classifier.py
@@ -0,0 +1,81 @@
 
				+#!/usr/bin/python
			
 
				+from cPickle import load
			
 
				+from sys import argv, exit
			
 
				+from pylab import imsave, plot, subplot, imshow, show, axis, title
			
 
				+from math import sqrt, ceil
			
 
				+import os
			
 
				+
			
 
				+from Classifier import Classifier
			
 
				+
			
 
				+if len(argv) < 3:
			
 
				+    print 'Usage: python %s NEIGHBOURS BLUR_SCALE' % argv[0]
			
 
				+    exit(1)
			
 
				+
			
 
				+neighbours = int(argv[1])
			
 
				+blur_scale = float(argv[2])
			
 
				+suffix = '_%s_%s' % (blur_scale, neighbours)
			
 
				+
			
 
				+test_set_file = 'test_set%s.dat' % suffix
			
 
				+classifier_file = 'classifier%s.dat' % suffix
			
 
				+
			
 
				+print 'Loading classifier...'
			
 
				+classifier = Classifier(filename=classifier_file)
			
 
				+classifier.neighbours = neighbours
			
 
				+
			
 
				+print 'Loading test set...'
			
 
				+test_set = load(file(test_set_file, 'r'))
			
 
				+l = len(test_set)
			
 
				+matches = 0
			
 
				+#classified = {}
			
 
				+classified = []
			
 
				+
			
 
				+for i, char in enumerate(test_set):
			
 
				+    prediction = classifier.classify(char, char.value)
			
 
				+
			
 
				+    if char.value != prediction:
			
 
				+        classified.append((char, prediction))
			
 
				+
			
 
				+        #key = '%s_as_%s' % (char.value, prediction)
			
 
				+
			
 
				+        #if key not in classified:
			
 
				+        #    classified[key] = [char]
			
 
				+        #else:
			
 
				+        #    classified[key].append(char)
			
 
				+
			
 
				+        print '"%s" was classified as "%s"' \
			
 
				+                % (char.value, prediction)
			
 
				+    else:
			
 
				+        matches += 1
			
 
				+
			
 
				+    print '%d of %d (%d%% done)' % (i + 1, l, round(100 * (i + 1) / l))
			
 
				+
			
 
				+print '\n%d matches (%d%%), %d fails' % (matches, \
			
 
				+        round(100 * matches / l), \
			
 
				+        len(test_set) - matches)
			
 
				+
			
 
				+# Show a grid plot of all faulty classified characters
			
 
				+print 'Plotting faulty classified characters...'
			
 
				+rows = int(ceil(sqrt(l - matches)))
			
 
				+columns = int(ceil((l - matches) / float(rows)))
			
 
				+
			
 
				+for i, pair in enumerate(classified):
			
 
				+    char, prediction = pair
			
 
				+    subplot(rows, columns, i + 1)
			
 
				+    title('%s as %s' % (char.value, prediction))
			
 
				+    imshow(char.image.data, cmap='gray')
			
 
				+    axis('off')
			
 
				+
			
 
				+show()
			
 
				+
			
 
				+#print 'Saving faulty classified characters...'
			
 
				+#folder = '../images/faulty/'
			
 
				+#
			
 
				+#if not os.path.exists(folder):
			
 
				+#    os.mkdir(folder)
			
 
				+#
			
 
				+#for filename, chars in classified.iteritems():
			
 
				+#    if len(chars) == 1:
			
 
				+#        imsave('%s%s' % (folder, filename), char.image.data, cmap='gray')
			
 
				+#    else:
			
 
				+#        for i, char in enumerate(chars):
			
 
				+#            imsave('%s%s_%d' % (folder, filename, i), char.image.data, cmap='gray')
			
--- a/src/test_classifier.py
+++ b/src/test_classifier.py
@@ -1,38 +0,0 @@
 
				-#!/usr/bin/python
			
 
				-from cPickle import dump, load
			
 
				-
			
 
				-from Classifier import Classifier
			
 
				-
			
 
				-if len(argv) < 5:
			
 
				-    print 'Usage: python %s FILE_SUFFIX C GAMMA NEIGHBOURS' % argv[0]
			
 
				-    exit(1)
			
 
				-
			
 
				-print 'Loading learning set'
			
 
				-learning_set = load(file('learning_set%s.dat' % argv[1], 'r'))
			
 
				-
			
 
				-# Train the classifier with the learning set
			
 
				-classifier = Classifier(c=float(argv[1]), \
			
 
				-                        gamma=float(argv[2]), \
			
 
				-                        neighbours=int(argv[3]))
			
 
				-classifier.train(learning_set)
			
 
				-
			
 
				-print 'Loading test set'
			
 
				-test_set = load(file('test_set%s.dat' % argv[1], 'r'))
			
 
				-l = len(test_set)
			
 
				-matches = 0
			
 
				-
			
 
				-for i, char in enumerate(test_set):
			
 
				-    prediction = classifier.classify(char, char.value)
			
 
				-
			
 
				-    if char.value == prediction:
			
 
				-        print ':-----> Successfully recognized "%s"' % char.value,
			
 
				-        matches += 1
			
 
				-    else:
			
 
				-        print ':( Expected character "%s", got "%s"' \
			
 
				-                % (char.value, prediction),
			
 
				-
			
 
				-    print '  --  %d of %d (%d%% done)' % (i + 1, l, int(100 * (i + 1) / l))
			
 
				-
			
 
				-print '\n%d matches (%d%%), %d fails' % (matches, \
			
 
				-        int(100 * matches / len(test_set)), \
			
 
				-        len(test_set) - matches)
			
--- a/src/test_compare.py
+++ b/src/test_compare.py
@@ -1,9 +1,8 @@
 
				 #!/usr/bin/python
			
 
				 from matplotlib.pyplot import imshow, subplot, show
			
 
				 from LocalBinaryPatternizer import LocalBinaryPatternizer
			
 
				-from GrayscaleImage import GrayscaleImage
			
 
				 from cPickle import load
			
 
				-from numpy import zeros, resize
			
 
				+from numpy import zeros
			
 
				 
			
 
				 chars = load(file('characters.dat', 'r'))[::2]
			
 
				 left = None
			
--- a/src/test_performance.py
+++ b/src/test_performance.py
@@ -1,6 +1,5 @@
 
				 #!/usr/bin/python
			
 
				 from os import listdir
			
 
				-from cPickle import load
			
 
				 from sys import argv, exit
			
 
				 from time import time
			
 
				 
			
--- a/src/xml_helper_functions.py
+++ b/src/xml_helper_functions.py
@@ -1,17 +1,21 @@
 
				 from os import mkdir
			
 
				 from os.path import exists
			
 
				-from pylab import imsave, array, zeros, inv, dot, norm, svd, floor
			
 
				+from pylab import array, zeros, inv, dot, svd, floor
			
 
				 from xml.dom.minidom import parse
			
 
				+from Point import Point
			
 
				 from Character import Character
			
 
				 from GrayscaleImage import GrayscaleImage
			
 
				 from NormalizedCharacterImage import NormalizedCharacterImage
			
 
				 from LicensePlate import LicensePlate
			
 
				 
			
 
				-# Gets the character data from a picture with a license plate
			
 
				-def retrieve_data(plate, corners):
			
 
				-    x0,y0, x1,y1, x2,y2, x3,y3 = corners
			
 
				+# sets the entire license plate of an image
			
 
				+def retrieve_data(image, corners):
			
 
				+    x0, y0 = corners[0].to_tuple()
			
 
				+    x1, y1 = corners[1].to_tuple()
			
 
				+    x2, y2 = corners[2].to_tuple()
			
 
				+    x3, y3 = corners[3].to_tuple()
			
 
				 
			
 
				-    M = max(x0, x1, x2, x3) - min(x0, x1, x2, x3)
			
 
				+    M = int(1.2 * (max(x0, x1, x2, x3) - min(x0, x1, x2, x3)))
			
 
				     N = max(y0, y1, y2, y3) - min(y0, y1, y2, y3)
			
 
				 
			
 
				     matrix = array([
			
@@ -25,7 +29,7 @@ def retrieve_data(plate, corners):
 
				       [ 0,  0, 0, x3, y3, 1, -N * x3, -N * y3, -N]
			
 
				     ])
			
 
				 
			
 
				-    P = get_transformation_matrix(matrix)
			
 
				+    P = inv(get_transformation_matrix(matrix))
			
 
				     data = array([zeros(M, float)] * N)
			
 
				 
			
 
				     for i in range(M):
			
@@ -34,7 +38,7 @@ def retrieve_data(plate, corners):
 
				             or_coor_h = (or_coor[1][0] / or_coor[2][0],
			
 
				                          or_coor[0][0] / or_coor[2][0])
			
 
				 
			
 
				-            data[j][i] = pV(plate, or_coor_h[0], or_coor_h[1])
			
 
				+            data[j][i] = pV(image, or_coor_h[0], or_coor_h[1])
			
 
				 
			
 
				     return data
			
 
				 
			
@@ -46,92 +50,108 @@ def get_transformation_matrix(matrix):
 
				     U, D, V = svd(matrix)
			
 
				     p = V[8][:]
			
 
				 
			
 
				-    return inv(array([[p[0],p[1],p[2]], [p[3],p[4],p[5]], [p[6],p[7],p[8]]]))
			
 
				+    return array([
			
 
				+        [ p[0], p[1], p[2] ],
			
 
				+        [ p[3], p[4], p[5] ],
			
 
				+        [ p[6], p[7], p[8] ]
			
 
				+    ])
			
 
				 
			
 
				 def pV(image, x, y):
			
 
				     #Get the value of a point (interpolated x, y) in the given image
			
 
				-    if not image.in_bounds(x, y):
			
 
				-      return 0
			
 
				+    if image.in_bounds(x, y):
			
 
				+        x_low  = floor(x)
			
 
				+        x_high = floor(x + 1)
			
 
				+        y_low  = floor(y)
			
 
				+        y_high = floor(y + 1)
			
 
				+        x_y    = (x_high - x_low) * (y_high - y_low)
			
 
				 
			
 
				-    x_low, x_high = floor(x), floor(x+1)
			
 
				-    y_low, y_high = floor(y), floor(y+1)
			
 
				-    x_y    = (x_high - x_low) * (y_high - y_low)
			
 
				+        a = x_high - x
			
 
				+        b = y_high - y
			
 
				+        c = x - x_low
			
 
				+        d = y - y_low
			
 
				 
			
 
				-    a = x_high - x
			
 
				-    b = y_high - y
			
 
				-    c = x - x_low
			
 
				-    d = y - y_low
			
 
				+        return image[x_low,  y_low] / x_y * a * b \
			
 
				+            + image[x_high,  y_low] / x_y * c * b \
			
 
				+            + image[x_low , y_high] / x_y * a * d \
			
 
				+            + image[x_high, y_high] / x_y * c * d
			
 
				 
			
 
				-    return image[x_low,  y_low] / x_y * a * b \
			
 
				-        + image[x_high,  y_low] / x_y * c * b \
			
 
				-        + image[x_low , y_high] / x_y * a * d \
			
 
				-        + image[x_high, y_high] / x_y * c * d
			
 
				+    return 0
			
 
				 
			
 
				 def xml_to_LicensePlate(filename, save_character=None):
			
 
				-    plate   = GrayscaleImage('../images/Images/%s.jpg' % filename)
			
 
				-    dom     = parse('../images/Infos/%s.info' % filename)
			
 
				-    country = ''
			
 
				-    result  = []
			
 
				-    version = get_node(dom, "current-version")
			
 
				-    infos   = by_tag(dom, "info")
			
 
				-
			
 
				-    for info in infos:
			
 
				-        if not version == get_node(info, "version"):
			
 
				-            continue
			
 
				+    image = GrayscaleImage('../images/Images/%s.jpg' % filename)
			
 
				+    dom   = parse('../images/Infos/%s.info' % filename)
			
 
				+    result_characters = []
			
 
				 
			
 
				-        country = get_node(info, "identification-letters")
			
 
				-        temp    = by_tag(info, "characters")
			
 
				+    version = dom.getElementsByTagName("current-version")[0].firstChild.data
			
 
				+    info    = dom.getElementsByTagName("info")
			
 
				 
			
 
				-        if not temp: # no characters where found in the file
			
 
				-            break
			
 
				+    for i in info:
			
 
				+        if version == i.getElementsByTagName("version")[0].firstChild.data:
			
 
				 
			
 
				-        characters = temp[0].childNodes
			
 
				+            country = i.getElementsByTagName("identification-letters")[0].firstChild.data
			
 
				+            temp = i.getElementsByTagName("characters")
			
 
				 
			
 
				-        for i, char in enumerate(characters):
			
 
				-            if not char.nodeName == "character":
			
 
				-              continue
			
 
				+            if len(temp):
			
 
				+              characters = temp[0].childNodes
			
 
				+            else:
			
 
				+              characters = []
			
 
				+              break
			
 
				 
			
 
				-            value   = get_node(char, "char")
			
 
				-            corners = get_corners(char)
			
 
				+            for i, character in enumerate(characters):
			
 
				+                if character.nodeName == "character":
			
 
				+                    value   = character.getElementsByTagName("char")[0].firstChild.data
			
 
				+                    corners = get_corners(character)
			
 
				 
			
 
				-            if not len(corners) == 8:
			
 
				-                break
			
 
				+                    if not len(corners) == 4:
			
 
				+                      break
			
 
				 
			
 
				-            data  = retrieve_data(plate, corners)
			
 
				-            image = NormalizedCharacterImage(data=data)
			
 
				-            result.append(Character(value, corners, image, filename))
			
 
				-        
			
 
				-            if save_character:
			
 
				-                character_image = GrayscaleImage(data=data)
			
 
				-                path       = "../images/LearningSet/%s" % value
			
 
				-                image_path = "%s/%d_%s.jpg" % (path, i, filename.split('/')[-1])
			
 
				+                    character_data  = retrieve_data(image, corners)
			
 
				+                    character_image = NormalizedCharacterImage(data=character_data)
			
 
				 
			
 
				-                if not exists(path):
			
 
				-                  mkdir(path)
			
 
				+                    result_characters.append(Character(value, corners, character_image, filename))
			
 
				 
			
 
				-                if not exists(image_path):
			
 
				-                  character_image.save(image_path)
			
 
				+                    if save_character:
			
 
				+                        single_character = GrayscaleImage(data=character_data)
			
 
				 
			
 
				-    return LicensePlate(country, result)
			
 
				+                        path = "../images/LearningSet/%s" % value
			
 
				+                        image_path = "%s/%d_%s.jpg" % (path, i, filename.split('/')[-1])
			
 
				 
			
 
				-def get_node(node, tag):
			
 
				-    return by_tag(node, tag)[0].firstChild.data
			
 
				+                        if not exists(path):
			
 
				+                          mkdir(path)
			
 
				 
			
 
				-def by_tag(node, tag):
			
 
				-    return node.getElementsByTagName(tag)
			
 
				+                        if not exists(image_path):
			
 
				+                          single_character.save(image_path)
			
 
				 
			
 
				-def get_attr(node, attr):
			
 
				-  return int(node.getAttribute(attr))
			
 
				+    return LicensePlate(country, result_characters)
			
 
				 
			
 
				 def get_corners(dom):
			
 
				-    p = by_tag(dom, "point")
			
 
				+  nodes = dom.getElementsByTagName("point")
			
 
				+  corners = []
			
 
				+
			
 
				+  margin_y = 3
			
 
				+  margin_x = 2
			
 
				+
			
 
				+  corners.append(
			
 
				+    Point(get_coord(nodes[0], "x") - margin_x,
			
 
				+          get_coord(nodes[0], "y") - margin_y)
			
 
				+  )
			
 
				+
			
 
				+  corners.append(
			
 
				+    Point(get_coord(nodes[1], "x") + margin_x,
			
 
				+          get_coord(nodes[1], "y") - margin_y)
			
 
				+  )
			
 
				+
			
 
				+  corners.append(
			
 
				+    Point(get_coord(nodes[2], "x") + margin_x,
			
 
				+          get_coord(nodes[2], "y") + margin_y)
			
 
				+  )
			
 
				+
			
 
				+  corners.append(
			
 
				+    Point(get_coord(nodes[3], "x") - margin_x,
			
 
				+          get_coord(nodes[3], "y") + margin_y)
			
 
				+  )
			
 
				 
			
 
				-    # Extra padding
			
 
				-    y = 3
			
 
				-    x = 2
			
 
				+  return corners
			
 
				 
			
 
				-    # return 8 values (x0,y0, .., x3,y3)
			
 
				-    return get_attr(p[0], "x") - x, get_attr(p[0], "y") - y,\
			
 
				-           get_attr(p[1], "x") + x, get_attr(p[1], "y") - y,\
			
 
				-           get_attr(p[2], "x") + x, get_attr(p[2], "y") + y,\
			
 
				-           get_attr(p[3], "x") - x, get_attr(p[3], "y") + y
			
 
				+def get_coord(node, attribute):
			
 
				+  return int(node.getAttribute(attribute))
			
--- a/todo.txt
+++ b/todo.txt
@@ -0,0 +1,3 @@
 
				+- Beste classifier runnen en kijken welke karakters fout gaan
			
 
				+- code documenteren
			
 
				+- verslag: conclusies aan parameters verbinden