-
Notifications
You must be signed in to change notification settings - Fork 12
/
Copy pathSVCDigitDetector.py
100 lines (59 loc) · 2.66 KB
/
SVCDigitDetector.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
import logging
from SimpleCV import ImageSet
from sklearn.svm import LinearSVC
from os.path import isfile
import pickle
class SVCDigitDetector(object):
TEMPLATE_SIZE = (10, 40)
dataset_array = []
dataset_digit = []
neural_network = LinearSVC()
neural_network_cache = "./linear_svc_model.pickle"
# See black magic below in the code for explanation
crop_top_percent = 10
def __init__(self):
if isfile(self.neural_network_cache):
logging.debug("Loading neural netowrk from cache")
cache_file = open(self.neural_network_cache, "rb")
self.neural_network = pickle.load(cache_file)
else:
self.train("./images/dataset/")
cache_file = open(self.neural_network_cache, "wb+")
pickle.dump(self.neural_network, cache_file)
cache_file.close()
def train(self, digits_path):
for digit_to_train in range(-1, 10):
logging.info("Training digit " + str(digit_to_train))
digit_images = ImageSet(digits_path + str(digit_to_train))
logging.debug("Loaded " + str(len(digit_images)) + " digits")
for digit_image in digit_images:
self.train_image(digit_image, digit_to_train)
logging.info("Digit " + str(digit_to_train) + " trained")
self.train_network()
def train_network(self):
logging.info("Training the model")
self.neural_network.fit(self.dataset_array, self.dataset_digit)
def image_to_array(self, image):
resiezed_image = image.resize(self.TEMPLATE_SIZE[0], self.TEMPLATE_SIZE[1])
resiezed_image_numpy = resiezed_image.getNumpy().ravel()
return resiezed_image_numpy
def train_image(self, image, digit):
self.dataset_array.append(self.image_to_array(image))
self.dataset_digit.append(digit)
# Black magic below :
# Camera is positioned slightly above the gas meter, therefore sometime we don't
# see top of the rounded digits.
# We can train the model even for 'cropped' images without top part
resize_to_height = int((image.height / 100.0) * self.crop_top_percent)
crop_start = (0, resize_to_height)
crop_stop = (image.width, image.height)
self.dataset_array.append(self.image_to_array(image.crop(crop_start, crop_stop)))
self.dataset_digit.append(digit)
def detect_digit(self, image):
image_array = self.image_to_array(image).reshape(1, -1)
name = self.neural_network.predict(image_array)
if name[0] >= 0:
return name[0]
else:
# -1 are invalid blobs
return None