-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathpreprocess.py
161 lines (131 loc) · 5.59 KB
/
preprocess.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
import numpy as np
from skimage.io import imread
from skimage import restoration
from skimage import measure
from skimage.measure import regionprops
from skimage.filters import threshold_otsu
from skimage.transform import resize
class PreProcess:
    """
    Loads a car image, binarises it and extracts license-plate candidates.

    Attributes set by ``__init__``:
        full_car_image: grayscale image (resized when wider than
            ``MAX_IMAGE_WIDTH``)
        binary_image: Otsu-thresholded version of ``full_car_image``

    Attributes set by ``get_plate_like_objects``:
        label_image: connected-component labelling of ``binary_image``
        plate_objects_cordinates: list of (min_row, min_col, max_row,
            max_col) bounding boxes, one per returned candidate
    """

    # Images wider than this many pixels are scaled down before processing.
    MAX_IMAGE_WIDTH = 600
    # Connected regions with fewer pixels than this are ignored.
    MIN_REGION_AREA = 10
    # Allowed plate height / width as a fraction of the full image size.
    MIN_HEIGHT_RATIO = 0.08
    MAX_HEIGHT_RATIO = 0.2
    MIN_WIDTH_RATIO = 0.15
    MAX_WIDTH_RATIO = 0.4
    # Amount subtracted from the Otsu threshold in ``inverted_threshold``.
    INVERTED_THRESHOLD_OFFSET = 0.05

    def __init__(self, image_location):
        """
        reads the image in grayscale and thresholds the image

        Parameters:
        -----------
        image_location: str; full image directory path
        """
        # ``as_gray`` is the current spelling of the keyword; the old
        # ``as_grey`` spelling is no longer accepted by scikit-image.
        self.full_car_image = imread(image_location, as_gray=True)
        self.full_car_image = self.resize_if_necessary(self.full_car_image)
        self.binary_image = self.threshold(self.full_car_image)

    def denoise(self, imgDetails):
        """
        applies total-variation (Chambolle) denoising with the library's
        default settings

        Parameters:
        -----------
        imgDetails: array: image to be denoised

        Return:
        --------
        the denoised image
        """
        return restoration.denoise_tv_chambolle(imgDetails)

    def threshold(self, gray_image):
        """
        uses the otsu threshold method to generate a binary image

        Parameters:
        -----------
        gray_image: 2D array: gray scale image to be thresholded

        Return:
        --------
        2-D boolean array; True where the pixel is brighter than the
        otsu threshold
        """
        threshold_value = threshold_otsu(gray_image)
        return gray_image > threshold_value

    def get_plate_like_objects(self):
        """
        uses connected component analysis and labelling to map out
        object regions and keeps those whose bounding box looks like a
        license plate.

        A region is kept when all of the following hold:
            i.   it covers at least ``MIN_REGION_AREA`` pixels
            ii.  its bounding-box height is between ``MIN_HEIGHT_RATIO``
                 and ``MAX_HEIGHT_RATIO`` of the image height
            iii. its bounding-box width is between ``MIN_WIDTH_RATIO``
                 and ``MAX_WIDTH_RATIO`` of the image width
            iv.  its bounding box is wider than it is tall

        Side effects: sets ``self.label_image`` and rebuilds
        ``self.plate_objects_cordinates`` (same order as the returned list).

        Return:
        --------
        list of 2D arrays cropped from the grayscale image, one per
        license plate candidate region
        """
        self.label_image = measure.label(self.binary_image)
        self.plate_objects_cordinates = []

        image_height = self.binary_image.shape[0]
        image_width = self.binary_image.shape[1]
        min_height = self.MIN_HEIGHT_RATIO * image_height
        max_height = self.MAX_HEIGHT_RATIO * image_height
        min_width = self.MIN_WIDTH_RATIO * image_width
        max_width = self.MAX_WIDTH_RATIO * image_width

        plate_like_objects = []
        for region in regionprops(self.label_image):
            if region.area < self.MIN_REGION_AREA:
                continue

            min_row, min_col, max_row, max_col = region.bbox
            region_height = max_row - min_row
            region_width = max_col - min_col

            if (min_height <= region_height <= max_height
                    and min_width <= region_width <= max_width
                    and region_width > region_height):
                plate_like_objects.append(
                    self.full_car_image[min_row:max_row, min_col:max_col])
                self.plate_objects_cordinates.append(
                    (min_row, min_col, max_row, max_col))

        return plate_like_objects

    def validate_plate(self, candidates):
        """
        validates the candidate plate objects by counting the white
        pixels of each inverted-threshold candidate and dividing by the
        candidate's width (average white pixels per column). The
        candidate with the highest average is selected; on a tie the
        later candidate wins.

        This method still needs improvement

        Parameters:
        ------------
        candidates: sequence of 2D grayscale arrays of objects that look
            like a license plate

        Returns:
        --------
        the 2D binary (inverted-threshold) array of the likeliest license
        plate region, or an empty list when ``candidates`` is empty
        """
        # Both trackers live outside the loop so the best score survives
        # across candidates and an empty input still has a return value.
        license_plate = []
        highest_average = 0

        for each_candidate in candidates:
            width = each_candidate.shape[1]
            binary_candidate = self.inverted_threshold(each_candidate)
            # Summing the boolean array counts its True (white) pixels.
            average = float(binary_candidate.sum()) / width
            if average >= highest_average:
                highest_average = average
                license_plate = binary_candidate

        return license_plate

    def inverted_threshold(self, grayscale_image):
        """
        used to invert the threshold of the candidate regions of the plate
        localization process. The inversion was necessary
        because the license plate area is white dominated which means
        they have a greater gray scale value than the character region

        Parameters:
        -----------
        grayscale_image: 2D array of the gray scale image of the
            candidate region

        Returns:
        --------
        a 2D boolean image; True where the pixel is darker than the
        otsu threshold lowered by ``INVERTED_THRESHOLD_OFFSET``
        """
        # NOTE(review): the fixed offset presumably assumes intensities
        # scaled to [0, 1] -- confirm against the image loader.
        threshold_value = (threshold_otsu(grayscale_image)
                           - self.INVERTED_THRESHOLD_OFFSET)
        return grayscale_image < threshold_value

    def resize_if_necessary(self, image_to_resize):
        """
        function is used to resize the image before further
        processing if the image is too big. The resize is done
        in such a way that the aspect ratio is still maintained

        Parameters:
        ------------
        image_to_resize: 2D-Array of the image to be resized
            3D array image (RGB channel) can also be resized

        Return:
        --------
        resized image or the original image if resize is not
        necessary
        """
        # Only the first two axes are rows/columns; slicing keeps the
        # unpacking valid when a trailing channel axis is present.
        height, width = image_to_resize.shape[:2]
        if width <= self.MAX_IMAGE_WIDTH:
            return image_to_resize

        ratio = float(width) / height
        new_width = self.MAX_IMAGE_WIDTH
        # The output shape must be integral and at least one row tall.
        new_height = max(1, int(round(new_width / ratio)))
        return resize(image_to_resize, (new_height, new_width))