-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy path: recognize.py
More file actions
67 lines (53 loc) · 2.27 KB
/
recognize.py
File metadata and controls
67 lines (53 loc) · 2.27 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
__author__ = 'saideeptalari'
import argparse

import cv2
import imutils
import numpy as np
from keras.models import load_model

# NOTE(review): the original `from skimage.filters import threshold_adaptive`
# import was unused here, and that function has been removed from scikit-image
# (>= 0.15; replaced by `threshold_local`), so it is dropped.

PAD = 8  # pixels of context kept around each digit crop (was hard-coded 8)


def _parse_args():
    """Parse the command-line arguments for the recognizer script."""
    ap = argparse.ArgumentParser()
    ap.add_argument("-i", "--image", required=True, help="Path to image to recognize")
    ap.add_argument("-m", "--model", required=True, help="Path to saved classifier")
    return vars(ap.parse_args())


def _find_external_contours(thresh):
    """Return external contours of *thresh*, portable across OpenCV versions.

    OpenCV 2.4 and 4.x return (contours, hierarchy); OpenCV 3.x returns
    (image, contours, hierarchy). The original 2-tuple unpack crashed on 3.x.
    """
    result = cv2.findContours(thresh.copy(), cv2.RETR_EXTERNAL,
                              cv2.CHAIN_APPROX_SIMPLE)
    return result[0] if len(result) == 2 else result[1]


def main():
    """Segment digit candidates from an image and classify them with a CNN."""
    args = _parse_args()

    # read, resize and convert to grayscale
    image = cv2.imread(args["image"])
    if image is None:  # cv2.imread returns None instead of raising
        raise SystemExit("Could not read image: %s" % args["image"])
    image = imutils.resize(image, width=320)
    gray = cv2.cvtColor(image, cv2.COLOR_BGR2GRAY)

    # blackhat (enhances dark digits on light background) + Otsu thresholding
    kernel = cv2.getStructuringElement(cv2.MORPH_RECT, (5, 5))
    blackhat = cv2.morphologyEx(gray, cv2.MORPH_BLACKHAT, kernel)
    _, thresh = cv2.threshold(blackhat, 0, 255,
                              cv2.THRESH_BINARY | cv2.THRESH_OTSU)
    thresh = cv2.dilate(thresh, None)  # dilate thresholded image for better segmentation

    cnts = _find_external_contours(thresh)
    if len(cnts) == 0:  # np.mean([]) would yield NaN and a warning below
        raise SystemExit("No digit candidates found in image")

    # average contour area; anything below a tenth of it is treated as noise
    avgCntArea = np.mean([cv2.contourArea(c) for c in cnts])

    digits = []
    boxes = []
    for c in cnts:
        if cv2.contourArea(c) < avgCntArea / 10:
            continue
        mask = np.zeros(gray.shape, dtype="uint8")  # fresh mask per contour
        (x, y, w, h) = cv2.boundingRect(c)
        hull = cv2.convexHull(c)
        cv2.drawContours(mask, [hull], -1, 255, -1)  # filled hull on mask
        mask = cv2.bitwise_and(thresh, thresh, mask=mask)  # segment digit from thresh
        # Clamp the padded crop to the image bounds: the original y-8/x-8
        # could go negative near the edges, which Python interprets as
        # wrap-around indexing and yields an empty/wrong crop.
        y0, y1 = max(y - PAD, 0), min(y + h + PAD, mask.shape[0])
        x0, x1 = max(x - PAD, 0), min(x + w + PAD, mask.shape[1])
        digit = mask[y0:y1, x0:x1]
        if digit.size == 0:  # degenerate crop; cv2.resize would raise
            continue
        digit = cv2.resize(digit, (28, 28))
        boxes.append((x, y, w, h))
        digits.append(digit)

    digits = np.array(digits)
    model = load_model(args["model"])
    # For a Multi-Layer-Perceptron the layout would be digits.reshape(-1, 784).
    digits = digits.reshape(digits.shape[0], 28, 28, 1)  # CNN layout: NHWC
    # Sequential.predict_classes was removed in Keras >= 2.6; argmax over the
    # predicted class probabilities is the portable equivalent.
    labels = np.argmax(model.predict(digits), axis=1)

    cv2.imshow("Original", image)
    cv2.imshow("Thresh", thresh)
    # draw bounding boxes (sorted left-to-right by x) and print digits on them
    for (x, y, w, h), label in sorted(zip(boxes, labels)):
        cv2.rectangle(image, (x, y), (x + w, y + h), (0, 0, 255), 1)
        cv2.putText(image, str(label), (x + 2, y - 5),
                    cv2.FONT_HERSHEY_SIMPLEX, 1.0, (0, 255, 0), 2)
    cv2.imshow("Recognized", image)
    cv2.waitKey(0)
    cv2.destroyAllWindows()


if __name__ == "__main__":
    main()