forked from bthicks/OMR-Grader
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathutils.py
100 lines (72 loc) · 2.6 KB
/
utils.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
import base64
import math
import cv2 as cv
from imutils.perspective import four_point_transform
import numpy as np
def get_threshold(im):
"""
Performs a Gaussian blur and threshold on an image for image processing.
Returns the blurred and thresholded image.
Args:
im (numpy.ndarray): An ndarray representing an image.
Returns:
threshold (numpy.ndarray): An ndarray representing the blurred and
thresholded image.
"""
blurred = cv.GaussianBlur(im, (5, 5), 0)
_, threshold = cv.threshold(blurred, 0, 255, cv.THRESH_BINARY_INV
| cv.THRESH_OTSU)
return threshold
def get_transform(contour, im):
"""
Returns the portion of an image bounded by a contour.
Args:
contour (numpy.ndarray): An ndarray representing a contour.
im (numpy.ndarray): An ndarray representing an image.
Returns:
numpy.ndarray: An ndarray representing the portion of the image bounded
by the contour.
"""
peri = cv.arcLength(contour, True)
approx = cv.approxPolyDP(contour, 0.02 * peri, True)
return four_point_transform(im, approx.reshape(4, 2))
def rotate_image(im, angle):
"""
Rotates an image by a specified angle.
Args:
im (numpy.ndarray): An ndarray representing the entire test image.
angle (int): The angle, in degrees, by which the image should be
rotated.
Returns:
numpy.ndarray: An ndarray representing the rotated test image.
"""
w = im.shape[1]
h = im.shape[0]
rads = np.deg2rad(angle)
# Calculate new image width and height.
nw = abs(np.sin(rads) * h) + abs(np.cos(rads) * w)
nh = abs(np.cos(rads) * h) + abs(np.sin(rads) * w)
# Get the rotation matrix.
rot_mat = cv.getRotationMatrix2D((nw * 0.5, nh * 0.5), angle, 1)
# Calculate the move from old center to new center combined with the
# rotation.
rot_move = np.dot(rot_mat, np.array([(nw - w) * 0.5, (nh - h) * 0.5, 0]))
# Update the translation of the transform.
rot_mat[0,2] += rot_move[0]
rot_mat[1,2] += rot_move[1]
return cv.warpAffine(im, rot_mat, (int(math.ceil(nw)),
int(math.ceil(nh))), flags=cv.INTER_LANCZOS4)
def encode_image(image):
"""
Encodes a .png image into a base64 string.
Args:
image (numpy.ndarray): An ndarray representing an image.
Returns:
str: A base64 string encoding of the image.
"""
if image is None:
return None
else:
_, binary = cv.imencode('.png', image)
encoded = base64.b64encode(binary)
return encoded.decode('utf-8')