-
Notifications
You must be signed in to change notification settings - Fork 15
/
Copy pathimage_text_extractor.py
67 lines (55 loc) · 2.59 KB
/
image_text_extractor.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
# importing all required libraries
import os
import traceback
# importing libraries for computer vision
import numpy as np
import cv2
import imutils
from imutils import contours
from imutils.perspective import four_point_transform
from skimage.filters import threshold_local
# importing libraries to read text from image
from PIL import Image
import pytesseract
# exploring the directory for all jpg files
for file in os.listdir("/home/deepshikha/Workspace/Text-Extraction-From-Image/set10"):
if file.endswith(".jpg"):
file_path = "/home/deepshikha/Workspace/Text-Extraction-From-Image/set10/" + str(file)
# reading file with cv2
img = cv2.imread(file_path)
ratio = img.shape[0]/500.0
original_img = img.copy()
# converting image into grayscale
gray = cv2.cvtColor(img, cv2.COLOR_BGR2GRAY)
# blurring and finding edges of the image
blurred = cv2.GaussianBlur(gray, (5,5) ,0)
edged = cv2.Canny(gray, 75, 200)
# applying threshold to grayscale image
thresh = cv2.threshold(gray, 225, 255, cv2.THRESH_BINARY_INV)[1]
# finding contours
(_, cnts, _) = cv2.findContours(thresh.copy(), cv2.RETR_EXTERNAL, cv2.CHAIN_APPROX_SIMPLE)
# draw contours on image
cv2.drawContours(img, cnts, -1, (240, 0, 159), 3)
H,W = img.shape[:2]
for cnt in cnts:
x,y,w,h = cv2.boundingRect(cnt)
if cv2.contourArea(cnt) > 100 and (0.7 < w/h < 1.3) and (W/4 < x + w//2 < W*3/4) and (H/4 < y + h//2 < H*3/4):
break
# creating mask and performing bitwise-op
mask = np.zeros(img.shape[:2],np.uint8)
cv2.drawContours(mask, [cnt],-1, 255, -1)
dst = cv2.bitwise_and(img, img, mask=mask)
# displaying image and saving in the directory
gray = cv2.cvtColor(dst, cv2.COLOR_BGR2GRAY)
gray = cv2.medianBlur(gray, 3)
gray = cv2.threshold(gray, 0, 255, cv2.THRESH_BINARY | cv2.THRESH_OTSU)[1]
scanned_file_name = "/home/deepshikha/Workspace/Text-Extraction-From-Image/set10/" + str(file[:-4]) + "-Scanned.png"
cv2.imwrite(scanned_file_name, dst)
# cv2.imshow("gray.png", dst)
# cv2.waitKey()
# fetching text from the image and storing it into a text file
file_text = pytesseract.image_to_string(Image.open(scanned_file_name))
text_file_name = "/home/deepshikha/Workspace/Text-Extraction-From-Image/set10/" + str(file[:-4]) + "-Scanned.txt"
with open(text_file_name, "a") as f:
f.write(file_text + "\n")
# import pdb; pdb.set_trace()