# Document-Word-Detection/Word_detection.py

'''
Output: word detection on a document image (a simple OCR-style application).
'''

import cv2
import numpy as np
import imutils

# Read the input image. cv2.imread does not raise when the file is missing or
# unreadable; it returns None, which would otherwise surface as an obscure
# error inside cv2.resize below, so fail early with a clear message.
frame = cv2.imread('test.jpeg')
if frame is None:
    raise FileNotFoundError("could not read input image 'test.jpeg'")

# Resize to a fixed 600x600 working size (the aspect ratio is not preserved)
frame = cv2.resize(frame, (600, 600))

# Convert to grayscale
gray = cv2.cvtColor(frame, cv2.COLOR_BGR2GRAY)

# Remove noise with a 5x5 Gaussian blur before thresholding
blur = cv2.GaussianBlur(gray, (5, 5), 0)

# Otsu threshold (bimodal threshold): the threshold value is chosen
# automatically, and THRESH_BINARY_INV maps pixels at or below it to 255 and
# the rest to 0 (presumably dark ink on light paper, so ink becomes white).
thresh = cv2.threshold(blur, 0, 255,
                       cv2.THRESH_BINARY_INV + cv2.THRESH_OTSU)[1]

# Line-shaped structuring elements: 25 px wide x 1 px tall to pick up
# horizontal lines, 1 px wide x 25 px tall to pick up vertical lines.
horizontal_kernel = cv2.getStructuringElement(cv2.MORPH_RECT, (25, 1))
vertical_kernel = cv2.getStructuringElement(cv2.MORPH_RECT, (1, 25))
print('horizontal kernel : {}'.format(horizontal_kernel))
print('vertical kernel : {}'.format(vertical_kernel))


def _extract_lines(binary_image, line_kernel):
    """Open *binary_image* with *line_kernel* and locate what survives.

    Returns a ``(opened_image, contours)`` pair, where ``contours`` are the
    external contours found in the opened image.
    """
    # Opening = erosion followed by dilation; only shapes that can contain
    # the kernel survive, i.e. long runs in the kernel's direction.
    opened = cv2.morphologyEx(binary_image, cv2.MORPH_OPEN, line_kernel,
                              iterations=2)
    # Arguments: source image, contour retrieval mode, approximation method.
    found = cv2.findContours(opened, cv2.RETR_EXTERNAL,
                             cv2.CHAIN_APPROX_SIMPLE)
    # The contour list is the second-to-last item for both the 2-tuple and
    # the 3-tuple return shapes of cv2.findContours.
    return opened, found[-2]


horizontal_lines, cnts = _extract_lines(thresh, horizontal_kernel)
vertical_lines, cntsv = _extract_lines(thresh, vertical_kernel)

# Paint every detected line white on the working frame, horizontal lines
# first and then vertical ones.
line_colour = (255, 255, 255)
for line_contours in (cnts, cntsv):
    for c in line_contours:
        cv2.drawContours(frame, [c], -1, line_colour, 2)

# Show the intermediate images
cv2.imshow('thresh', thresh)
cv2.imshow('horizontal_lines', horizontal_lines)
cv2.imshow('vertical_lines', vertical_lines)
cv2.imshow('frame', frame)

# Convert the working frame to grayscale again; by this point the detected
# horizontal/vertical lines have been painted over in white on `frame`.
gray1 = cv2.cvtColor(frame, cv2.COLOR_BGR2GRAY)

# Adaptive (local, Gaussian-weighted) threshold with a 23x23 neighbourhood
# and a constant of 30 subtracted from the weighted mean.
thresh1 = cv2.adaptiveThreshold(gray1, 255, cv2.ADAPTIVE_THRESH_GAUSSIAN_C,
                                cv2.THRESH_BINARY, 23, 30)
canny = imutils.auto_canny(thresh1)

# Inverted edge map, used for display only
output = cv2.bitwise_not(canny)
kernel = np.ones((5, 5), np.uint8)

# NOTE(review): this is named `opening` and shown in the 'opening' window,
# but the operation applied is MORPH_CLOSE (dilation followed by erosion).
# It is only displayed, never used for detection - confirm which was meant.
opening = cv2.morphologyEx(canny, cv2.MORPH_CLOSE, kernel)

# Dilate the edges so neighbouring strokes merge into a single blob
dilation = cv2.dilate(canny, kernel, iterations=1)

# cv2.findContours returns (contours, hierarchy) in OpenCV 2.x/4.x but
# (image, contours, hierarchy) in 3.x. The contour list is second-to-last in
# both cases, so index it instead of unpacking a fixed number of values.
contour = cv2.findContours(dilation, cv2.RETR_TREE,
                           cv2.CHAIN_APPROX_SIMPLE)[-2]

# Contours with an area of 20 or less are skipped
min_contour_area = 20

for word_contour in contour:
    if cv2.contourArea(word_contour) > min_contour_area:
        x, y, w, h = cv2.boundingRect(word_contour)
        cv2.rectangle(frame, (x, y), (x + w, y + h), (0, 120, 255), 2)

# Show the intermediate images and the annotated frame
cv2.imshow('output', output)
cv2.imshow('dilate', dilation)
cv2.imshow('opening', opening)
cv2.imshow('original_frame', frame)
cv2.imshow('canny', canny)
cv2.imshow('thresh1', thresh1)

# Save the annotated image. cv2.imwrite signals failure through its boolean
# return value rather than an exception, so report a failed save instead of
# letting it pass silently. The windows are still shown either way.
if not cv2.imwrite('output.jpg', frame):
    print('warning : could not write output.jpg')

# Wait for a key press (0 = no timeout), then destroy all windows
cv2.waitKey(0)
cv2.destroyAllWindows()