# pyimgscan.py

import cv2
import argparse

from cvtools import resize
from cvtools import perspective_transform
from cvtools import getoutlines
from cvtools import simple_erode
from cvtools import simple_dilate
from cvtools import brightness_contrast
from cvtools import blank

# PARSE COMMAND-LINE ARGUMENTS WITH ARGPARSE
ap = argparse.ArgumentParser()

# path of the input photograph (mandatory)
ap.add_argument(
    "-i", "--image", required=True, help="Path to the image to be corrected."
)

# optional switch: with nargs="?" and a const, a bare "-I" stores the const
# value, while omitting the option leaves the entry as None; the rest of the
# script only checks whether the value is None
ap.add_argument(
    "-I",
    "--inverted",
    required=False,
    nargs="?",
    const="True",
    help="Invert the output if this argument is present.",
)

# expose the parsed arguments as a plain dict keyed by option name
args = vars(ap.parse_args())

# READ INPUT IMAGE
img = cv2.imread(args["image"])

# cv2.imread signals an unreadable/missing file by returning None instead of
# raising, so check for it explicitly, notify the user and quit the program
if img is None:
    print()
    print("The file does not exist or is empty!")
    print("Please select a valid image file!")
    print()
    # exit with a non-zero status so shells and calling scripts can tell that
    # the run failed (an exit code of zero would report success)
    raise SystemExit(1)


"""
Primary Functions
"""


def preprocess(img):
    """
    BASIC PRE-PROCESSING TO OBTAIN A CANNY EDGE IMAGE

    Returns a 4-tuple:
        (adjusted image, scale factor, down-scaled image, edge image)
    where the scale factor is the adjusted image's height divided by the
    working height, so results can be mapped back to the original size.
    """

    # height (in px) that the image is shrunk to before edge detection
    target_height = 500

    # boost the contrast between the paper and the background
    adjusted = brightness_contrast(img, 1.56, -60)

    # remember how much larger the full-size image is than the working copy
    ratio = adjusted.shape[0] / float(target_height)

    # shrink the adjusted image to the working height
    shrunk = resize(adjusted, height=target_height)

    # grayscale, then smooth with an 11x11 gaussian kernel
    blurred = cv2.GaussianBlur(
        cv2.cvtColor(shrunk, cv2.COLOR_BGR2GRAY), (11, 11), 0
    )

    # canny edge detection, followed by a dilation that closes small gaps
    # in the detected edges
    edges = simple_dilate(cv2.Canny(blurred, 60, 245))

    return adjusted, ratio, shrunk, edges


def gethull(img_edge):
    """
    1st ROUND OF OUTLINE FINDING, + CONVEX HULL

    Finds the outlines in the edge image, draws the convex hull of every
    outline onto a fresh image, erodes that image and returns it.

    img_edge -- edge image to search; it is copied first, so the caller's
                image is left untouched
    """

    # make a copy of the edge image because the following function manipulates
    # the input
    img_prehull = img_edge.copy()

    # find outlines in the (newly copied) edge image
    outlines = getoutlines(img_prehull)

    # create a blank image (same shape and dtype as the edge image) for the
    # convex hull operation
    # NOTE(review): the "0" argument presumably selects a zero/black fill --
    # confirm against cvtools.blank
    img_hull = blank(img_prehull.shape, img_prehull.dtype, "0")

    # draw the convex hull (fit polygon) of every detected outline onto
    # 'img_hull'
    for outline in outlines:

        hull = cv2.convexHull(outline)

        # parameters: target image, list of contours, index into that list
        #             (0 = the single hull passed), color, thickness
        cv2.drawContours(img_hull, [hull], 0, 255, 3)

    # erode the hull image to make the outline closer to paper
    img_hull = simple_erode(img_hull)

    return img_hull


def getcorners(img_hull):
    """
    2nd ROUND OF OUTLINE FINDING, + SORTING & APPROXIMATION

    Searches the convex hull image for outlines and returns the polygon
    approximation of the first of the (up to) four largest outlines that
    reduces to exactly 4 points.

    img_hull -- convex hull image to search; it is copied first, so the
                caller's image is left untouched

    Returns the 4-point approximation as produced by cv2.approxPolyDP.

    Raises ValueError if none of the candidate outlines approximates to
    4 points.
    """

    # make a copy of the hull image because the following function manipulates
    # the input
    img_outlines = img_hull.copy()

    # find outlines in the convex hull image
    outlines = getoutlines(img_outlines)

    # sort the outlines by area from large to small, and only take the largest 4
    # outlines in order to speed up the process and not waste time
    outlines = sorted(outlines, key=cv2.contourArea, reverse=True)[:4]

    # loop over outlines
    for outline in outlines:

        # find the perimeter of each outline for use in approximation
        perimeter = cv2.arcLength(outline, True)

        # > approximate a rough contour for each outline found, with (hopefully)
        #   4 points (rectangular sheet of paper); [Douglas-Peucker Algorithm]
        # > FIRST OPTION is the input outline;
        # > SECOND OPTION is the accuracy of approximation (epsilon), here it
        #   is set to a percentage of the perimeter of the outline
        # > THIRD OPTION is whether to assume an outline
        #   is closed, which in this case is yes (sheet of paper)
        approx = cv2.approxPolyDP(outline, 0.02 * perimeter, True)

        # if the approximation has 4 points, then assume it is correct and
        # return these points as the corners
        if len(approx) == 4:
            return approx

    # no candidate had 4 points (or no outline was found at all): fail with a
    # clear message instead of referencing a variable that was never assigned
    raise ValueError(
        "Could not find a four-cornered outline in the image; "
        "make sure the whole sheet is visible against a contrasting background."
    )


"""
Main Process of the Program
"""

# run the pre-processing stage: contrast-adjusted image, scale factor,
# down-scaled image and the Canny edge image
img_adj, scale, img_scaled, img_edge = preprocess(img)

# close incomplete outlines by drawing convex hulls over the edge image
img_hull = gethull(img_edge)

# locate the 4 corner points in the hull image and map them from the
# down-scaled image back onto the full-size image with the scale factor
corners = getcorners(img_hull).reshape(4, 2) * scale

# four-point perspective transform of the adjusted full-size image
img_corrected = perspective_transform(img_adj, corners)

# save the perspective-corrected image
cv2.imwrite("./corrected.png", img_corrected)

# thresholding works on a single channel, so convert to grayscale first
img_corrected = cv2.cvtColor(img_corrected, cv2.COLOR_BGR2GRAY)

# "-I" / "--inverted" on the command line selects an inverted binary image
# (and a different output file); otherwise a normal binary image is written
invert_output = args["inverted"] is not None
thresh_type = cv2.THRESH_BINARY_INV if invert_output else cv2.THRESH_BINARY
output_path = (
    "./thresholded_inverted.png" if invert_output else "./thresholded.png"
)

# simple binary thresholding for ease of further processing; 135 is the
# threshold value and 255 the value given to pixels that pass it
img_thresh = cv2.threshold(img_corrected, 135, 255, thresh_type)[1]

# save the binary image
cv2.imwrite(output_path, img_thresh)