# paper_detection.py

__author__ = 'zhangm2'

import cv2
import numpy
from imutil import show_img
from custom_exceptions import PaperDetectionError

# When True, the functions in this module display intermediate images through
# show_img at each processing stage (and draw debug overlays on them).
DEBUG = True
# Output size, in pixels, of the perspective-corrected image returned by
# get_paper (used as the destination size of the warp).
# NOTE: "HIEGHT" is a misspelling of "HEIGHT"; the name is left unchanged
# because code outside this file may reference it.
ANS_REGION_HIEGHT = 1125
ANS_REGION_WIDTH = 1155

def _assign_corners(quad):
    """Label the four vertices of a quadrilateral contour by quadrant.

    Each vertex is classified relative to the center of the contour's
    axis-aligned bounding box: right if ``x >= center_x`` (else left) and
    low if ``y >= center_y`` (else up).

    Keyword arguments:
    quad -- contour array of shape (4, 1, 2) as returned by cv2.approxPolyDP

    Returns the tuple (upLeft, lowLeft, upRight, lowRight), each an (x, y) array.
    Raises PaperDetectionError if two vertices fall into the same quadrant,
    because the corners then cannot be labelled unambiguously.
    """
    xs = quad[:, 0, 0]
    ys = quad[:, 0, 1]
    center_x = (xs.max() + xs.min()) / 2
    center_y = (ys.max() + ys.min()) / 2

    corners = {}
    for point in quad:
        x, y = point[0]
        vertical = 'low' if y >= center_y else 'up'
        horizontal = 'Right' if x >= center_x else 'Left'
        corners[vertical + horizontal] = point[0]

    # With exactly four vertices, a missing label means another quadrant
    # received two of them.
    if len(corners) != 4:
        raise PaperDetectionError('Could not assign the corners of the detected answer region')
    return corners['upLeft'], corners['lowLeft'], corners['upRight'], corners['lowRight']


def get_paper(img):
    """Locate the answer region in ``img`` and return it perspective-corrected.

    The image is downscaled, converted to gray scale, blurred and adaptively
    thresholded; the answer region contour is then searched for starting from
    the largest contour, approximated to a quadrilateral, and warped from the
    full-resolution input to a fixed-size image.

    Keyword arguments:
    img -- the input color image (a 3-channel array accepted by cv2.cvtColor)

    Returns an image of ANS_REGION_WIDTH x ANS_REGION_HIEGHT pixels.
    Raises PaperDetectionError if no contour is found, the detected region is
    too small, it is not a quadrilateral, or its corners cannot be labelled.
    """
    # Work on a half-size copy; corner coordinates are scaled back by `ratio`
    # before warping the original image.
    ratio = .5
    resizedImg = cv2.resize(img, (0, 0), fx=ratio, fy=ratio)
    if DEBUG:
        show_img(resizedImg)

    # Convert to gray scale
    # NOTE(review): cv2.imread yields BGR channel order; if callers load the
    # image that way, COLOR_BGR2GRAY would be the matching code -- confirm.
    gray = cv2.cvtColor(resizedImg, cv2.COLOR_RGB2GRAY)
    if DEBUG:
        show_img(gray)

    # Gaussian Blur
    gray = cv2.GaussianBlur(gray, (7, 7), 0)
    if DEBUG:
        show_img(gray)

    # Adaptive Threshold
    gray = cv2.adaptiveThreshold(gray, 255, cv2.ADAPTIVE_THRESH_GAUSSIAN_C, cv2.THRESH_BINARY, 11, 2)
    if DEBUG:
        show_img(gray)

    # Find contours. findContours returns (image, contours, hierarchy) in
    # OpenCV 3.x but (contours, hierarchy) in 2.x and 4.x; the last two items
    # are the same in every version.
    ret, thresh = cv2.threshold(gray, 127, 255, 0)
    contrs, hier = cv2.findContours(thresh, cv2.RETR_TREE, cv2.CHAIN_APPROX_SIMPLE)[-2:]
    if len(contrs) == 0 or hier is None:
        raise PaperDetectionError('No contours found in the image')

    # Find the largest contour
    index_of_largest_contour = get_index_of_largest_contour(contrs)
    largest_contour = contrs[index_of_largest_contour]
    image_size = gray.shape[0] * gray.shape[1]

    if DEBUG:
        cv2.drawContours(resizedImg, [largest_contour], -1, (255, 0, 0), 3)
        show_img(resizedImg)

    # Approximate the answer region contour to a polygon
    final_contr = get_answer_region_contour(contrs, hier[0], index_of_largest_contour, resizedImg)
    epsilon = 0.1 * cv2.arcLength(final_contr, True)
    final_contr = cv2.approxPolyDP(final_contr, epsilon, True)
    # Assuming the answer region takes up a noticeable part of the image.
    # If the detected region is too small compared to the image (<5%),
    # we probably didn't find the paper.
    if cv2.contourArea(final_contr) / image_size < 0.05:
        raise PaperDetectionError('No answer region of the right size found')
    if len(final_contr) != 4:
        raise PaperDetectionError('Detected answer region cannot be approximated to a quadrilateral')

    # Draw Contours & corners
    if DEBUG:
        cv2.drawContours(resizedImg, [final_contr], -1, (0, 255, 0), 3)
        for point in final_contr:
            # Plain ints: drawing functions may reject numpy scalar coordinates.
            cv2.circle(resizedImg, (int(point[0][0]), int(point[0][1])), 5, (255, 0, 255))
        show_img(resizedImg)

    # Assign each corner
    upLeft, lowLeft, upRight, lowRight = _assign_corners(final_contr)

    height = ANS_REGION_HIEGHT
    width = ANS_REGION_WIDTH

    # Perspective Transform: corners were found on the downscaled image, so
    # divide by `ratio` to express them in original-image coordinates.
    origPts = numpy.float32([upLeft / ratio, lowLeft / ratio, upRight / ratio, lowRight / ratio])
    newPts = numpy.float32([[0, 0], [0, height - 1], [width - 1, 0], [width - 1, height - 1]])
    mat = cv2.getPerspectiveTransform(origPts, newPts)
    return cv2.warpPerspective(img, mat, (width, height))

def get_index_of_largest_contour(contours):
    """Return the index of the contour with the largest area.

    Keyword arguments:
    contours -- a sequence of contours accepted by cv2.contourArea

    When several contours share the largest area the first one wins;
    an empty sequence yields index 0.
    """
    areas = [cv2.contourArea(candidate) for candidate in contours]
    if not areas:
        return 0
    # list.index returns the first occurrence, i.e. the earliest largest contour.
    return areas.index(max(areas))

def get_answer_region_contour(contours, hier, i, img):
    """Find the contour enclosing the answer region.

    Starting from contours[i], repeatedly descend to the first child contour
    that occupies more than 20% of the area of its direct parent, until the
    current contour has no such child; that contour is returned.

    Keyword arguments:
    contours -- the list of all contours
    hier -- contour tree hierarchy returned by cv2.findContours (one row per
            contour; column 0 is the next sibling, column 2 the first child,
            negative when absent)
    i -- the index of the current contour candidate
    img -- image the visited contours are drawn on when DEBUG is set
    """
    current = i
    while True:
        if DEBUG:
            cv2.drawContours(img, [contours[current]], -1, (0, 255, 0), 3)
            show_img(img)

        # If this contour does not have a child, simply return it
        child_index = hier[current][2]
        if child_index < 0:
            return contours[current]

        parent_area = cv2.contourArea(contours[current])
        # A degenerate (zero-area) parent cannot be compared against its
        # children; stop here instead of dividing by zero.
        if parent_area <= 0:
            return contours[current]

        # Walk the first child and then its siblings, looking for the first
        # one that occupies more than 20% of the parent's area.
        chosen = -1
        while child_index >= 0:
            if cv2.contourArea(contours[child_index]) / parent_area > 0.2:
                chosen = child_index
                break
            child_index = hier[child_index][0]

        # If no suitable child is found, the current contour is the answer
        if chosen < 0:
            return contours[current]
        current = chosen