In [None]:
import os
import random

import cv2
import numpy as np
import PIL
from PIL import ImageFont
from PIL import Image
from PIL import ImageDraw, ImageChops, ImageFilter

In [None]:
# Constant definitions shared by page generation and tile cutting.
FONT_NAME = "FangZhengKaiTi.ttf"      # font file name, looked up under "fonts/"
FONT_SIZE = 40                        # glyph size handed to ImageFont.truetype
MARGIN_SIZE = 4                       # padding on each side of a glyph inside its cell
BOARDER_SIZE = 2                      # thickness of the outline drawn around the page
DOC_DIM = (16, 12)                    # grid size as (columns, rows)
FOREGROUND_COLOR = (255, 255, 255)    # canvas fill colour (white)
BACKGROUND_COLOR = (0, 0, 0)          # colour of the outline and the glyphs (black)
# Page size in pixels as (width, height): one (FONT_SIZE + 2*MARGIN_SIZE) square
# per grid cell along each axis, plus the outline on both sides.
IMAGE_SIZE = tuple(
    (FONT_SIZE + 2 * MARGIN_SIZE) * cells + 2 * BOARDER_SIZE
    for cells in DOC_DIM
)

In [None]:
def generate_doc(char, font_name, FONT_SIZE):
    """Render one page: an outlined canvas with characters placed on a grid.

    Only the inner cells of the DOC_DIM grid are filled (the outermost row and
    column on every side stay empty), in row-major order. Drawing stops when
    either the cells or the characters run out.

    Args:
        char: sequence of characters to draw; anything beyond the number of
            inner cells is ignored.
        font_name: path of the TrueType font file to load.
        FONT_SIZE: glyph size passed to ``ImageFont.truetype``. It only
            controls the glyph size; the cell pitch is derived from
            ``IMAGE_SIZE`` so the grid always tiles the canvas, even when
            this argument differs from the module-level font size.

    Returns:
        The rendered page as an RGB PIL image of size ``IMAGE_SIZE``.
    """
    img = Image.new("RGB", IMAGE_SIZE, FOREGROUND_COLOR)
    font = ImageFont.truetype(font_name, FONT_SIZE)
    draw = ImageDraw.Draw(img)
    draw.rectangle(
        xy=[(0, 0), (IMAGE_SIZE[0] - 1, IMAGE_SIZE[1] - 1)],
        outline=BACKGROUND_COLOR,
        width=BOARDER_SIZE,
    )

    # Cell pitch comes from the canvas itself rather than from the (shadowing)
    # FONT_SIZE argument, keeping the layout in step with IMAGE_SIZE.
    cell_w = (IMAGE_SIZE[0] - 2 * BOARDER_SIZE) // DOC_DIM[0]
    cell_h = (IMAGE_SIZE[1] - 2 * BOARDER_SIZE) // DOC_DIM[1]

    inner_cells = (
        (row, col)
        for row in range(1, DOC_DIM[1] - 1)
        for col in range(1, DOC_DIM[0] - 1)
    )
    # zip ends at the shorter of the two, so a short final page needs no
    # exception handling.
    for (row, col), glyph in zip(inner_cells, char):
        origin = (
            BOARDER_SIZE + col * cell_w + MARGIN_SIZE,
            BOARDER_SIZE + row * cell_h + MARGIN_SIZE,
        )
        draw.text(origin, glyph, BACKGROUND_COLOR, font=font)
    return img

In [None]:
# Generate the pages; press a key in the OpenCV window to move on to the next page.
# NOTE(review): the file is read with the platform default encoding — confirm it
# matches how data/frequent_chars.txt was saved.
with open('data/frequent_chars.txt', 'r') as chars_file:
    chars = chars_file.read()

# generate_doc fills only the inner cells of the grid (outer rows/columns stay
# empty), so a page holds (columns - 2) * (rows - 2) characters. Stepping by the
# full grid size would skip the characters that did not fit on each page.
chars_per_page = (DOC_DIM[0] - 2) * (DOC_DIM[1] - 2)
for i in range(0, len(chars), chars_per_page):
    image = generate_doc(chars[i:i + chars_per_page], "fonts/{}".format(FONT_NAME), FONT_SIZE)
    # PIL arrays are RGB; OpenCV's imshow expects BGR.
    img = cv2.cvtColor(np.asarray(image), cv2.COLOR_RGB2BGR)
    cv2.imshow("OpenCV", img)
    cv2.waitKey()
# Close the preview window once the last page has been shown.
cv2.destroyAllWindows()

In [None]:
def crop_image(image):
    """Locate the page outline in a photo, rectify it, and scale it to IMAGE_SIZE.

    The largest external contour in the Canny edge map is simplified with
    ``cv2.approxPolyDP``; its four corners are then mapped onto an axis-aligned
    rectangle with a perspective warp.

    Args:
        image: PIL image of the photographed page. It is converted to RGB
            before processing.

    Returns:
        A PIL image of size ``IMAGE_SIZE`` holding the rectified region.

    Raises:
        ValueError: if the edge map contains no contours, or the largest
            contour does not simplify to exactly four corners.
    """

    def order_points(pts):
        """Return the four points ordered as (tl, tr, br, bl) in float32."""
        rect = np.zeros((4, 2), dtype="float32")

        # Smallest x+y is taken as top-left, largest as bottom-right.
        s = pts.sum(axis=1)
        rect[0] = pts[np.argmin(s)]
        rect[2] = pts[np.argmax(s)]

        # np.diff along axis 1 gives y-x: smallest is taken as top-right,
        # largest as bottom-left.
        diff = np.diff(pts, axis=1)
        rect[1] = pts[np.argmin(diff)]
        rect[3] = pts[np.argmax(diff)]
        return rect

    def side_length(p, q):
        """Euclidean distance between two 2-D points."""
        return np.sqrt(((p[0] - q[0]) ** 2) + ((p[1] - q[1]) ** 2))

    def four_point_transform(pixels, pts):
        """Warp the quadrilateral ``pts`` of ``pixels`` onto an upright rectangle."""
        rect = order_points(pts)
        (tl, tr, br, bl) = rect

        # Output size: the longer of each pair of opposite sides.
        max_width = max(int(side_length(br, bl)), int(side_length(tr, tl)))
        max_height = max(int(side_length(tr, br)), int(side_length(tl, bl)))

        dst = np.array([
            [0, 0],
            [max_width - 1, 0],
            [max_width - 1, max_height - 1],
            [0, max_height - 1]], dtype="float32")

        matrix = cv2.getPerspectiveTransform(rect, dst)
        return cv2.warpPerspective(pixels, matrix, (max_width, max_height))

    # Normalise the mode so the array is always 3-channel R, G, B.
    pixels = np.asarray(image.convert("RGB"))

    # Edge map: blur, grayscale (RGB order, matching the PIL array), Canny.
    edge_img = cv2.GaussianBlur(pixels, (3, 3), 0)
    edge_img = cv2.cvtColor(edge_img, cv2.COLOR_RGB2GRAY)
    edge_img = cv2.Canny(edge_img, 50, 150, apertureSize=3)

    # findContours returns (image, contours, hierarchy) on OpenCV 3.x and
    # (contours, hierarchy) on 4.x; index -2 is the contour list in both.
    contours = cv2.findContours(edge_img, cv2.RETR_EXTERNAL, cv2.CHAIN_APPROX_SIMPLE)[-2]
    if len(contours) == 0:
        raise ValueError("crop_image: no contours found in the image")

    contour = max(contours, key=cv2.contourArea)
    epsilon = 0.1 * cv2.arcLength(contour, True)
    corners = cv2.approxPolyDP(contour, epsilon, True)
    if len(corners) != 4:
        raise ValueError(
            "crop_image: expected a 4-corner outline, got {} corner(s)".format(len(corners))
        )

    paper = four_point_transform(pixels, corners.reshape(4, 2))
    return Image.fromarray(paper).resize(IMAGE_SIZE)

def cut_chars(image):
    """Slice the inner grid cells of a page into individual tiles.

    Cells are squares of side ``FONT_SIZE + 2*MARGIN_SIZE`` offset by
    ``BOARDER_SIZE`` from the page origin. The outermost row and column on
    every side of the ``DOC_DIM`` grid are skipped.

    Args:
        image: object exposing ``crop((left, upper, right, lower))``.

    Returns:
        List of crops in row-major order (all columns of a row, then the next row).
    """
    cell = FONT_SIZE + 2 * MARGIN_SIZE
    tops = [BOARDER_SIZE + r * cell for r in range(1, DOC_DIM[1] - 1)]
    lefts = [BOARDER_SIZE + c * cell for c in range(1, DOC_DIM[0] - 1)]
    return [
        image.crop((x, y, x + cell, y + cell))
        for y in tops
        for x in lefts
    ]

def preprocess(image):
    """Turn a page photo into a list of character tiles.

    The photo is first passed through ``crop_image``; the result is then
    handed to ``cut_chars``, whose return value is returned unchanged.
    """
    page = crop_image(image)
    tiles = cut_chars(page)
    return tiles

In [None]:
CURRENT_FONT = '__test__'
photo_dir = os.path.join('data/doc_photo', CURRENT_FONT)
output_dir = os.path.join('data/char_photo', CURRENT_FONT)
# Saving fails if the destination folder is missing, so create it up front.
os.makedirs(output_dir, exist_ok=True)

chars = []
# os.listdir returns entries in arbitrary order; sorting makes the tile indices
# reproducible between runs. The sort is lexicographic ("10.jpg" comes before
# "2.jpg"), so zero-pad page file names if page order matters.
for photo_name in sorted(os.listdir(photo_dir)):
    # The context manager closes the source file once its tiles are extracted.
    with Image.open(os.path.join(photo_dir, photo_name)) as photo:
        chars += preprocess(photo)
for idx, tile in enumerate(chars):
    tile.save(os.path.join(output_dir, str(idx) + '.jpg'))