-
Notifications
You must be signed in to change notification settings - Fork 183
/
windows_media_ocr_impl.py
67 lines (46 loc) · 1.9 KB
/
windows_media_ocr_impl.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
import asyncio
import base64
from PIL import ImageOps
from winrt.windows.globalization import Language
from winrt.windows.graphics.imaging import SoftwareBitmap, BitmapAlphaMode, BitmapPixelFormat
# pip3 install winrt
from winrt.windows.media.ocr import OcrEngine
from winrt.windows.security.cryptography import CryptographicBuffer
from .common import *
def _dump_rect(rtrect):
    """Copy the x/y/width/height of a rect-like object into a ``Rect``.

    ``Rect`` is not defined in this file; presumably it comes from the
    ``.common`` star import.
    """
    left, top = rtrect.x, rtrect.y
    width, height = rtrect.width, rtrect.height
    return Rect(left, top, width, height)
def _dump_ocrword(word):
    """Build an ``OcrWord`` from a word's bounding rect and its text."""
    bounds = _dump_rect(word.bounding_rect)
    return OcrWord(bounds, word.text)
def _dump_ocrline(line):
    """Build an ``OcrLine`` holding the converted form of every word in *line*."""
    return OcrLine([_dump_ocrword(item) for item in line.words])
def _dump_ocrresult(ocrresult):
    """Convert an engine result into an ``OcrResult``.

    Every line of *ocrresult* is converted with ``_dump_ocrline``. When the
    source result carries a truthy ``text_angle``, its ``.value`` is copied
    onto the returned object; otherwise ``text_angle`` is left untouched.
    """
    converted = OcrResult([_dump_ocrline(entry) for entry in ocrresult.lines])
    if not ocrresult.text_angle:
        return converted
    # text_angle is a wrapper object here; only the wrapped value is kept.
    converted.text_angle = ocrresult.text_angle.value
    return converted
def _ibuffer(s):
    """Create a WinRT IBuffer instance from a bytes-like object.

    The bytes are encoded as base64 text, which
    ``CryptographicBuffer.decode_from_base64_string`` turns back into a
    buffer object.
    """
    encoded = base64.b64encode(s)
    b64_text = encoded.decode('ascii')
    return CryptographicBuffer.decode_from_base64_string(b64_text)
def _swbmp_from_pil_image(img):
    """Create a ``SoftwareBitmap`` holding a copy of *img*'s pixels.

    The image is converted to mode "RGBA" when it is not already, so the raw
    bytes match the RGBA8 / straight-alpha format declared to WinRT.
    """
    rgba = img if img.mode == "RGBA" else img.convert("RGBA")
    pixel_buffer = _ibuffer(rgba.tobytes())
    return SoftwareBitmap.create_copy_from_buffer(
        pixel_buffer,
        BitmapPixelFormat.RGBA8,
        rgba.width,
        rgba.height,
        BitmapAlphaMode.STRAIGHT,
    )
async def _ensure_coroutine(awaitable):
return await awaitable
def _blocking_wait(awaitable):
    """Block until *awaitable* completes and return its result.

    The awaitable is wrapped by ``_ensure_coroutine`` and driven to
    completion with ``asyncio.run``.
    """
    coro = _ensure_coroutine(awaitable)
    return asyncio.run(coro)
def recognize(img, lang, *, hints=None):
    """Run the Windows OCR engine on a PIL image and return the converted result.

    Args:
        img: PIL image to recognize.
        lang: language tag handed to ``Language(...)`` to select the engine.
        hints: optional collection of ``OcrHint`` values. When it contains
            ``OcrHint.SINGLE_LINE`` the image is padded before recognition.

    Returns:
        The value produced by ``_dump_ocrresult`` for the engine's result.

    Raises:
        ValueError: if the OCR engine reports *lang* as unsupported.
        RuntimeError: if no engine could be created for *lang*.
    """
    if hints is None:
        hints = []
    if OcrHint.SINGLE_LINE in hints:
        # Surround the image with a 32-pixel border filled with the colour of
        # its top-left pixel.
        # NOTE(review): presumably this gives the engine some margin around a
        # tightly cropped line - confirm.
        img = ImageOps.expand(img, 32, fill=img.getpixel((0, 0)))
    language = Language(lang)
    # Explicit raise instead of ``assert``: assertions are stripped under
    # ``python -O``, which would let an unsupported language slip through.
    if not OcrEngine.is_language_supported(language):
        raise ValueError(f"OCR language not supported: {lang!r}")
    engine = OcrEngine.try_create_from_language(language)
    if engine is None:
        # try_create_* may yield no engine; fail here with a clear message
        # rather than with an AttributeError on the next line.
        raise RuntimeError(f"failed to create OCR engine for language: {lang!r}")
    bitmap = _swbmp_from_pil_image(img)
    return _dump_ocrresult(_blocking_wait(engine.recognize_async(bitmap)))