X-Nicolo
diff --git a/‎my01-OCR文字识别/Tessract-OCR/README.md‎
Lines changed: 2 additions & 0 deletions b/‎my01-OCR文字识别/Tessract-OCR/README.md‎
Lines changed: 2 additions & 0 deletions
diff --git a/‎my01-OCR文字识别/Tessract-OCR/ocr.py‎ renamed to ‎my01-OCR文字识别/Tessract-OCR/pytesseract/ocr.py‎ b/‎my01-OCR文字识别/Tessract-OCR/ocr.py‎ renamed to ‎my01-OCR文字识别/Tessract-OCR/pytesseract/ocr.py‎
diff --git a/‎my01-OCR文字识别/Tessract-OCR/tesserocr/sample.jpg‎
1.51 KB b/‎my01-OCR文字识别/Tessract-OCR/tesserocr/sample.jpg‎
1.51 KB
diff --git a/‎my01-OCR文字识别/Tessract-OCR/tesserocr/sample1.jpeg‎
1.18 KB b/‎my01-OCR文字识别/Tessract-OCR/tesserocr/sample1.jpeg‎
1.18 KB
diff --git a/‎my01-OCR文字识别/Tessract-OCR/tesserocr/sample2.jpeg‎
1.18 KB b/‎my01-OCR文字识别/Tessract-OCR/tesserocr/sample2.jpeg‎
1.18 KB
diff --git a/‎my01-OCR文字识别/Tessract-OCR/tesserocr/sample3.jpeg‎
1.27 KB b/‎my01-OCR文字识别/Tessract-OCR/tesserocr/sample3.jpeg‎
1.27 KB
diff --git a/‎my01-OCR文字识别/Tessract-OCR/tesserocr/tesserocr_demo1.py‎
Lines changed: 21 additions & 0 deletions b/‎my01-OCR文字识别/Tessract-OCR/tesserocr/tesserocr_demo1.py‎
Lines changed: 21 additions & 0 deletions
diff --git a/‎my01-OCR文字识别/Tessract-OCR/tesserocr/tesserocr_demo2.py‎
Lines changed: 17 additions & 0 deletions b/‎my01-OCR文字识别/Tessract-OCR/tesserocr/tesserocr_demo2.py‎
Lines changed: 17 additions & 0 deletions
diff --git a/‎my01-OCR文字识别/Tessract-OCR/tesserocr/tesserocr_demo3.py‎
Lines changed: 22 additions & 0 deletions b/‎my01-OCR文字识别/Tessract-OCR/tesserocr/tesserocr_demo3.py‎
Lines changed: 22 additions & 0 deletions
@@ -7,7 +7,9 @@ http://www.pyimagesearch.com/2017/07/10/using-tesseract-ocr-python/
 * ubuntu: sudo apt-get install tesseract-ocr
 * pip install pillow
 * pip install pytesseract
+* pip install tesserocr
 
+# tesserocr更好用
 
 ## 运行
 * 标准输出，不用输出到TXT文件:
 
@@ -0,0 +1,21 @@
+# -*-coding:utf8-*-#
+# Demo: OCR several sample images in turn, reusing a single PyTessBaseAPI instance.
+__author__ = 'play4fun'
+"""
+create time:16/10/21 11:44
+"""
+
+from tesserocr import PyTessBaseAPI
+
+images = ['/Volumes/GF/Project/Python/Tesserocr/tesserocr/sample1.jpeg', '/Volumes/GF/Project/Python/Tesserocr/tesserocr/sample2.jpeg',
+          '/Volumes/GF/Project/Python/Tesserocr/tesserocr/sample3.jpeg']  # hard-coded absolute paths (presumably the author's local volume) - adjust before running
+
+with PyTessBaseAPI() as api:
+    for img in images:
+        api.SetImageFile(img)  # hand the image to the API by file path
+        print('text:', api.GetUTF8Text())  # recognized text for the current image
+        print('-----')
+        print(api.AllWordConfidences())  # confidence values for the recognized words
+        print('-----')
+# The API is finalized automatically when used in a with-statement (context manager);
+# otherwise api.End() must be called explicitly once the API is no longer needed.
@@ -0,0 +1,17 @@
+# -*-coding:utf8-*-#
+# Demo: print tesseract version/language info, then OCR sample.jpg via tesserocr's module-level helpers.
+__author__ = 'play4fun'
+"""
+create time:16/10/21 11:47
+"""
+
+import tesserocr
+from PIL import Image
+
+print(tesserocr.tesseract_version())  # print tesseract-ocr version
+print(tesserocr.get_languages())  # prints tessdata path and list of available languages
+
+image = Image.open('sample.jpg')  # relative path: resolved against the current working directory
+print(tesserocr.image_to_text(image))  # print ocr text from image
+# Alternatively, pass the file path directly and skip the explicit PIL load:
+print(tesserocr.file_to_text('sample.jpg'))
@@ -0,0 +1,22 @@
+# -*-coding:utf8-*-#
+# Demo: analyse page layout with PSM.AUTO_OSD and print the orientation values it reports.
+__author__ = 'play4fun'
+"""
+create time:16/10/21 11:47
+"""
+# Orientation and script detection (OSD)
+
+from PIL import Image
+from tesserocr import PyTessBaseAPI, PSM
+
+with PyTessBaseAPI(psm=PSM.AUTO_OSD) as api:
+    image = Image.open("/usr/src/tesseract/testing/eurotext.tif")  # NOTE(review): original comment read "No such file" - presumably this path is missing locally; point it at a real image
+    api.SetImage(image)  # hand the already-loaded PIL image to the API
+    api.Recognize()
+
+    it = api.AnalyseLayout()  # layout result object queried for orientation below
+    orientation, direction, order, deskew_angle = it.Orientation()  # unpacks four values: three printed as integers, one as a float
+    print("Orientation: {:d}".format(orientation))
+    print("WritingDirection: {:d}".format(direction))
+    print("TextlineOrder: {:d}".format(order))
+    print("Deskew angle: {:.4f}".format(deskew_angle))