使用 pytesseract 之前,需要先安装 Tesseract-OCR 引擎(tesseract 可执行程序),再安装 Python 包 pytesseract 和 Pillow(代码中的 PIL)。

from PIL import Image
from PIL import ImageEnhance
import pytesseract
import re
# If pytesseract reports that it cannot find Tesseract, point it at the
# executable explicitly. Both paths are machine-specific; adjust as needed.
TESSERACT_CMD = 'D:\\Program Files\\Tesseract-OCR\\tesseract.exe'
# Optional extra argument for Tesseract; pass it as ``config`` to
# ``recognize`` when the language data directory is not found automatically.
tessdata_dir_config = '--tessdata-dir "D:\\Program Files\\Tesseract-OCR\\tessdata"'

# ``\W`` alone still lets "_" through, so the underscore is listed explicitly.
_NON_ALNUM = re.compile(r"[\W_]+")


def clean_text(text):
    """Return *text* with every character that is not a letter or digit removed.

    Matching is Unicode-aware (the default for ``str`` patterns), so
    non-ASCII letters and digits are kept as well.
    """
    return _NON_ALNUM.sub("", text)


def recognize(path, contrast=1, config="", preview=True):
    """Run OCR on the image at *path* and return the cleaned-up text.

    The image is converted to greyscale, passed through a contrast
    enhancement with factor *contrast*, and handed to
    ``pytesseract.image_to_string``. The OCR output is then filtered with
    ``clean_text``.

    Args:
        path: Location of the image file to read.
        contrast: Factor given to ``ImageEnhance.Contrast(...).enhance``.
        config: Extra command-line options forwarded to Tesseract, e.g.
            ``tessdata_dir_config``.
        preview: When true, display the greyscale image and the enhanced
            image with ``Image.show`` (same two previews as before).

    Returns:
        The recognised text with non-alphanumeric characters stripped.
    """
    # The context manager closes the underlying file; ``convert`` returns a
    # separate image object that remains usable afterwards.
    with Image.open(path) as source:
        gray = source.convert('L')
    if preview:
        gray.show()

    enhanced = ImageEnhance.Contrast(gray).enhance(contrast)
    raw_text = pytesseract.image_to_string(enhanced, config=config)
    if preview:
        enhanced.show()

    return clean_text(raw_text)


def main():
    """Configure the Tesseract location and print the OCR result for the sample image."""
    pytesseract.pytesseract.tesseract_cmd = TESSERACT_CMD
    print(recognize("./img/10.jpg"))


if __name__ == "__main__":
    main()

 

相关文章:

  • 2021-12-27
  • 2021-09-21
  • 2021-11-18
  • 2021-11-28
  • 2020-01-03
猜你喜欢
  • 2021-11-18
  • 2021-05-18
  • 2021-11-07
  • 2022-12-23
  • 2022-12-23
  • 2021-05-23
相关资源
相似解决方案