willsonlincake 发表于 2022-4-14 00:29:55

Tesseract获取识别后的版面

from PIL import Image

import pytesseract



# Tell pytesseract which Tesseract executable to invoke.
tesseract_exe = r'C:/Users/Dell/AppData/Local/Tesseract-OCR/tesseract.exe'
pytesseract.pytesseract.tesseract_cmd = tesseract_exe

# Run OCR on the input image and keep the ALTO XML result in `xml`.
image_path = 'test.png'
xml = pytesseract.image_to_alto_xml(image_path)
页: [1]
查看完整版本: Tesseract获取识别后的版面