pip install "paddleocr>=2.0.1"
对图像进行识别
from paddleocr import PaddleOCR, draw_ocr
from PIL import Image
if __name__ == '__main__':
    # Local import: only this script body needs it.
    import os

    img_path = 'demo/demo_kie.jpeg'
    output_path = 'output/result5.jpg'

    # `lang` selects the recognition language ('ch' here).
    ocr = PaddleOCR(use_angle_cls=True, lang='ch')

    # Full pipeline: text detection followed by text recognition.
    result = ocr.ocr(img_path, cls=True)
    for line in result:
        print(line)

    # Each entry is indexed as entry[0] -> box and entry[1] -> (text, score).
    # NOTE(review): newer PaddleOCR releases appear to wrap the result in one
    # extra per-image list -- confirm against the installed version.
    image = Image.open(img_path).convert('RGB')
    boxes = [line[0] for line in result]
    txts = [line[1][0] for line in result]
    scores = [line[1][1] for line in result]

    # Draw the boxes, texts and scores onto the image.
    im_show = draw_ocr(image, boxes, txts, scores,
                       font_path='data/chineseocr/labels/font.TTF')
    im_show = Image.fromarray(im_show)

    # Image.save does not create missing directories, so make sure the
    # output directory exists before writing the visualisation.
    os.makedirs(os.path.dirname(output_path), exist_ok=True)
    im_show.save(output_path)
这里的PaddleOCR(use_angle_cls=True, lang='ch')中的lang可以是很多种语言,比如`ch`, `en`, `fr`, `german`, `korean`, `japan`。
这里既包含了文字检测,也包含了文本识别,一般结果如下
但如果是一张比较简单的文字图片,如
这个时候,我们只需要识别,无需检测
from paddleocr import PaddleOCR, draw_ocr
if __name__ == '__main__':
    # Recognition-only example: the input is expected to be a simple text
    # image, so text detection is switched off with det=False.
    img_path = 'demo/demo_text_recog.jpg'
    recognizer = PaddleOCR(use_angle_cls=True, lang='en')

    # Print every entry returned for the image.
    for item in recognizer.ocr(img_path, cls=True, det=False):
        print(item)
运行结果(部分)
('STAR', 0.8838256597518921)
{{o.name}}
{{m.name}}