OliveSensorAPI/IOTLLM/generate_data/EC_process/processPDF/OCR.py

# -*- coding: utf-8 -*-
# @Time : 2024/10/18 22:09
# @Author : 黄子寒
# @Email : 1064071566@qq.com
# @File : OCR.py
# @Project : EmoLLM
import cv2
from paddleocr import PaddleOCR
import os
import glob

# 初始化OCR模型
# Initialise the OCR model once (angle classifier enabled, Chinese language
# model); the same instance is reused for every image below.
ocr = PaddleOCR(use_angle_cls=True, lang='ch')


# Input directory of page images and output directory for recognised text.
image_dir = "output"
output_txt_dir = "output_txt"


# exist_ok=True avoids the check-then-create race of exists() + makedirs().
os.makedirs(output_txt_dir, exist_ok=True)

image_list = glob.glob(os.path.join(image_dir, "*.png"))

# Batch recognition: each PNG produces one .txt file with one text line per
# recognised entry.
for img_path in image_list:
    # Load the image. cv2.imread signals failure by returning None instead
    # of raising, so check explicitly and keep the batch going.
    img = cv2.imread(img_path)
    if img is None:
        print(f"Skipping unreadable image: {img_path}")
        continue

    # Run OCR on the decoded image.
    result = ocr.ocr(img)

    # Image file name without its extension.
    img_name = os.path.splitext(os.path.basename(img_path))[0]

    # The text file mirrors the image name inside the output directory.
    txt_file_path = os.path.join(output_txt_dir, f"{img_name}.txt")

    # Write the recognised text; an image without text yields an empty file.
    with open(txt_file_path, 'w', encoding='utf-8') as f:
        # The result holds one entry per page, and PaddleOCR reports a page
        # with no detected text as None, so guard before iterating.
        for line in result or []:
            if not line:
                continue
            for word_info in line:
                # word_info[1] carries the recognised text and its confidence.
                word, confidence = word_info[1][0], word_info[1][1]

                f.write(f"{word}\n")

                print(f" {word}, C: {confidence}")

    print(f"{txt_file_path}")
自定义数据集处理脚本 2024-11-11 17:32:36 +08:00			`# -- coding: utf-8 --`
			`# @Time : 2024/10/18 22:09`
			`# @Author : 黄子寒`
			`# @Email : 1064071566@qq.com`
			`# @File : OCR.py`
			`# @Project : EmoLLM`
			`import cv2`
			`from paddleocr import PaddleOCR`
			`import os`
			`import glob`

			`# 初始化OCR模型`
			`ocr = PaddleOCR(use_angle_cls=True, lang='ch')`


			`image_dir = "output"`
			`output_txt_dir = "output_txt"`


			`if not os.path.exists(output_txt_dir):`
			`os.makedirs(output_txt_dir)`

			`image_list = glob.glob(os.path.join(image_dir, "*.png"))`

			`# 批量识别处理`
			`for img_path in image_list:`
			`# 读取图像`
			`img = cv2.imread(img_path)`

			`# 使用OCR模型进行识别`
			`result = ocr.ocr(img)`

			`# 获取图像文件名（不带扩展名）`
			`img_name = os.path.splitext(os.path.basename(img_path))[0]`

			`# 将OCR结果整理为文本`
			`txt_file_path = os.path.join(output_txt_dir, f"{img_name}.txt")`

			`# 打开文件以写入OCR结果`
			`with open(txt_file_path, 'w', encoding='utf-8') as f:`
			`for line in result:`
			`for word_info in line:`
			`# 提取识别到的文本和其置信度`
			`word, confidence = word_info[1][0], word_info[1][1]`

			`f.write(f"{word}\n")`

自定义数据集处理脚本 2024-12-10 23:37:45 +08:00			`print(f" {word}, C: {confidence}")`
自定义数据集处理脚本 2024-11-11 17:32:36 +08:00
			`print(f"{txt_file_path}")`