[OCR][Python]測試tesseract與easyOCR誰比較準跟快

螃蟹_crab

2024/06/01閱讀時間約 17 分鐘

平時都在用tesseract來辨識OCR的部分，在網路上也常常聽說easyOCR比tesseract好用，就拿之前測試的OCR素材來比較看看囉。

以下輸入同樣圖片直接測試，並非絕對誰就比較準，只單純測試數字含英文的部分。

圖片素材就是15碼(英文加數字)，檔名為OCR正確結果

保密原則，只好模糊掉數字跟英文

Tesseract 測試結果

Easy OCR 測試結果

Tesseract 程式範例

輸入的圖片檔名，OCR_數字為正確的OCR

讀圖辨識結果與檔名比較，得知誤判率

import os
import pytesseract
from PIL import Image
import re
import time
import numpy as np
from collections import Counter
import cv2

def find_errors(ocr_results, file_names):
    error_details = []

    for ocr, file_name in zip(ocr_results, file_names):
        if ocr != file_name:
            error_positions = [(i, a, b) for i, (a, b) in enumerate(zip(ocr, file_name)) if a != b]
            error_details.append({"ocr": ocr, "file_name": file_name, "error_positions": error_positions})

    return error_details

def rename_images():
    res_str = 0
    ocr_results = []  # 你的OCR結果清單
    file_names = []  # 你的檔案名稱清單
    all_time = 0
    all_count = 0
    '''
    Change File Name -> OCR.Png
    '''
    folder_path = "D:/SaveImg/PSN/20240531"
    valid_extensions = [".jpg", ".png", ".jpeg"]

    pytesseract.pytesseract.tesseract_cmd = r"tesseract路徑"
    config = f'--oem 3 --psm 7'
    image_files = [f for f in os.listdir(folder_path) if os.path.isfile(os.path.join(folder_path, f)) and any(f.lower().endswith(ext) for ext in valid_extensions)]
    files = [f for f in os.listdir(folder_path) if os.path.isfile(os.path.join(folder_path, f)) and f.lower().endswith(".png")]
    
    for i, (image_file, file_1) in enumerate(zip(image_files, files)):

        _, extension = os.path.splitext(image_file)
        original_path = os.path.join(folder_path, image_file)
        file = file_1.split('_')[0]
        # 使用 pytesseract 讀取文字
        try:
            start_time = time.time()
            img = cv2.imread(original_path)
            gray = cv2.cvtColor(img, cv2.COLOR_BGR2GRAY)
            labels = cv2.threshold(gray, 0, 255, cv2.THRESH_BINARY_INV + cv2.THRESH_OTSU)[1]
            ocr_text = pytesseract.image_to_string(labels, lang="eng", config=config)
            print(ocr_text)
        except Exception as e:
            print(f"Error reading text from {image_file}: {e}")
            continue
                
        ocr_text = ocr_text.strip()
        # print(f'辨識到的OCR:{ocr_text}')
        ocr_results.append(ocr_text)  # 你的OCR結果清單
        file_names.append(file)  # 你的檔案名稱清單        
        if ocr_text == file:
            res_str += 1

        end_time = time.time()
        elapsed_time = end_time - start_time
        all_time += elapsed_time
        print(f"處理 第{i} 張圖片共花費 {elapsed_time:.2f} 秒")

    print(f'準確率:{(res_str/(i + 1) )*100}%,總共測試了{i + 1}張,誤判{((i + 1)-res_str)}張')

    error_details = find_errors(ocr_results, file_names)
    print("錯誤字母詳細資訊：")
    for error in error_details:
        print(f"OCR: {error['ocr']}, 檔案名稱: {error['file_name']}, 錯誤位置: {error['error_positions']}")
    # 統計重複的錯誤位置及其次數
    error_positions_counter = Counter([pos for error in error_details for pos in error["error_positions"]])
    print("錯誤位置及其次數：")
    for position, count in error_positions_counter.items():
        print(f"位置 {position}: {count} 次")
        all_count += count
    print(f'總花費時間:{all_time}秒，單測項平均時間:{round((all_time/i),3)}秒')
    print(f'誤判率 :{round(all_count/(i*15),2)*100}%')
    print(f'總字元數:{i*15}，誤判總字元數:{all_count}')
        
if __name__ == "__main__":
    rename_images()

Easy OCR程式範例

import os
from PIL import Image
import re
import time
import numpy as np
from collections import Counter
import easyocr
import cv2

def find_errors(ocr_results, file_names):
    error_details = []

    for ocr, file_name in zip(ocr_results, file_names):
        if ocr != file_name:
            error_positions = [(i, a, b) for i, (a, b) in enumerate(zip(ocr, file_name)) if a != b]
            error_details.append({"ocr": ocr, "file_name": file_name, "error_positions": error_positions})

    return error_details

def rename_images():
    res_str = 0
    ocr_results = []  # 你的OCR結果清單
    file_names = []  # 你的檔案名稱清單
    all_time = 0
    all_count = 0
    count = 0
    '''
    Change File Name -> OCR.Png
    '''
    folder_path = "圖片路徑"
    valid_extensions = [".jpg", ".png", ".jpeg"]
    reader = easyocr.Reader(['ch_sim','en'], gpu=False) # this needs to run only once to load the model into memory

    image_files = [f for f in os.listdir(folder_path) if os.path.isfile(os.path.join(folder_path, f)) and any(f.lower().endswith(ext) for ext in valid_extensions)]
    files = [f for f in os.listdir(folder_path) if os.path.isfile(os.path.join(folder_path, f)) and f.lower().endswith(".png")]
    
    for i, (image_file, file_1) in enumerate(zip(image_files, files)):

        _, extension = os.path.splitext(image_file)
        original_path = os.path.join(folder_path, image_file)
        file = file_1.split('_')[0]
        # 使用 pytesseract 讀取文字
        try:
            start_time = time.time()
            img = cv2.imread(original_path)
            gray = cv2.cvtColor(img, cv2.COLOR_BGR2GRAY)
            labels = cv2.threshold(gray, 0, 255, cv2.THRESH_BINARY_INV + cv2.THRESH_OTSU)[1]
            ocr_text = reader.readtext(labels, detail = 0)
            print(ocr_text)
        except Exception as e:
            print(f"Error reading text from {image_file}: {e}")
            continue
        # 使用 join 方法將列表轉換為字符串
        result_string = ''.join(ocr_text)
        # print(f'辨識到的OCR:{ocr_text}')
        ocr_results.append(result_string)  # 你的OCR結果清單
        file_names.append(file)  # 你的檔案名稱清單        
        if ocr_text == file:
            res_str += 1

        end_time = time.time()
        elapsed_time = end_time - start_time
        all_time += elapsed_time
        print(f"處理 第{i} 張圖片共花費 {elapsed_time:.2f} 秒")

    print(f'準確率:{(res_str/(i + 1) )*100}%,總共測試了{i + 1}張,誤判{((i + 1)-res_str)}張')

    error_details = find_errors(ocr_results, file_names)
    print("錯誤字母詳細資訊：")
    for error in error_details:
        print(f"OCR: {error['ocr']}, 檔案名稱: {error['file_name']}, 錯誤位置: {error['error_positions']}")
    # 統計重複的錯誤位置及其次數
    error_positions_counter = Counter([pos for error in error_details for pos in error["error_positions"]])
    print("錯誤位置及其次數：")
    for position, count in error_positions_counter.items():
        print(f"位置 {position}: {count} 次")
        all_count += count
    print(f'總花費時間:{all_time}秒，單測項平均時間:{round((all_time/i),3)}秒')
    print(f'誤判率 :{round(all_count/(i*15),2)*100}%')
    print(f'總字元數:{i*15}，誤判總字元數:{all_count}')
        
if __name__ == "__main__":
    rename_images()

螃蟹_crab的沙龍AI深度學習筆記視覺辨識

螃蟹_crab的沙龍

119會員

201內容數

本業是影像辨識軟體開發，閒暇時間進修AI相關內容，將學習到的內容寫成文章分享。

留言0

查看全部

發表第一個留言支持創作者！

螃蟹_crab的沙龍的其他內容

[深度學習][Python]多層感知器（MLP）模型使用不同激活函數（ReLU 和 Sigmoid）的效果

本文將展示使用不同激活函數（ReLU 和 Sigmoid）的效果。一個簡單的多層感知器（MLP）模型來對 Fashion-MNIST 資料集進行分類。函數定義 Sigmoid 函數 Sigmoid 函數將輸入壓縮到 0到 1 之間：特性：輸出範圍是 (0,1)(0, 1)(0,1

#ReLU和Sigmoid #多層感知器 #MLP

[深度學習][Python]使用簡單的神經網路來訓練辨識fashion_mnist資料

本文主要介紹神經網路訓練辨識的過程，利用fashion_mnist及簡單的神經網路來進行分類。使用只有兩層的神經網路來訓練辨識fashion_mnist資料。

#fashion #神經網路 #深度學習

[Python][人臉辨識]應用Deepface辨識臉部情緒

本文主要應用deepface的正面（frontal）人臉檢測的預設模型，使用analyze 函數，用於分析一張人臉圖像的情感（emotion）。在Colab上實現，若用其他平台需稍微修改程式碼。 Deepface Deepface是一個輕量級的Python人臉辨識和臉部屬性分析

#人臉辨識 #人臉辨識應用 #Deepface

[OCR_應用]Tesseract-OCR_Config說明

Google Tesseract Config說明，程式範例實際修改示範前言 Tesseract 的 config 檔案用於指定 OCR 引擎的設定和參數。這些參數可以影響文本識別的結果本文將彙整常用參數調整，並呈現不同參數出現不同的辨識結果官網Tesseract OCR參數說明連結

#OCR應用 #Tesseract #pytesseract

[OCR_應用]Tesseract-OCR_擷取字元面積

使用Google Tesseract應用，擷取圖像的OCR並將讀取到的字元標註在原圖上光學字元辨識功能 (Optical character recognition，光學字符辨識）可以將影像中特徵範圍內的文本轉換為數字形式的文本。使用前必須安装Google Tesseract並更新

#OCR應用 #Tesseract #OCR長寬面積

[Python][物件辨識]Yolo v8_Streamlit_網頁預測

python Streamlit連動github程式碼實現YoloV8網頁版偵測物件先致敬，YoloV8原作Github程式碼 Streamlit網頁實現YoloV8 偵測物件套用模型為YoloV8(YOLOv8n)最小模型，因github上傳檔案最大上限為25mb 導入圖像(搜尋街景

#yolov8 #Stramlit網頁 #物件偵測

[深度學習][Python]多層感知器（MLP）模型使用不同激活函數（ReLU 和 Sigmoid）的效果

#ReLU和Sigmoid #多層感知器 #MLP

[深度學習][Python]使用簡單的神經網路來訓練辨識fashion_mnist資料

本文主要介紹神經網路訓練辨識的過程，利用fashion_mnist及簡單的神經網路來進行分類。使用只有兩層的神經網路來訓練辨識fashion_mnist資料。

#fashion #神經網路 #深度學習

「天天秋嗨嗨」：vocus 秋季徵文，五大主題 & 獎品登場！

這個秋，Chill 嗨嗨！穿搭美美去賞楓，裝備款款去露營⋯⋯你的秋天怎麼過？秋日 To Do List 等你分享！秋季全站徵文，我們準備了五個創作主題，參賽還有機會獲得「火烤兩用鍋」，一起來看看如何參加吧～

#天天秋嗨嗨 #秋季旅遊 #秋季穿搭

MimiVsJames的美股投資分享

2024/11/03

美國大選『終局之戰』（Endgame）即將展開，美股將迎來新世紀？（上篇：模型推導寶座花落誰家？）

美國總統大選只剩下三天，我們觀察一整週民調與金融市場的變化（包含賭局），到本週五下午3:00前為止，誰是美國總統幾乎大概可以猜到60-70%的機率，本篇文章就是以大選結局為主軸來討論近期甚至到未來四年美股可能的改變

#美股 #美國大選 #投資理財

Aniceee

2024/05/14

What is OCR? Discover the Advantages and Applications of OCR

OCR (Optical Character Recognition) technology revolutionizes the conversion of texts from physical documents into digital data, enhancing processing

Aniceee

2024/05/05

光學字元辨識（OCR）技術：提升數位轉型的關鍵利器

什麼是 OCR 光學字元辨識技術？它是當今數位時代中不可或缺的重要工具之一，能夠將紙本文件、圖片或 PDF 中的文字快速、準確地轉換成數位檔案，從而極大地提升了資料處理效率，成為各行各業數位轉型的關鍵利器。不僅如此，OCR 技術還能有效減少人為錯誤，幫助企業提升整體營運效率，從而在市場競爭中取得優勢

#OCR #科技