# EasyOCR

# vntocr_easyocr.py
# Intégration de VNTranslator OCR avec le moteur EasyOCR
# Version : 1.0
# Auteur : Fazx - GarudaMods | https://www.patreon.com/vntranslator

"""
# ==================================================================
# EasyOCR : https://github.com/JaidedAI/EasyOCR
# Requis : python 3.10+ et PyTorch
# Installer avec : pip install easyocr
# ==================================================================
# Exécutez ce script avec : python vntocr_easyocr.py
# Dans VNTranslator utilisez le moteur personnalisé - HTTP POST avec la configuration :
# -- URL : http://127.0.0.1:5353
# -- Type de contenu : application/json
# -- En-têtes : {}
# -- Corps : {"image":"$IMAGE_BASE64", "langs": ["ja"]}
# -- Type de réponse : JSON
# -- Requête de réponse : fullText
# ==================================================================
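# Langues (codes EasyOCR, le plus souvent des codes ISO à deux lettres ; certains diffèrent, ex. chinois simplifié = ch_sim)
# -- Liste EasyOCR : https://www.jaided.ai/easyocr/
# -- Codes ISO : https://en.wikipedia.org/wiki/List_of_ISO_639_language_codes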
# -- Japonais = ja
# -- Anglais = en
# ==================================================================
"""

from flask import Flask, request, jsonify
from PIL import Image
from io import BytesIO
import base64
import re
import json
import numpy as np
import easyocr

# Server settings handed to app.run() in the __main__ guard.
# Interface the server binds to.
APP_HOST = "localhost"
# TCP port the server listens on; matches the URL given in the usage notes.
APP_PORT = 5353
# Passed as Flask's debug flag.
# NOTE(review): Flask debug mode turns on the auto-reloader and the
# interactive debugger; confirm this is intended outside local use.
APP_DEBUG = True

def parse_ocr_result(easyocr_result):
    """Turn raw OCR detections into a JSON-serializable summary.

    Each entry of ``easyocr_result`` is read positionally as
    ``(polygon, text, confidence)``, where ``polygon`` is a sequence of
    ``(x, y)`` points.

    Returns:
        dict: ``{"fullText": str, "lines": list[dict]}``. ``fullText`` is
        every detected text joined by single spaces with outer whitespace
        stripped. Each item of ``lines`` holds the ``text``, the
        axis-aligned bounding box of the polygon (``x``, ``y``, ``w``,
        ``h`` as ints) and the ``confidence`` as a float.
    """

    def describe(detection):
        # Collapse the polygon into its axis-aligned bounding box.
        corners = detection[0]
        xs = [corner[0] for corner in corners]
        ys = [corner[1] for corner in corners]
        left, top = int(min(xs)), int(min(ys))
        right, bottom = int(max(xs)), int(max(ys))
        return {
            "text": detection[1],
            "w": right - left,
            "h": bottom - top,
            "x": left,
            "y": top,
            "confidence": float(detection[2]),
        }

    described = [describe(detection) for detection in easyocr_result]
    joined = " ".join(item["text"] for item in described)
    return {"fullText": joined.strip(), "lines": described}

def base64_to_numpy(base64_string):
    """Decode a Base64-encoded image into a NumPy array.

    Accepts raw Base64 or a data URI (``data:image/png;base64,...``); when
    a comma is present, only the segment after the first comma is decoded.

    Images whose Pillow mode is not ``L``, ``RGB`` or ``RGBA`` (palette,
    bilevel, CMYK, ...) are converted to ``RGB`` before the array is built,
    so the array always holds real pixel values rather than, for example,
    palette indices.

    Args:
        base64_string: The Base64 text (optionally a data URI).

    Returns:
        numpy.ndarray: The decoded image pixels.

    Raises:
        ValueError: If the input is empty or missing, or if decoding or
            opening the image fails (the original error is chained as
            ``__cause__``).
    """
    if not base64_string:
        raise ValueError("La chaîne Base64 est vide ou manquante")

    # Drop a "data:<mime>;base64," prefix if the caller sent a data URI.
    if "," in base64_string:
        base64_string = base64_string.split(",")[1]

    try:
        image_decode = base64.b64decode(base64_string)
        print("Décodage Base64 réussi")

        # Open the image with PIL.
        image = Image.open(BytesIO(image_decode))
        print(f"Format de l'image : {image.format}, taille : {image.size}")

        # np.array() on a palette image yields palette indices, and other
        # exotic modes yield layouts that are not plain gray/RGB(A) pixels;
        # normalise those to RGB first. Done after the log line above
        # because convert() returns an image whose .format is None.
        if image.mode not in ("L", "RGB", "RGBA"):
            image = image.convert("RGB")

        # Convert the PIL image to a NumPy array.
        image_np = np.array(image)
        print(f"Image convertie en tableau NumPy avec la forme : {image_np.shape}")

        return image_np
    except Exception as e:
        # Chain the cause so the underlying failure stays in the traceback.
        raise ValueError(f"Échec du décodage de l'image : {e}") from e

############################################################

# Flask application object; the OCR route below is registered on it.
app = Flask(__name__)
# Languages the current `reader` was built for; the endpoint compares each
# request's "langs" against this to decide whether to build a new reader.
default_langs = ["ja"]
# Shared EasyOCR reader, constructed once when the module is loaded and
# replaced by the endpoint when a request asks for different languages.
reader = easyocr.Reader(default_langs)

@app.route("/", methods=["POST"])
def ocr_endpoint():
    """Run OCR on a Base64 image posted as JSON and return the result.

    Request body (JSON object):
        image: Base64 image data, raw or as a data URI (required).
        langs: List of EasyOCR language codes (default ``["ja"]``). When it
            differs from the languages of the current module-level reader,
            a new reader is built and kept for later requests.
        draw_bounding_box: Optional flag, echoed back unchanged in the
            response (default ``False``).

    Returns:
        On success, the dict from ``parse_ocr_result`` plus
        ``draw_bounding_box``, serialized as UTF-8 JSON with status 200.
        On a client error (not JSON, body not a JSON object, missing or
        undecodable image, reader could not be built) a JSON
        ``{"error": ...}`` with status 400. Any other failure yields a JSON
        ``{"error": ...}`` with status 500.
    """
    global default_langs, reader

    try:
        print("\n\n=== Requête OCR ===")
        print(f"Méthode : {request.method}")
        print(f"En-têtes : {dict(request.headers)}")

        if not request.is_json:
            print("La requête n'est pas au format JSON")
            return jsonify({"error": "La requête doit être au format JSON"}), 400

        # silent=True makes a malformed body come back as None instead of
        # raising, so it is reported as a client error (400) rather than
        # falling through to the generic 500 handler. Non-object JSON
        # (list, string, null, ...) is rejected the same way because the
        # code below needs key lookups.
        data = request.get_json(silent=True)
        if not isinstance(data, dict):
            print("Le corps de la requête n'est pas un objet JSON valide")
            return jsonify({"error": "Le corps de la requête doit être un objet JSON valide"}), 400

        # Log the payload keys (not the values: the image is large).
        print(f"Clés JSON de la requête : {list(data.keys())}")

        # Check that an image was supplied.
        if "image" not in data:
            print("Aucune donnée d'image")
            return jsonify({"error": "Aucune donnée d'image"}), 400

        # Decode the Base64 image.
        try:
            image = base64_to_numpy(data["image"])
        except Exception as e:
            print(f"Échec du décodage de l'image : {e}")
            return jsonify({"error": f"Échec du décodage de l'image : {str(e)}"}), 400

        # Switch reader if the requested languages changed.
        langs = data.get("langs", ["ja"])
        try:
            if langs != default_langs:
                # Build the new reader BEFORE updating the shared state: if
                # construction fails, default_langs must keep describing
                # the reader that is actually loaded. Otherwise a repeated
                # request with the same bad languages would skip this
                # branch and silently run OCR with the old reader.
                new_reader = easyocr.Reader(langs)
                reader = new_reader
                default_langs = langs
        except Exception as e:
            print(f"Échec du chargement du modèle : {e}")
            return jsonify({"error": f"Échec du chargement du modèle : {str(e)}"}), 400
        print(f"langs : {langs}")

        # Read the bounding-box flag; it is only echoed back to the client.
        draw_bounding_box = data.get("draw_bounding_box", False)
        print(f"draw_bounding_box : {draw_bounding_box}")

        # Run OCR.
        # https://github.com/JaidedAI/EasyOCR?tab=readme-ov-file#usage
        result = reader.readtext(image)
        print(f"OCR terminé avec succès : {result}")

        # Shape the result for the client.
        parsed_result = parse_ocr_result(result)
        parsed_result["draw_bounding_box"] = draw_bounding_box
        # json.dumps (not jsonify) keeps non-ASCII text unescaped.
        json_result = json.dumps(parsed_result, indent=4, ensure_ascii=False)
        # A bare string would be served as text/html; declare it as JSON.
        return json_result, 200, {"Content-Type": "application/json; charset=utf-8"}

    except Exception as e:
        print(f"Erreur de la requête : {e}")
        return jsonify({"error": str(e)}), 500

if __name__ == "__main__":
    # Script entry point: announce the bind address, then start Flask's
    # built-in server with the settings defined at the top of the file.
    banner = f"=== Démarrage du serveur OCR {APP_HOST} sur le port {APP_PORT} ==="
    print(banner)
    app.run(host=APP_HOST, port=APP_PORT, debug=APP_DEBUG)
# Précédent : Kit de serveur OCR | Suivant : SuryaOCR