Spaces:

lterriel
/

kraken-htr-ocr-app

Sleeping

App Files Files Community

lterriel committed 12 days ago

Commit

7c68c4f

•

1 Parent(s): 5091111

Upload 21 files

Browse files

Files changed (22) hide show

.gitattributes +5 -0
app.py +255 -0
data/catmus/images/Les_glorieuses_conquestes_de_Louis_[...]Beaulieu_S/303/251bastien_bpt6k1090945b_13.jpeg +0 -0
data/catmus/images/Rhodiorum_historia_Caoursin_Guillaume_bpt6k10953875_13.jpeg +0 -0
data/catmus/images/Rhodiorum_historia_Caoursin_Guillaume_bpt6k10953875_35.jpeg +0 -0
data/catmus/models/catmus-tiny.mlmodel +3 -0
data/default/blla.mlmodel +3 -0
data/endp/images/FRAN_0393_00571.jpg +3 -0
data/endp/images/FRAN_0393_13559.jpg +3 -0
data/endp/images/FRAN_0393_14537.jpg +3 -0
data/endp/models/e-NDP-seg_V3.mlmodel +3 -0
data/endp/models/e-NDP_V7.mlmodel +3 -0
data/lectaurep/images/DAFANCH96_048MIC07692_L-1.jpg +0 -0
data/lectaurep/images/FRAN_0025_0080_L-0.jpg +3 -0
data/lectaurep/images/FRAN_0187_16406_L-0.jpg +3 -0
data/lectaurep/models/lectaurep_base.mlmodel +3 -0
lib/__init__.py +0 -0
lib/constants.py +52 -0
lib/display_utils.py +61 -0
lib/kraken_utils.py +30 -0
requirements.txt +4 -0
tmp/.keepfile +0 -0

.gitattributes CHANGED Viewed

@@ -33,3 +33,8 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text

 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+data/endp/images/FRAN_0393_00571.jpg filter=lfs diff=lfs merge=lfs -text
+data/endp/images/FRAN_0393_13559.jpg filter=lfs diff=lfs merge=lfs -text
+data/endp/images/FRAN_0393_14537.jpg filter=lfs diff=lfs merge=lfs -text
+data/lectaurep/images/FRAN_0025_0080_L-0.jpg filter=lfs diff=lfs merge=lfs -text
+data/lectaurep/images/FRAN_0187_16406_L-0.jpg filter=lfs diff=lfs merge=lfs -text

app.py ADDED Viewed

	@@ -0,0 +1,255 @@

+#! /usr/bin/env python3
+# -*- coding: utf-8 -*-
+"""Streamlit interface for OCR/HTR with Kraken"""
+import os
+import datetime
+import random
+import streamlit as st
+from lib.constants import CONFIG_METADATA
+from lib.display_utils import (display_baselines,
+                               display_baselines_with_text,
+                               prepare_segments,
+                               open_image)
+from lib.kraken_utils import (load_model_seg,
+                              load_model_rec,
+                              segment_image,
+                              recognize_text)
+# === PAGE CONFIGURATION ===
+st.set_page_config(layout="wide")
+# === I/O UTILS ===
+def get_real_path(path: str) -> str:
+    """Get absolute path of a file."""
+    return os.path.join(os.path.dirname(__file__), path)
+def load_random_example_image(folder_path: str):
+    """Load a random image from a folder."""
+    images = [os.path.join(folder_path, img) for img in os.listdir(folder_path) if img.endswith(('jpg', 'jpeg'))]
+    return random.choice(images) if images else None
+def write_temporary_model(file_path, custom_model_loaded):
+    """Write a temporary model to disk."""
+    with open(get_real_path(file_path), "wb") as file:
+        file.write(custom_model_loaded.getbuffer())
+def load_model_seg_cache(model_path):
+    """Load a segmentation model from ``model_path``.
+
+    Thin pass-through to ``load_model_seg`` (imported from
+    ``lib.kraken_utils``); this wrapper adds no caching of its own.
+    """
+    return load_model_seg(model_path)
+def load_model_rec_cache(model_path):
+    """Load a recognition model from ``model_path``.
+
+    Thin pass-through to ``load_model_rec`` (imported from
+    ``lib.kraken_utils``); this wrapper adds no caching of its own.
+    """
+    return load_model_rec(model_path)
+# Segmentation model bundled under data/default; load_models() hands it back
+# whenever it is called without a segmentation model path.
+MODEL_SEG_BLLA = load_model_seg_cache(get_real_path("data/default/blla.mlmodel"))
+def load_models(model_rec_in, model_seg_in=None):
+    """Generic bridge to load models.
+    """
+    if model_rec_in is not None:
+        try:
+            model_rec_out = load_model_rec_cache(model_rec_in)
+        except Exception as e:
+            st.error(f" ❌ Modèle de reconnaissance non chargé. Erreur : {e}")
+            return None, None
+    else:
+        st.error(" ❌ Modèle de reconnaissance non trouvé.")
+        return None, None
+    if model_seg_in is not None:
+        try:
+            model_seg_out = load_model_seg_cache(model_seg_in)
+        except Exception as e:
+            st.error(f" ❌ Modèle de segmentation non chargé. Erreur : {e}")
+            return None, None
+    else:
+        model_seg_out = MODEL_SEG_BLLA
+    return model_rec_out, model_seg_out
+# === MODELS EXAMPLES ===
+# The e-NDP pair goes through load_models(), which reports failures with
+# st.error and yields (None, None). The two other recognizers call
+# load_model_rec directly, so a load failure there propagates as an exception.
+endp_model_rec, endp_model_seg = load_models(model_rec_in=get_real_path("data/endp/models/e-NDP_V7.mlmodel"),
+                                             model_seg_in=get_real_path("data/endp/models/e-NDP-seg_V3.mlmodel"))
+lectaurep_model_rec = load_model_rec(get_real_path("data/lectaurep/models/lectaurep_base.mlmodel"))
+catmus_model_rec = load_model_rec(get_real_path("data/catmus/models/catmus-tiny.mlmodel"))
+# === MODELS EXAMPLES CONFIGURATION ===
+# One entry per example configuration:
+#   model_rec      -> recognition model loaded above
+#   model_seg      -> segmentation model, or None; the value is passed as-is to
+#                     segment_image() at prediction time
+#                     (NOTE(review): presumably Kraken then uses its own default
+#                     segmentation model - confirm against blla.segment)
+#   example_images -> folder from which a sample image is drawn
+DEFAULT_CONFIG = {
+    'endp': {
+        'model_rec': endp_model_rec,
+        'model_seg': endp_model_seg,
+        'example_images': get_real_path("data/endp/images")
+    },
+    'lectaurep': {
+        'model_rec': lectaurep_model_rec,
+        'model_seg': None,
+        'example_images': get_real_path("data/lectaurep/images")
+    },
+    'catmus':{
+        'model_rec': catmus_model_rec,
+        'model_seg': None,
+        'example_images': get_real_path("data/catmus/images")
+    }
+}
+# === USER INTERFACE ===
+# Page header: title, Kraken version badge, disclaimer and resource links.
+st.title("📜🦑 Reconnaissance de Texte (OCR/HTR) avec Kraken")
+st.markdown("[![https://img.shields.io/badge/Kraken_version-5.2.9-orange](https://img.shields.io/badge/Kraken_version-5.2.9-orange)](https://github.com/mittagessen/kraken)")
+st.markdown(
+    """
+    *⚠️ Cette application est à visée pédagogique ou à des fins de tests uniquement.
+    L'auteur se dégage de toutes responsabilités quant à son usage pour la production.*
+    """
+)
+st.markdown(
+    """
+    ##### 🔗 Ressources :
+    - 📂 Données de tests ou d'entraînement dans l'organisation [HTR United](https://htr-united.github.io/index.html)
+    - 📦 Modèles (mlmodel) à tester sur le groupe [OCR/HTR Zenodo](https://zenodo.org/communities/ocr_models/records?q=&l=list&p=1&s=10&sort=newest)
+    - 🛠 Évaluer vos prédictions avec l'application [KaMI (Kraken as Model Inspector)](https://huggingface.co/spaces/lterriel/kami-app)
+    """,
+    unsafe_allow_html=True
+)
+# Configuration choices
+st.sidebar.header("📁 Configuration HTR")
+st.sidebar.markdown('---')
+# Empty sidebar slots reserved here so they sit above the configuration radio;
+# they are filled further down (prediction button, status message, download).
+button_placeholder = st.sidebar.empty()
+success_loaded_models_msg_container = st.sidebar.empty()
+download_predictions_placeholder = st.sidebar.empty()
+st.sidebar.markdown('---')
+config_choice = st.sidebar.radio(
+    "Choisissez une configuration :", options=["Custom", "endp (exemple)", "lectaurep (exemple)", "catmus (exemple)"]
+)
+# Slots for the selected-configuration banner and its metadata.
+config_choice_placeholder = st.sidebar.empty()
+info_title_desc = st.sidebar.empty()
+place_metadata = st.sidebar.empty()
+# Translate the radio label into the key used by DEFAULT_CONFIG and
+# CONFIG_METADATA ("Custom" has no entry in either).
+map_config_choice = {
+    "Custom": "Custom",
+    "endp (exemple)": "endp",
+    "lectaurep (exemple)": "lectaurep",
+    "catmus (exemple)": "catmus"
+}
+config_choice = map_config_choice[config_choice]
+flag_rec_model = False
+flag_seg_model = False
+if config_choice != "Custom":
+    config = DEFAULT_CONFIG[config_choice]
+    config_choice_placeholder.success(f"Configuration sélectionnée : {CONFIG_METADATA[config_choice]['title']}")
+    place_metadata.markdown(CONFIG_METADATA[config_choice]['description'], unsafe_allow_html=True)
+    flag_rec_model = True
+else:
+    st.sidebar.warning("Configuration personnalisée")
+    custom_model_seg = st.sidebar.file_uploader(
+        "Modèle de segmentation (optionnel)", type=["mlmodel"]
+    )
+    custom_model_rec = st.sidebar.file_uploader(
+        "Modèle de reconnaissance", type=["mlmodel"]
+    )
+    if custom_model_rec:
+        write_temporary_model('tmp/model_rec_temp.mlmodel', custom_model_rec)
+        flag_rec_model = True
+    if custom_model_seg:
+        write_temporary_model('tmp/model_seg_temp.mlmodel', custom_model_seg)
+        flag_seg_model = True
+# Image choice
+flag_image = False
+image_source = st.radio("Source de l'image :", options=["Exemple", "Personnalisée"])
+info_example_image = st.empty()
+info_example_image_description = st.empty()
+upload_image_placeholder = st.empty()
+col1, col2, col3 = st.columns([1, 1, 1])
+image = None
+with col1:
+    st.markdown("## 🖼 Image Originale")
+    st.markdown("---")
+    if image_source == "Exemple":
+        if config_choice != "Custom":
+            example_image_path = load_random_example_image(config["example_images"])
+            if example_image_path:
+                image = open_image(example_image_path)
+                flag_image = True
+                info_example_image.info(f"Image d'exemple chargée : {os.path.basename(example_image_path)}")
+                info_title_desc.markdown(
+                    "<h4>Métadonnées de la configuration</h3>", unsafe_allow_html=True)
+                info_example_image_description.markdown(
+                    f"Source : {CONFIG_METADATA[config_choice]['examples_info'][os.path.basename(example_image_path)]}",
+                    unsafe_allow_html=True)
+            else:
+                info_example_image.error("Aucune image d'exemple trouvée.")
+        else:
+            info_example_image.error("Les images d'exemple ne sont pas disponibles pour la configuration personnalisée.")
+    else:
+        image_file = upload_image_placeholder.file_uploader("Téléchargez votre image :", type=["jpg", "jpeg"])
+        if image_file:
+            image = open_image(image_file)
+            flag_image = True
+        else:
+            info_example_image.warning("Veuillez télécharger une image.")
+    if flag_image:
+        st.image(image, use_container_width=True)
+# Display the results
+col4, col5, col6 = st.columns([1, 1, 1])
+if "image" in locals() and flag_rec_model and flag_image:
+    button_pred = button_placeholder.button('🚀Lancer la prédiction', key='but_pred')
+    if button_pred:
+        with st.spinner("⚙️ Chargement des nouveaux modèles..."):
+            if config_choice != "Custom":
+                model_rec, model_seg = DEFAULT_CONFIG[config_choice]['model_rec'], DEFAULT_CONFIG[config_choice]['model_seg']
+            else:
+                model_rec = load_model_rec_cache(get_real_path('tmp/model_rec_temp.mlmodel')) if flag_rec_model else None
+                model_seg = load_model_seg_cache(get_real_path('tmp/model_seg_temp.mlmodel')) if flag_seg_model else None
+            success_loaded_models_msg_container.success("✅️ Configuration OK!")
+        with col2:
+            st.markdown("## ✂️Segmentation")
+            st.markdown("---")
+            with st.spinner("⚙️ Segmentation en cours..."):
+                baseline_seg = segment_image(image, model_seg)
+                baselines, boundaries = prepare_segments(baseline_seg)
+            fig1, fig2 = display_baselines(image, baselines, boundaries)
+            st.pyplot(fig1)
+        with col3:
+            st.markdown("## ✍️ Texte")
+            st.markdown("---")
+            with st.spinner("⚙️ Reconnaissance en cours..."):
+                pred = recognize_text(model_rec, image, baseline_seg)
+                lines = [record.prediction.strip() for record in pred]
+                lines_with_idx = [f"{idx}: {line}" for idx, line in enumerate(lines)]
+            st.text_area(label='', value="\n".join(lines), height=570, label_visibility="collapsed")
+            date = datetime.datetime.now().strftime("%Y-%m-%d_%H-%M-%S")
+        with col4:
+            st.markdown("## ✂ Segmentation (Index)")
+            st.markdown("---")
+            st.pyplot(fig2)
+        with col5:
+            st.markdown("## ✏ Texte (Index)")
+            st.markdown("---")
+            st.text_area(label='', value="\n".join(lines_with_idx), height=570, label_visibility="collapsed")
+        with col6:
+            st.markdown("## 🔎 Texte (Image)")
+            st.markdown("---")
+            st.pyplot(display_baselines_with_text(image, baselines, lines))
+        download_predictions_placeholder.download_button(
+            "💾 Télécharger votre prédiction (txt)",
+            "\n".join(lines),
+            file_name=f"prediction_{date}.txt",
+        )

data/catmus/images/Les_glorieuses_conquestes_de_Louis_[...]Beaulieu_S/303/251bastien_bpt6k1090945b_13.jpeg ADDED Viewed

data/catmus/images/Rhodiorum_historia_Caoursin_Guillaume_bpt6k10953875_13.jpeg ADDED Viewed

data/catmus/images/Rhodiorum_historia_Caoursin_Guillaume_bpt6k10953875_35.jpeg ADDED Viewed

data/catmus/models/catmus-tiny.mlmodel ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ef14f71c787543f46ded86fbb55b9739b314c04847820fef1a454b9665309002
+size 1183001

data/default/blla.mlmodel ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:77a638a83c9e535620827a09e410ed36391e9e8e8126d5796a0f15b978186056
+size 5047020

data/endp/images/FRAN_0393_00571.jpg ADDED Viewed

Git LFS Details

SHA256: 8c1a6ab81b3cfb458a292054cf7b361451e311a2fe8c8bf27c9030e048b05036
Pointer size: 132 Bytes
Size of remote file: 1.14 MB

data/endp/images/FRAN_0393_13559.jpg ADDED Viewed

Git LFS Details

SHA256: d791450e81c305e197833fafafb38b6bf1252c766e93a0c932fe1752771bbf96
Pointer size: 132 Bytes
Size of remote file: 1.07 MB

data/endp/images/FRAN_0393_14537.jpg ADDED Viewed

Git LFS Details

SHA256: 0975d01366d4c90b4a52fdc1d8c39f9d6ebf665c54612212ec4e4cc11c6b763a
Pointer size: 132 Bytes
Size of remote file: 1.01 MB

data/endp/models/e-NDP-seg_V3.mlmodel ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:35c942713fc252cc8851541ad870e3611335a222df45b97f42a8b65cf7081405
+size 5049049

data/endp/models/e-NDP_V7.mlmodel ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3ade5ee65254d1366e34efd25d9cf159b4e15c6938a8ce3f193403b7081f4cd1
+size 23658117

data/lectaurep/images/DAFANCH96_048MIC07692_L-1.jpg ADDED Viewed

data/lectaurep/images/FRAN_0025_0080_L-0.jpg ADDED Viewed

Git LFS Details

SHA256: 68756e4fb30a129549c3f02d0aeb94d8c9eca13d827237eb2aab72dd923e5575
Pointer size: 132 Bytes
Size of remote file: 2.29 MB

data/lectaurep/images/FRAN_0187_16406_L-0.jpg ADDED Viewed

Git LFS Details

SHA256: 5a06ca83aaaf41435713b53cef2193294c1d1fc9d5bd517feb8729e67be2d1c2
Pointer size: 133 Bytes
Size of remote file: 12.6 MB

data/lectaurep/models/lectaurep_base.mlmodel ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7d7f4217482fbaef8eb6faab18644bdb708d3a5d18391699dec4f9e559086f88
+size 16120811

lib/__init__.py ADDED Viewed

File without changes

lib/constants.py ADDED Viewed

	@@ -0,0 +1,52 @@

+CONFIG_METADATA = {
+    "endp": {
+        "title": "e-NDP project [exemple configuration]",
+        "description": """
+        <div style="text-align: justify;">
+            <p>The e-NDP project: collaborative digital edition of the Chapter registers of Notre-Dame of Paris (1326-1504) </p>
+            <p>Project information: <a href='https://endp.hypotheses.org/' target='blank'>here</a>.</p>
+            <p>Model & Dataset description:</p>
+            <ul>
+                <li><pre>Claustre, J., Smith, D., Torres Aguilar, S., Bretthauer, I., Brochard, P., Canteaut, O., Cottereau, E., Delivré, F., Denglos, M., Jolivet, V., Julerot, V., Kouamé, T., Lusset, E., Massoni, A., Nadiras, S., Perreaux, N., Regazzi, H., & Treglia, M. (2023). The e-NDP project : collaborative digital edition of the Chapter registers of Notre-Dame of Paris (1326-1504). Ground-truth for handwriting text recognition (HTR) on late medieval manuscripts. (1.0, p. https://zenodo.org/record/7575693) [Data set]. Zenodo. <a href='https://doi.org/10.5281/zenodo.7575693' target='blank'>https://doi.org/10.5281/zenodo.7575693</a><pre></li>
+                <li>Models: <a href="https://github.com/chartes/e-NDP_HTR/releases/tag/V7.1">https://github.com/chartes/e-NDP_HTR/releases/tag/V7.1</a></li>
+            </ul>
+        </div>
+        """,
+        "examples_info": {
+            "FRAN_0393_00571.jpg":"Archives nationales, LL109A , p. 43, février 1400. <a href='https://nakala.fr/10.34847/nkl.bced06qw#7ad1dde915d5ed70d2dd3fb3f8dffebf551b313c'>Nakala</a>",
+            "FRAN_0393_13559.jpg":"Archives nationales, LL120, p. 555, décembre 1463. <a href='https://nakala.fr/10.34847/nkl.205cj7td#2e5831e14350511c42b938c0274246aa858c8fec'>Nakala</a>",
+            "FRAN_0393_14537.jpg":"Archives nationales, LL127, p. 625, février 1504. <a href='https://nakala.fr/10.34847/nkl.7a9e99jb#fbadd2c18fa17df2ea56c98c8af0a4452aef2fa8'>Nakala</a>"
+        }
+    },
+    "lectaurep": {
+        "title": "LECTAUREP project [exemple configuration]",
+        "description": """
+        <div style="text-align: justify;">
+            <p>LECTAUREP Contemporary French Model (Administration)</p>
+            <p>Project information: <a href='https://lectaurep.hypotheses.org/'>here</a>.</p>
+            <p>Model & Dataset description: <pre>Chagué, A. (2022). LECTAUREP Contemporary French Model (Administration) (1.0.0). Zenodo. <a href='https://zenodo.org/records/6542744'>https://zenodo.org/records/6542744</a></pre></p>
+        </div>
+        """,
+        "examples_info": {
+            "DAFANCH96_048MIC07692_L-1.jpg": "Archives nationales, Répertoire de notaires (19e-20e)",
+            "FRAN_0025_0080_L-0.jpg": "Archives nationales, Répertoire de notaires (19e-20e)",
+            "FRAN_0187_16406_L-0.jpg": "Archives nationales, Répertoire de notaires (19e-20e)"
+        }
+    },
+    "catmus": {
+        "title": "CATMuS-Print [exemple configuration]",
+        "description": """
+        <div style="text-align: justify;">
+            <p>CATMuS-Print (Tiny) - Diachronic model for French prints and other West European languages</p>
+            <p>CATMuS (Consistent Approach to Transcribing ManuScript) Print is a Kraken HTR model trained on data produced by several projects, dealing with different languages (French, Spanish, German, English, Corsican, Catalan, Latin, Italian…) and different centuries (from the first prints of the 16th c. to digital documents of the 21st century).</p>
+            <p>Model & Dataset description: <pre>Gabay, S., & Clérice, T. (2024). CATMuS-Print [Tiny] (31-01-2024). Zenodo. <a href='https://doi.org/10.5281/zenodo.10602357' target='blank'>https://doi.org/10.5281/zenodo.10602357</a></pre></p>
+        </div>
+        """,
+        "examples_info": {
+            "Rhodiorum_historia_Caoursin_Guillaume_bpt6k10953875_35.jpeg": "Caoursin, Guillaume, Rhodiorum historia (1496),  BnF, <a href='https://gallica.bnf.fr/ark:/12148/bpt6k10953875' target='blank'>Gallica</a>",
+            "Rhodiorum_historia_Caoursin_Guillaume_bpt6k10953875_13.jpeg": "Caoursin, Guillaume, Rhodiorum historia (1496),  BnF, <a href='https://gallica.bnf.fr/ark:/12148/bpt6k10953875/f13.item' target='blank'>Gallica</a>",
+            "Les_glorieuses_conquestes_de_Louis_[...]Beaulieu_Sébastien_bpt6k1090945b_13.jpeg":"Beaulieu, Sébastien de, Les glorieuses conquestes de Louis le Grand, roy de France et de Navarre [Grand Beaulieu]. Tome 2 (16.), BnF, <a href='https://gallica.bnf.fr/ark:/12148/bpt6k10953875' target='blank'>Gallica</a>"
+        }
+    }
+}

lib/display_utils.py ADDED Viewed

	@@ -0,0 +1,61 @@

+# -*- coding: utf-8 -*-
+"""Utils for display input and output"""
+import matplotlib.pyplot as plt
+from PIL import Image
+def open_image(image_path: str) -> Image.Image:
+    """Open an image with ``PIL.Image.open`` and return the resulting image.
+
+    ``image_path`` is forwarded unchanged to ``Image.open``.
+    NOTE(review): the app also passes the object returned by Streamlit's file
+    uploader here, so the ``str`` annotation looks narrower than actual usage.
+    """
+    return Image.open(image_path)
+def display_baselines(image, baselines, boundaries=None):
+    """Display baselines and boundaries on an image."""
+    fig, ax = plt.subplots(figsize=(10, 10))
+    ax.imshow(image, cmap='gray')
+    ax.axis('off')
+    for idx, baseline in enumerate(baselines):
+        baseline_x = [point[0] for point in baseline]
+        baseline_y = [point[1] for point in baseline]
+        ax.plot(baseline_x, baseline_y, color='blue', linewidth=0.7)
+    if boundaries:
+        for boundary in boundaries:
+            boundary_x = [point[0] for point in boundary]
+            boundary_y = [point[1] for point in boundary]
+            ax.plot(boundary_x, boundary_y, color='red', linestyle='--', linewidth=1)
+    fig_special, ax_special = plt.subplots(figsize=(10, 10))
+    ax_special.set_xlim(0, image.size[0])
+    ax_special.set_ylim(0, image.size[1])
+    ax_special.invert_yaxis()
+    for idx, baseline in enumerate(baselines):
+        baseline_x = [point[0] for point in baseline]
+        baseline_y = [point[1] for point in baseline]
+        ax_special.plot(baseline_x, baseline_y, color='blue', linewidth=0.7)
+        ax_special.text(baseline_x[0], baseline_y[0], str(idx), fontsize=10, color='red')
+    return fig, fig_special
+def display_baselines_with_text(image, baselines, lines):
+    """Display baselines with text on an image."""
+    fig_special, ax_special = plt.subplots(figsize=(10, 10))
+    ax_special.set_xlim(0, image.size[0])
+    ax_special.set_ylim(0, image.size[1])
+    ax_special.invert_yaxis()
+    for idx, group in enumerate(zip(lines, baselines)):
+        baseline_x = [point[0] for point in group[1]]
+        baseline_y = [point[1] for point in group[1]]
+        ax_special.text(baseline_x[0], baseline_y[0], f"{str(idx)}: {group[0]}", fontsize=5.5, color='black')
+    ax_special.axis('off')
+    return fig_special
+def prepare_segments(seg_obj):
+    """Prepare baselines and boundaries for display."""
+    baselines = []
+    boundaries = []
+    for line in seg_obj.lines:
+        baselines.append(line.baseline)
+        boundaries.append(line.boundary)
+    return baselines, boundaries

lib/kraken_utils.py ADDED Viewed

	@@ -0,0 +1,30 @@

+# -*- coding: utf-8 -*-
+"""Kraken utils for OCR/HTR engine"""
+import streamlit as st
+from kraken.lib import (vgsl,
+                        models)
+from kraken import (blla,
+                    rpred)
+from PIL import Image
+@st.cache_data(show_spinner=False)
+def load_model_seg(model_path: str) -> vgsl.TorchVGSLModel:
+    """Load a segmentation model"""
+    return vgsl.TorchVGSLModel.load_model(model_path)
+@st.cache_data(show_spinner=False)
+def load_model_rec(model_path: str):
+    """Load a recognition model"""
+    return models.load_any(model_path)
+def segment_image(image: Image.Image, model_seg: vgsl.TorchVGSLModel):
+    """Segment an image.
+
+    Forwards ``image`` to ``blla.segment`` with ``model_seg`` as its ``model``
+    argument and returns the result unchanged.
+    NOTE(review): the app may pass ``None`` as ``model_seg``; presumably
+    Kraken then falls back to its default model - confirm.
+    """
+    return blla.segment(image, model=model_seg)
+def recognize_text(model, image: Image.Image, baseline_seg):
+    """Recognize text in an image.
+
+    Calls ``rpred.rpred`` with ``model`` as the network, ``image`` as the
+    input and ``baseline_seg`` as the bounds, using a padding of 16 and
+    bidirectional reordering enabled, and returns its result as-is.
+    The caller iterates over the result and reads ``.prediction`` on each item.
+    """
+    return rpred.rpred(network=model, im=image, bounds=baseline_seg, pad=16, bidi_reordering=True)

requirements.txt ADDED Viewed

	@@ -0,0 +1,4 @@

+kraken==5.2.9
+matplotlib==3.9.2
+Pillow==11.0.0
+streamlit==1.40.1

tmp/.keepfile ADDED Viewed

File without changes