How to extract characters from the image using Google's Tesseract and print them on the streamlit application?

djidji · September 26, 2021, 4:16am

Hi,

I want to extract characters from an image using Google’s Tesseract and display them in a Streamlit application.
What are the steps to do that?
Thank you for your help.

kareemrasheed89 · March 14, 2022, 4:17am

I am looking for a way as well. I hope we get a solution soon, even if it is a component.

Franky1 · March 14, 2022, 2:12pm

andfanilo · March 14, 2022, 2:12pm

I think I did something similar a long time ago to apply OCR to a twitter image.

I found the following code snippet, which I created a long time ago and which hopefully still works (I haven’t tested it in months). I hope you can extract the parts that interest you.

# on unix machine or docker Ubuntu container 
# apt-get install tesseract-ocr imagemagick libtesseract-dev  (should be included with most languages)
# tesseract --version
# tesseract --list-langs
# pip install pytesseract pillow
# pip install tensorflow
# pip install --upgrade tensorflow-hub
# pip3 install torch==1.10.0+cpu torchvision==0.11.1+cpu torchaudio==0.10.0+cpu -f https://download.pytorch.org/whl/cpu/torch_stable.html
# pip install keras-ocr easyocr
import cv2
import easyocr
import keras_ocr
import matplotlib.pyplot as plt
import numpy as np
import pytesseract as tess
import requests
import streamlit as st


def main():
    """Render the OCR comparison page.

    Asks for a picture URL, offers one sidebar checkbox per OCR engine and
    then runs every ticked engine on that picture, in the order the
    checkboxes are listed.
    """
    st.title("Testing OCR libraries on code snippets")

    default_url = "https://pbs.twimg.com/media/FCIX6IUWQAgpiPT?format=jpg&name=large"
    picture_url = st.text_input("Enter Tweet picture ID", value=default_url)
    if not picture_url:
        # Nothing to analyse yet: show a hint and halt this script run.
        st.info("Please enter an ID")
        st.stop()

    # (checkbox label, function to call when the box is ticked)
    engines = (
        ("Compute tesseract", compute_tesseract),
        ("Compute keras-ocr", compute_keras),
        ("Compute easyocr", compute_easyocr),
    )

    st.sidebar.header("Configuration")
    # Create all checkboxes first so the sidebar is complete before any
    # (potentially slow) OCR engine starts running.
    ticked = [st.sidebar.checkbox(label) for label, _ in engines]

    for is_ticked, (_, run_engine) in zip(ticked, engines):
        if is_ticked:
            run_engine(picture_url)


def compute_tesseract(picture_url: str):
    """Run Tesseract OCR on several preprocessed variants of a remote picture.

    The picture is downloaded and decoded with OpenCV, then converted into
    RGB, Otsu-binarised and inverted versions. Every variant (plus the raw
    BGR decode) is sent through Tesseract and displayed next to the text
    that was extracted from it.

    References:
        https://www.opcito.com/blogs/extracting-text-from-images-with-tesseract-ocr-opencv-and-python
        https://tesseract-ocr.github.io/tessdoc/ImproveQuality.html

    Args:
        picture_url: URL of the picture to analyse.

    Returns:
        None. Results, or an error message when the picture cannot be
        downloaded or decoded, are written to the Streamlit page.
    """
    try:
        # A plain (non-streamed) request releases the connection on its own;
        # the timeout keeps the app from hanging on an unresponsive host.
        response = requests.get(picture_url, timeout=30)
        response.raise_for_status()
    except requests.RequestException as err:
        st.error(f"Could not download the picture: {err}")
        return

    raw_image_data = np.frombuffer(response.content, dtype=np.uint8)
    # imdecode expects an imread flag, not a colour-conversion code.
    # IMREAD_COLOR guarantees the 3-channel BGR array that the cvtColor
    # calls below require, even for grayscale source files.
    image = (
        cv2.imdecode(raw_image_data, cv2.IMREAD_COLOR)
        if raw_image_data.size
        else None
    )
    if image is None:
        st.error("The downloaded data could not be decoded as an image.")
        return

    rgb_image = cv2.cvtColor(image, cv2.COLOR_BGR2RGB)
    gray_image = cv2.cvtColor(image, cv2.COLOR_BGR2GRAY)
    # With THRESH_OTSU the threshold value (0 here) is ignored and computed
    # from the image histogram; [1] selects the thresholded image.
    threshold_img = cv2.threshold(
        gray_image, 0, 255, cv2.THRESH_BINARY | cv2.THRESH_OTSU
    )[1]
    inverted_img = cv2.bitwise_not(threshold_img)

    def _compute_ocr(label, img):
        """OCR a single image variant and show it beside its text."""
        # Engine Mode (--oem)
        # OCR engine mode 	Working description
        # 0 	Legacy engine only
        # 1 	Neural net LSTM only
        # 2 	Legacy + LSTM mode only
        # 3 	By Default, based on what is currently available
        custom_oem_psm_config = r"--oem 3 --psm 6"
        text = tess.image_to_string(img, config=custom_oem_psm_config)
        st.subheader(label)
        c1, c2 = st.columns((1, 2))
        c1.image(img)
        c2.code(text)

    # The first variant is passed as-is, in OpenCV's BGR channel order.
    _compute_ocr("BGR image", image)
    _compute_ocr("RGB image", rgb_image)
    _compute_ocr("Binary image", threshold_img)
    _compute_ocr("Inverted image", inverted_img)


def compute_keras(picture_url):
    """Detect and recognise text with keras-ocr and plot the annotations.

    Keras-ocr
    Keras CRNN (text recognizer https://github.com/janzd/CRNN)
    CRAFT (text detector https://github.com/clovaai/CRAFT-pytorch)

    Args:
        picture_url: Location of the picture, passed to
            ``keras_ocr.tools.read``.

    Returns:
        None. The annotated picture is rendered on the Streamlit page.
    """
    pipeline = keras_ocr.pipeline.Pipeline()

    # The pipeline works on batches, so wrap the single picture in a list.
    images = [keras_ocr.tools.read(picture_url)]
    prediction_groups = pipeline.recognize(images)

    fig, ax = plt.subplots(figsize=(20, 20))
    try:
        keras_ocr.tools.drawAnnotations(
            image=images[0], predictions=prediction_groups[0], ax=ax
        )
        st.pyplot(fig)
    finally:
        # Figures created through pyplot stay registered until closed;
        # without this every Streamlit rerun would leak one 20x20 figure.
        plt.close(fig)


def compute_easyocr(picture_url: str):
    """Run EasyOCR on an inverted, Otsu-binarised version of a remote picture.

    Args:
        picture_url: URL of the picture to analyse.

    Returns:
        None. The preprocessed picture and the recognised text, or an error
        message when the picture cannot be downloaded or decoded, are
        written to the Streamlit page.
    """
    try:
        # A plain (non-streamed) request releases the connection on its own;
        # the timeout keeps the app from hanging on an unresponsive host.
        response = requests.get(picture_url, timeout=30)
        response.raise_for_status()
    except requests.RequestException as err:
        st.error(f"Could not download the picture: {err}")
        return

    raw_image_data = np.frombuffer(response.content, dtype=np.uint8)
    # imdecode expects an imread flag, not a colour-conversion code.
    # IMREAD_COLOR guarantees the 3-channel BGR array that cvtColor needs.
    image = (
        cv2.imdecode(raw_image_data, cv2.IMREAD_COLOR)
        if raw_image_data.size
        else None
    )
    if image is None:
        st.error("The downloaded data could not be decoded as an image.")
        return

    gray_image = cv2.cvtColor(image, cv2.COLOR_BGR2GRAY)
    # With THRESH_OTSU the threshold value (0 here) is ignored and computed
    # from the image histogram; [1] selects the thresholded image.
    threshold_img = cv2.threshold(
        gray_image, 0, 255, cv2.THRESH_BINARY | cv2.THRESH_OTSU
    )[1]
    inverted_img = cv2.bitwise_not(threshold_img)

    reader = easyocr.Reader(["en"], gpu=False)
    # detail=0 asks EasyOCR for the recognised strings only.
    resp = reader.readtext(inverted_img, detail=0, paragraph=False)

    st.subheader("EasyOCR")
    c1, c2 = st.columns((1, 2))
    c1.image(inverted_img)
    c2.write(resp)

# Build the page only when this file is executed as a script,
# not when it is imported as a module.
if __name__ == "__main__":
    main()

Happy Streamlitin’
Fanilo

system · March 14, 2023, 2:13pm

This topic was automatically closed 365 days after the last reply. New replies are no longer allowed.

Topic		Replies	Views
Text-extraction-app Show the Community! nlp , computer-vision	11	5578	June 7, 2021
Tesseract OCR Stopped Working [May 2024] Using Streamlit tesseract , debugging	4	548	November 25, 2024
Character Recognition with Pytesseract Show the Community!	0	1775	September 11, 2021
Tesseract is not installed or it's not in my PATH Community Cloud tesseract	3	8798	December 30, 2022
Text Extraction Application Show the Community! nlp , computer-vision	1	1006	January 26, 2023

How to extract characters from the image using Google's Tesseract and print them on the streamlit application?

Related topics