Spaces:

Shabdobhedi
/

Ocr-Using-Easy-Ocr

Sleeping

Shabdobhedi committed on Sep 30, 2024

Commit

0c75190

verified ·

1 Parent(s): 17bce12

Upload 3 Files

Files changed (3) hide show

new.py ADDED Viewed

+import streamlit as st
+from PIL import Image
+from ocr_utils import extract_text
+import numpy as np
+# Streamlit application title
+st.title("OCR and Keyword Search Application")
+st.write("Upload an image containing Hindi and English text to extract and search within the text.")
+# File uploader for image
+uploaded_file = st.file_uploader("Upload Image", type=["jpg", "jpeg", "png"])
+if uploaded_file is not None:
+    # Open the uploaded image using PIL
+    image = Image.open(uploaded_file)
+    st.image(image, caption='Uploaded Image', use_column_width=True)
+    # Convert the image to a NumPy array
+    image_np = np.array(image)
+    # Perform OCR on the uploaded image using the utility function
+    full_text = extract_text(image_np)
+    # Display the extracted text
+    st.subheader("Extracted Text")
+    st.write(full_text)
+    # Text input for keyword search
+    keyword = st.text_input("Enter Keyword to Search")
+# Highlight the keyword in the extracted text
+    if keyword:
+        highlighted_text = full_text.replace(
+            keyword, f"<mark style='background-color: yellow; color: black;'>{keyword}</mark>")
+        st.subheader("Highlighted Search Results")
+        st.markdown(highlighted_text, unsafe_allow_html=True)
+    else:
+        st.subheader("Highlighted Search Results")
+        st.write("No keyword entered for highlighting.")

ocr_utils.py ADDED Viewed

+# ocr_utils.py
+import easyocr
+import numpy as np
+# Module-level EasyOCR reader configured for Hindi ('hi') and English ('en').
+# It is built once, when this module is imported, and reused by every
+# extract_text() call instead of being re-created per image.
+reader = easyocr.Reader(['hi', 'en'])
+def extract_text(image_np):
+    """
+    Extract text from a NumPy array image using EasyOCR.
+    Parameters:
+    - image_np: NumPy array representation of the image.
+    Returns:
+    - full_text: Extracted text as a single string.
+    """
+    extracted_text = reader.readtext(image_np, detail=0)
+    full_text = " ".join(extracted_text)
+    return full_text

requirements.txt ADDED Viewed

+easyocr
+streamlit
+Pillow
+numpy