Spaces:

UniquePratham
/

DualTextOCRFusion

Sleeping

UniquePratham committed on Sep 27, 2024

Commit

aba3166

verified ·

1 Parent(s): afedbd6

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,3 +1,5 @@
 import streamlit as st
 from ocr_cpu import extract_text_got, clean_text_with_ai  # Import OCR and AI cleaning functions
 import json
@@ -45,20 +47,25 @@ if uploaded_file is not None:
             extracted_text = extract_text_got(uploaded_file)  # Use GOT OCR to extract text
             if not extracted_text.strip():
                 st.warning("No text extracted from the image.")
             else:
                 # Clean the extracted text using AI
-                cleaned_text = clean_text_with_ai(extracted_text)
-                st.success("Text extraction and cleaning successful.")
         except Exception as e:
             st.error(f"Error during text extraction: {str(e)}")
             extracted_text = cleaned_text = ""
     # Display cleaned text
-    st.subheader("Cleaned Extracted Text")
-    st.text_area("Cleaned Text", cleaned_text, height=250)
-    # Save cleaned text for search
-    if cleaned_text:
         with open("extracted_text.json", "w") as json_file:
             json.dump({"text": cleaned_text}, json_file)

+# app.py
 import streamlit as st
 from ocr_cpu import extract_text_got, clean_text_with_ai  # Import OCR and AI cleaning functions
 import json
             extracted_text = extract_text_got(uploaded_file)  # Use GOT OCR to extract text
             if not extracted_text.strip():
                 st.warning("No text extracted from the image.")
+                cleaned_text = ""
             else:
                 # Clean the extracted text using AI
+                with st.spinner("Cleaning the extracted text using AI..."):
+                    cleaned_text = clean_text_with_ai(extracted_text)
+                    if cleaned_text.startswith("Error"):
+                        st.error(cleaned_text)
+                    else:
+                        st.success("Text extraction and cleaning successful.")
         except Exception as e:
             st.error(f"Error during text extraction: {str(e)}")
             extracted_text = cleaned_text = ""
     # Display cleaned text
+    if cleaned_text and not cleaned_text.startswith("Error"):
+        st.subheader("Cleaned Extracted Text")
+        st.text_area("Cleaned Text", cleaned_text, height=250)
+        # Save cleaned text for search
         with open("extracted_text.json", "w") as json_file:
             json.dump({"text": cleaned_text}, json_file)