ocr-orderid3

Sleeping

App Files Files Community

ethanrom committed on Apr 2, 2023

Commit

7d30f01

0 Parent(s):

Duplicate from ethanrom/ocr-orderid

Browse files

Files changed (12) hide show

.gitattributes +34 -0
3app.py +43 -0
README.md +13 -0
app.py +26 -0
button_click.py +44 -0
button_click_alt.py +60 -0
model.h5 +3 -0
packages.txt +1 -0
process.py +78 -0
requirements.txt +4 -0
wapp.py +53 -0
workingapp.py +26 -0

.gitattributes ADDED Viewed

	@@ -0,0 +1,34 @@

+*.7z filter=lfs diff=lfs merge=lfs -text
+*.arrow filter=lfs diff=lfs merge=lfs -text
+*.bin filter=lfs diff=lfs merge=lfs -text
+*.bz2 filter=lfs diff=lfs merge=lfs -text
+*.ckpt filter=lfs diff=lfs merge=lfs -text
+*.ftz filter=lfs diff=lfs merge=lfs -text
+*.gz filter=lfs diff=lfs merge=lfs -text
+*.h5 filter=lfs diff=lfs merge=lfs -text
+*.joblib filter=lfs diff=lfs merge=lfs -text
+*.lfs.* filter=lfs diff=lfs merge=lfs -text
+*.mlmodel filter=lfs diff=lfs merge=lfs -text
+*.model filter=lfs diff=lfs merge=lfs -text
+*.msgpack filter=lfs diff=lfs merge=lfs -text
+*.npy filter=lfs diff=lfs merge=lfs -text
+*.npz filter=lfs diff=lfs merge=lfs -text
+*.onnx filter=lfs diff=lfs merge=lfs -text
+*.ot filter=lfs diff=lfs merge=lfs -text
+*.parquet filter=lfs diff=lfs merge=lfs -text
+*.pb filter=lfs diff=lfs merge=lfs -text
+*.pickle filter=lfs diff=lfs merge=lfs -text
+*.pkl filter=lfs diff=lfs merge=lfs -text
+*.pt filter=lfs diff=lfs merge=lfs -text
+*.pth filter=lfs diff=lfs merge=lfs -text
+*.rar filter=lfs diff=lfs merge=lfs -text
+*.safetensors filter=lfs diff=lfs merge=lfs -text
+saved_model/**/* filter=lfs diff=lfs merge=lfs -text
+*.tar.* filter=lfs diff=lfs merge=lfs -text
+*.tflite filter=lfs diff=lfs merge=lfs -text
+*.tgz filter=lfs diff=lfs merge=lfs -text
+*.wasm filter=lfs diff=lfs merge=lfs -text
+*.xz filter=lfs diff=lfs merge=lfs -text
+*.zip filter=lfs diff=lfs merge=lfs -text
+*.zst filter=lfs diff=lfs merge=lfs -text
+*tfevents* filter=lfs diff=lfs merge=lfs -text

3app.py ADDED Viewed

	@@ -0,0 +1,43 @@

+import cv2
+import pytesseract
+import streamlit as st
+import numpy as np
+def main():
+    st.set_page_config(page_title='Order ID Finder', layout='wide', page_icon='https://example.com/favicon.ico')
+    st.title('Order ID Finder')
+    st.image('https://seeklogo.com/images/S/streamlit-logo-1A3B208AE4-seeklogo.com.png', width=200)
+    st.write('This app helps you find the order ID from an image of customized jewellery.')
+    with st.sidebar:
+        st.write('## Input')
+        uploaded_file = st.file_uploader('Upload the image file (PNG or JPG)', type=['png', 'jpg'], help='Upload an image of customized jewellery')
+        input_file = st.file_uploader('Upload the input file (TXT)', type=['txt'], help='Upload a TXT file that contains a list of order IDs, names, and font types')
+    if st.button('Find Order ID') and uploaded_file and input_file:
+        with st.spinner('Processing image...'):
+            img = cv2.imdecode(np.fromstring(uploaded_file.read(), np.uint8), 1)
+            gray = cv2.cvtColor(img, cv2.COLOR_BGR2GRAY)
+            text = pytesseract.image_to_string(gray)
+            with input_file as file:
+                file_contents = file.read()
+                lines = file_contents.decode().splitlines()
+                found = False
+                for line in lines:
+                    order_id, name, font = line.strip().split(',')
+                    if name.strip() in text:
+                        st.success(f'Order ID: {order_id}')
+                        found = True
+                        break
+                if not found:
+                    st.error('Could not find the order ID in the image. Please try again with a different image or input file.')
+    st.write('')
+    st.write('')
+    st.write('')
+    st.image('https://www.canpackmachinery.com/wp-content/uploads/2018/03/Footer-Background-01-1.png', width=600)
+    st.write('Contact us: [email protected]')
+    st.write('Follow us on social media: @example')
+if __name__ == '__main__':
+    main()

README.md ADDED Viewed

	@@ -0,0 +1,13 @@

+---
+title: Ocr Orderid
+emoji: 🌍
+colorFrom: pink
+colorTo: gray
+sdk: streamlit
+sdk_version: 1.17.0
+app_file: app.py
+pinned: false
+duplicated_from: ethanrom/ocr-orderid
+---
+Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference

app.py ADDED Viewed

	@@ -0,0 +1,26 @@

+import streamlit as st
+#from button_click import find_order_id
+import tensorflow as tf
+from button_click_alt import find_order_id
+def main():
+    st.set_page_config(page_title='Order ID Finder', layout='wide')
+    st.title('OCR + Font type demo')
+    st.write('intro')
+    with st.sidebar:
+        st.write('## Input')
+        uploaded_file = st.file_uploader('Upload the image file (PNG or JPG)', type=['png', 'jpg'], help='help')
+        input_file = st.file_uploader('Upload the input file (TXT)', type=['txt'], help='help')
+    if st.button('Find Order ID') and uploaded_file and input_file:
+        st.write('## Output')
+        model = tf.keras.models.load_model('model.h5')
+        result = find_order_id(uploaded_file, input_file, model)
+        if result['status'] == 'success':
+            st.success(result['message'])
+        elif result['status'] == 'warning':
+            st.warning(result['message'])
+if __name__ == '__main__':
+    main()

button_click.py ADDED Viewed

	@@ -0,0 +1,44 @@

+import cv2
+import numpy as np
+import pytesseract
+import tensorflow as tf
+from tensorflow.keras.preprocessing.image import img_to_array, load_img
+def find_order_id(uploaded_file, input_file, model):
+    img = cv2.imdecode(np.fromstring(uploaded_file.read(), np.uint8), 1)
+    gray = cv2.cvtColor(img, cv2.COLOR_BGR2GRAY)
+    text = pytesseract.image_to_string(gray)
+    with input_file as file:
+        file_contents = file.read().decode()
+        lines = file_contents.split('\n')
+        found = False
+        for line in lines:
+            order_id, name, font = line.strip().split(',')
+            if name.strip() in text:
+                image = load_img(uploaded_file, target_size=(64, 64))
+                image = img_to_array(image)
+                image = np.expand_dims(image, axis=0)
+                image = image / 255.0
+                prediction = model.predict(image)
+                font_type = 'Pacifico' if prediction[0, 0] > prediction[0, 1] else 'OpenSans-Light'
+                result = {
+                    'status': 'success',
+                    'message': f'Detected Text: {text.strip()}\n, Order ID: {order_id}, Predicted Font Type: {font_type}'
+                }
+                found = True
+                break
+        if not found:
+            image = load_img(uploaded_file, target_size=(64, 64))
+            image = img_to_array(image)
+            image = np.expand_dims(image, axis=0)
+            image = image / 255.0
+            prediction = model.predict(image)
+            font_type = 'Pacifico' if prediction[0, 0] > prediction[0, 1] else 'OpenSans-Light'
+            result = {
+                'status': 'warning',
+                'message': f'Detected Text: {text.strip()}\n, Could not find the Order ID, Predicted Font Type: {font_type}'
+            }
+    return result

button_click_alt.py ADDED Viewed

	@@ -0,0 +1,60 @@

+import cv2
+import numpy as np
+import pytesseract
+import tensorflow as tf
+from tensorflow.keras.preprocessing.image import img_to_array, load_img
+from process import preprocess_image
+def find_order_id(uploaded_file, input_file, model):
+    rotated = preprocess_image(uploaded_file)
+    text = pytesseract.image_to_string(rotated)
+    with input_file as file:
+        file_contents = file.read().decode()
+        lines = file_contents.split('\n')
+        found = False
+        possible_order_ids = []
+        for line in lines:
+            order_id, name, font = line.strip().split(',')
+            if name.strip() in text:
+                image = load_img(uploaded_file, target_size=(64, 64))
+                image = img_to_array(image)
+                image = np.expand_dims(image, axis=0)
+                image = image / 255.0
+                prediction = model.predict(image)
+                font_type = 'Pacifico' if prediction[0, 0] > prediction[0, 1] else 'OpenSans-Light'
+                if font_type == font.strip():
+                    result = {
+                        'status': 'success',
+                        'message': f'Detected Text: {text.strip()}\n, Order ID: {order_id}, Predicted Font Type: {font_type}'
+                    }
+                    found = True
+                    break
+                else:
+                    possible_order_ids.append(order_id)
+        if not found:
+            image = load_img(uploaded_file, target_size=(64, 64))
+            image = img_to_array(image)
+            image = np.expand_dims(image, axis=0)
+            image = image / 255.0
+            prediction = model.predict(image)
+            font_type = 'Pacifico' if prediction[0, 0] > prediction[0, 1] else 'OpenSans-Light'
+            for line in lines:
+                order_id, name, font = line.strip().split(',')
+                if font.strip() == font_type:
+                    possible_order_ids.append(order_id)
+            if len(possible_order_ids) > 0:
+                result = {
+                    'status': 'warning',
+                    'message': f'Detected Text: {text.strip()}\n, Possible Order IDs: {",".join(possible_order_ids)}, Predicted Font Type: {font_type}'
+                }
+            else:
+                result = {
+                    'status': 'error',
+                    'message': f'Detected Text: {text.strip()}\n, Could not find the Order ID and possible font matches.'
+                }
+    return result

model.h5 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:148ca2bd9a8292808dd8ab5e1cfde8164fc92c3a8658ea1007cd2f0b4caacd14
+size 8253400

packages.txt ADDED Viewed

	@@ -0,0 +1 @@


1	+ tesseract-ocr-all

process.py ADDED Viewed

	@@ -0,0 +1,78 @@

+import cv2
+import numpy as np
+def preprocess_image_simple(image_file):
+    img = cv2.imdecode(np.fromstring(image_file.read(), np.uint8), 1)
+    gray = cv2.cvtColor(img, cv2.COLOR_BGR2GRAY)
+    return gray
+def preprocess_image(image_file):
+    img = cv2.imdecode(np.fromstring(image_file.read(), np.uint8), 1)
+    gray = cv2.cvtColor(img, cv2.COLOR_BGR2GRAY)
+    # Thresholding
+    _, thresh = cv2.threshold(gray, 0, 255, cv2.THRESH_BINARY + cv2.THRESH_OTSU)
+    # Image Denoising
+    blur = cv2.GaussianBlur(thresh, (3,3), 0)
+    # Image Binarization
+    thresh = cv2.adaptiveThreshold(blur, 255, cv2.ADAPTIVE_THRESH_MEAN_C, cv2.THRESH_BINARY_INV, 11, 4)
+    # Skew Correction
+    coords = np.column_stack(np.where(thresh > 0))
+    angle = cv2.minAreaRect(coords)[-1]
+    if angle < -45:
+        angle = -(90 + angle)
+    else:
+        angle = -angle
+    (h, w) = thresh.shape[:2]
+    center = (w // 2, h // 2)
+    M = cv2.getRotationMatrix2D(center, angle, 1.0)
+    rotated = cv2.warpAffine(thresh, M, (w, h), flags=cv2.INTER_CUBIC, borderMode=cv2.BORDER_REPLICATE)
+    return rotated
+# Not yet working (author's note): variant of preprocess_image that filters connected components by area, aspect ratio and position before skew correction.
+def preprocess_image_high(image_file):
+    img = cv2.imread(image_file)  # loaded with cv2.imread, whereas the sibling helpers decode image_file.read()
+    gray = cv2.cvtColor(img, cv2.COLOR_BGR2GRAY)
+    # Adaptive thresholding (Gaussian-weighted neighbourhood, block size 11, constant 2)
+    thresh = cv2.adaptiveThreshold(gray, 255, cv2.ADAPTIVE_THRESH_GAUSSIAN_C, cv2.THRESH_BINARY, 11, 2)
+    # Morphological operations: close with a 3x3 rectangle, then open with a 5x5 rectangle
+    kernel = cv2.getStructuringElement(cv2.MORPH_RECT, (3, 3))
+    closed = cv2.morphologyEx(thresh, cv2.MORPH_CLOSE, kernel)
+    kernel = cv2.getStructuringElement(cv2.MORPH_RECT, (5, 5))
+    opened = cv2.morphologyEx(closed, cv2.MORPH_OPEN, kernel)
+    # Connected Component Analysis (CCA)
+    num_labels, labels, stats, centroids = cv2.connectedComponentsWithStats(opened)
+    filtered_labels = []
+    for i in range(1, num_labels):  # label 0 is skipped
+        # Filter out components based on their size, aspect ratio, and position
+        x, y, w, h, area = stats[i]
+        aspect_ratio = float(w) / h
+        if area > 100 and aspect_ratio < 5 and aspect_ratio > 0.2 and x > 10 and y > 10:
+            filtered_labels.append(i)
+    filtered = np.zeros_like(labels)  # same shape and dtype as the label map
+    for i, label in enumerate(filtered_labels):
+        filtered[labels == label] = i + 1  # kept components are renumbered 1..k; all other pixels stay 0
+    # Skew correction: rotate by the angle of the minimum-area rectangle around the kept pixels
+    coords = np.column_stack(np.where(filtered > 0))
+    angle = cv2.minAreaRect(coords)[-1]
+    if angle < -45:
+        angle = -(90 + angle)
+    else:
+        angle = -angle
+    (h, w) = filtered.shape[:2]
+    center = (w // 2, h // 2)
+    M = cv2.getRotationMatrix2D(center, angle, 1.0)
+    rotated = cv2.warpAffine(filtered, M, (w, h), flags=cv2.INTER_CUBIC, borderMode=cv2.BORDER_REPLICATE)  # NOTE(review): input is a label map, not a 0/255 image; possibly why this is "not yet working" - confirm
+    return rotated

requirements.txt ADDED Viewed

	@@ -0,0 +1,4 @@

+opencv-python-headless
+pytesseract
+numpy
+tensorflow

wapp.py ADDED Viewed

	@@ -0,0 +1,53 @@

+import cv2
+import pytesseract
+import streamlit as st
+import numpy as np
+import tensorflow as tf
+from tensorflow.keras.preprocessing.image import load_img, img_to_array
+def main():
+    st.set_page_config(page_title='Order ID Finder', layout='wide')
+    st.title('OCR + Font type demo')
+    st.write('uses OCR to extract text from an uploaded image of a name. The app then attempts to match the extracted text with the corresponding order ID from a uploaded text file. Also uses pre-trained TensorFlow CNN to classify the font type of the extracted text as either Pacifico or OpenSans-Light. If the app successfully matches the text with an order ID, it outputs the order ID, predicted font type, and detected text. If no match is found, it outputs the predicted font type and detected text.')
+    with st.sidebar:
+        st.write('## Input')
+        uploaded_file = st.file_uploader('Upload the image file (PNG or JPG)', type=['png', 'jpg'], help='help')
+        input_file = st.file_uploader('Upload the input file (TXT)', type=['txt'], help='help')
+    if st.button('Find Order ID') and uploaded_file and input_file:
+        st.write('## Output')
+        img = cv2.imdecode(np.fromstring(uploaded_file.read(), np.uint8), 1)
+        gray = cv2.cvtColor(img, cv2.COLOR_BGR2GRAY)
+        text = pytesseract.image_to_string(gray)
+        with input_file as file:
+            file_contents = file.read().decode()
+            lines = file_contents.split('\n')
+            found = False
+            for line in lines:
+                order_id, name, font = line.strip().split(',')
+                if name.strip() in text:
+                    image = load_img(uploaded_file, target_size=(64, 64))
+                    image = img_to_array(image)
+                    image = np.expand_dims(image, axis=0)
+                    image = image / 255.0
+                    prediction = model.predict(image)
+                    font_type = 'Pacifico' if prediction[0, 0] > prediction[0, 1] else 'OpenSans-Light'
+                    st.success(f'Detected Text: {text.strip()}\n, Order ID: {order_id}, Predicted Font Type: {font_type}')
+                    found = True
+                    break
+            if not found:
+                image = load_img(uploaded_file, target_size=(64, 64))
+                image = img_to_array(image)
+                image = np.expand_dims(image, axis=0)
+                image = image / 255.0
+                prediction = model.predict(image)
+                font_type = 'Pacifico' if prediction[0, 0] > prediction[0, 1] else 'OpenSans-Light'
+                st.warning(f'Detected Text: {text.strip()}\n, Could not find the Order ID, Predicted Font Type: {font_type}')
+if __name__ == '__main__':
+    model = tf.keras.models.load_model('model.h5')
+    main()

workingapp.py ADDED Viewed

	@@ -0,0 +1,26 @@

+import cv2
+import pytesseract
+import streamlit as st
+import numpy as np
+def main():
+    st.title('Order ID Finder')
+    uploaded_file = st.file_uploader('Upload an image', type=['png', 'jpg'])
+    input_file = st.file_uploader('Upload the input file', type=['txt'])
+    if uploaded_file and input_file:
+        img = cv2.imdecode(np.fromstring(uploaded_file.read(), np.uint8), 1)
+        gray = cv2.cvtColor(img, cv2.COLOR_BGR2GRAY)
+        text = pytesseract.image_to_string(gray)
+        with input_file as file:
+            file_contents = file.read()
+            lines = file_contents.decode().splitlines()
+            for line in lines:
+                order_id, name, font = line.strip().split(',')
+                if name.strip() in text:
+                    st.success(f'Order ID: {order_id}')
+                    break
+if __name__ == '__main__':
+    main()