Spaces:
Sleeping
Sleeping
File size: 1,241 Bytes
4dd8bbe 5695a1d c5c8132 4dd8bbe c5c8132 4dd8bbe c5c8132 4dd8bbe c5c8132 4dd8bbe c5c8132 4dd8bbe 5695a1d c5c8132 5695a1d c5c8132 5695a1d 4dd8bbe c5c8132 4dd8bbe 5695a1d 4dd8bbe cfbb0f6 4dd8bbe 5695a1d 4dd8bbe |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 |
import gradio as gr
import pytesseract
import cv2
import os
def process(files, lang: str = 'eng') -> str:
results = []
for file in files:
try:
img = cv2.imread(file)
gray = cv2.cvtColor(img, cv2.COLOR_BGR2GRAY)
_, threshold_img = cv2.threshold(gray, 127, 255, cv2.THRESH_TOZERO)
result = pytesseract.image_to_string(threshold_img, lang=lang)
results.append(result)
except Exception as e:
results.append(f"Error processing {file}: {str(e)}")
finally:
os.remove(file)
return "\n\n".join(results)
# Get available languages for pytesseract
langs = pytesseract.get_languages()
# Define the Gradio interface using gr.Files to allow multiple file uploads
interface = gr.Interface(
fn=process,
inputs=[
gr.Files(label="Upload Images", file_count="multiple", type="filepath"),
gr.Dropdown(label="Select Language", choices=langs, type="value")
],
outputs="text",
css="footer {visibility: hidden}",
title="Optical Character Recognition | Batch Image To Text",
article="""
<p style='text-align: center;'>
</p>
"""
)
# Launch the interface
interface.launch(show_api=False)
|