Spaces:

MultiTransformer
/

AyaTonic

Runtime error

App Files Files Community

ahmadtalha committed on Feb 25, 2024

Commit

a05af10

verified ·

1 Parent(s): c44ba13

Update app.py

Browse files

Files changed (1) hide show

app.py +3 -5

app.py CHANGED Viewed

@@ -76,6 +76,7 @@ def process_audio_to_text(audio_path):
         "English",
         api_name="/s2tt"
     )
     return result['text']  # Adjust based on the actual response
 def process_text_to_audio(text, target_language="English"):
@@ -119,8 +120,6 @@ def process_input(image=None, file=None, audio=None, text=""):
         for idx in range(len((list(ocr_prediction)[0][1]))):
             final_text += " "
             final_text += list((list(ocr_prediction)[0][1])[idx])[1][1]
-        # final_text += "\n" + ocr_processor.process_image(image)
-        print(final_text)
     if file is not None:
         if file.name.lower().endswith(('.png', '.jpg', '.jpeg')):
             pil_image = Image.open(file)
@@ -129,17 +128,15 @@ def process_input(image=None, file=None, audio=None, text=""):
             for idx in range(len((list(ocr_prediction)[0][1]))):
                 final_text += " "
                 final_text += list((list(ocr_prediction)[0][1])[idx])[1][1]
-            print(final_text)
         elif file.name.lower().endswith('.pdf'):
             ocr_prediction = ocr_processor.process_pdf(file.name)
             # getting text from ocr object
             for idx in range(len((list(ocr_prediction)[0][1]))):
                 final_text += " "
                 final_text += list((list(ocr_prediction)[0][1])[idx])[1][1]
-            print(final_text)
-            # final_text += "\n" + ocr_processor.process_pdf(file.name)
         else:
             final_text += "\nUnsupported file type."
     if audio is not None:
         audio_text = process_audio_to_text(audio)
         final_text += "\n" + audio_text
@@ -151,6 +148,7 @@ def process_input(image=None, file=None, audio=None, text=""):
         temperature=0.5
     )
     generated_text = response.generations[0].text
     # Process generated text with command-nightly model
     response = co.generate(

         "English",
         api_name="/s2tt"
     )
+    print("Audio Result: ", result)
     return result['text']  # Adjust based on the actual response
 def process_text_to_audio(text, target_language="English"):
         for idx in range(len((list(ocr_prediction)[0][1]))):
             final_text += " "
             final_text += list((list(ocr_prediction)[0][1])[idx])[1][1]
     if file is not None:
         if file.name.lower().endswith(('.png', '.jpg', '.jpeg')):
             pil_image = Image.open(file)
             for idx in range(len((list(ocr_prediction)[0][1]))):
                 final_text += " "
                 final_text += list((list(ocr_prediction)[0][1])[idx])[1][1]
         elif file.name.lower().endswith('.pdf'):
             ocr_prediction = ocr_processor.process_pdf(file.name)
             # getting text from ocr object
             for idx in range(len((list(ocr_prediction)[0][1]))):
                 final_text += " "
                 final_text += list((list(ocr_prediction)[0][1])[idx])[1][1]
         else:
             final_text += "\nUnsupported file type."
+    print(final_text)
     if audio is not None:
         audio_text = process_audio_to_text(audio)
         final_text += "\n" + audio_text
         temperature=0.5
     )
     generated_text = response.generations[0].text
+    print("Generated Text: ", generated_text)
     # Process generated text with command-nightly model
     response = co.generate(