Spaces:

mehdi364
/

Speech_to_text

Sleeping

mehdi364 committed 29 days ago

Commit

0b41553

verified ·

1 Parent(s): ec17e9c

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,27 +1,19 @@
 from transformers import pipeline
-def transcribe_with_whisper():
-    temp_dir = tempfile.gettempdir()
-    if not os.access(temp_dir, os.W_OK):
-        raise PermissionError("No write access to the temporary directory.")
-    audio_path = os.path.join(temp_dir, "temp_audio.wav")
-    subprocess.run([
-        "ffmpeg", "-f", "alsa", "-i", "default", "-t", "5", "-ar", "16000", "-ac", "1", audio_path
-    ], check=True)
-    transcriber = pipeline("automatic-speech-recognition", model="openai/whisper-base.en")
-    result = transcriber(audio_path)
-    return result["text"]
 interface = gr.Interface(
-    fn=transcribe_with_whisper,
-    inputs=[],
     outputs="text",
-    title="تبدیل گفتار به نوشتار با Whisper - فقط فارسی",
-    description="برای شروع ضبط صدا، روی دکمه زیر کلیک کنید و سپس صحبت کنید."
 )
 if __name__ == "__main__":
-    interface.launch(server_name="0.0.0.0", server_port=7860)

+import gradio as gr
 from transformers import pipeline
+def transcribe_audio(audio):
+    """Transcribe a recorded audio file to text with Whisper.
+
+    Args:
+        audio: Path to the recorded audio file as supplied by the Gradio
+            audio input (configured with type="filepath"), or None when
+            no recording is available.
+
+    Returns:
+        The transcribed text, or an empty string when there is no audio.
+    """
+    # With live=True the callback fires on every input change, including
+    # when the recording is cleared; nothing to transcribe in that case.
+    if audio is None:
+        return ""
+    # Build the pipeline once and reuse it: constructing it on every call
+    # reloads the model each time the live interface triggers.
+    transcriber = getattr(transcribe_audio, "_transcriber", None)
+    if transcriber is None:
+        transcriber = pipeline("automatic-speech-recognition", model="openai/whisper-base")
+        transcribe_audio._transcriber = transcriber
+    result = transcriber(audio)
+    return result['text']
 interface = gr.Interface(
+    fn=transcribe_audio,
+    inputs=gr.Audio(source="microphone", type="filepath", label="Input Audio"),
     outputs="text",
+    live=True,
+    title="Speech to Text - Persian",
+    description="Record your voice in Persian and see the transcription here."
 )
 if __name__ == "__main__":
+    interface.launch()