Spaces:

renatotn7
/

vozparatexto

Runtime error

App Files Files Community

renatotn7 committed on Nov 22, 2022

Commit

7f51198

1 Parent(s): 3892f6c

Update app.py

Browse files

Files changed (1) hide show

app.py +7 -16

app.py CHANGED Viewed

@@ -1,5 +1,5 @@
 from typing import Iterator
-import streamlit as st
 from io import StringIO
 import os
 import pathlib
@@ -17,7 +17,7 @@ from src.utils import slugify, write_srt, write_vtt
 from src.vad import NonSpeechStrategy, PeriodicTranscriptionConfig, TranscriptionConfig, VadPeriodicTranscription, VadSileroTranscription
 # Limitations (set to -1 to disable)
-DEFAULT_INPUT_AUDIO_MAX_DURATION = 600 # seconds
 # Whether or not to automatically delete all uploaded files, to save disk space
 DELETE_UPLOADED_FILES = True
@@ -221,10 +221,11 @@ def create_ui(inputAudioMaxDuration, share=False, server_name: str = None):
     ui_article = "Read the [documentation here](https://huggingface.co/spaces/aadnk/whisper-webui/blob/main/docs/options.md)"
     demo = gr.Interface(fn=ui.transcribe_webui, description=ui_description, article=ui_article, inputs=[
-        gr.Dropdown(choices=["tiny", "base", "small", "medium", "large"], value="medium", label="Model"),
         gr.Dropdown(choices=sorted(LANGUAGES), label="Language"),
         gr.Text(label="URL (YouTube, etc.)"),
-        gr.Audio(source="upload", type="filepath", label="Upload Audio"),
         gr.Audio(source="microphone", type="filepath", label="Microphone Input"),
         gr.Dropdown(choices=["transcribe", "translate"], label="Task"),
         gr.Dropdown(choices=["none", "silero-vad", "silero-vad-skip-gaps", "silero-vad-expand-into-gaps", "periodic-vad"], label="VAD"),
@@ -236,21 +237,11 @@ def create_ui(inputAudioMaxDuration, share=False, server_name: str = None):
         gr.File(label="Download"),
         gr.Text(label="Transcription"),
         gr.Text(label="Segments")
     ])
     demo.launch(share=share, server_name=server_name)
 if __name__ == '__main__':
-    uploaded_file = st.file_uploader("Choose a file")
-    if uploaded_file is not None:
-        # To read file as bytes:
-        bytes_data = uploaded_file.getvalue()
-        st.video(bytes_data)
-        os.system("rm -R /tmp/*")
-        os.system("mkdir /tmp/_input")
-        os.system("mkdir /tmp/_output")
-        os.system("mkdir /tmp/_outputf")
-        os.system("mkdir /tmp/videoSaida")
-        with open("/tmp/inputvideo", "wb") as binary_file:
-           binary_file.write(bytes_data)
     create_ui(DEFAULT_INPUT_AUDIO_MAX_DURATION)

 from typing import Iterator
 from io import StringIO
 import os
 import pathlib
 from src.vad import NonSpeechStrategy, PeriodicTranscriptionConfig, TranscriptionConfig, VadPeriodicTranscription, VadSileroTranscription
 # Limitations (set to -1 to disable)
+DEFAULT_INPUT_AUDIO_MAX_DURATION = 1200 # seconds
 # Whether or not to automatically delete all uploaded files, to save disk space
 DELETE_UPLOADED_FILES = True
     ui_article = "Read the [documentation here](https://huggingface.co/spaces/aadnk/whisper-webui/blob/main/docs/options.md)"
     demo = gr.Interface(fn=ui.transcribe_webui, description=ui_description, article=ui_article, inputs=[
+        gr.Dropdown(choices=["medium.en", "large"], value="medium.en", label="Model"),
         gr.Dropdown(choices=sorted(LANGUAGES), label="Language"),
         gr.Text(label="URL (YouTube, etc.)"),
+        gr.Audio(source="upload", type="filepath", label="Upload Audio"),
+        gr.File(label="submeta seu video",interactive=True)
         gr.Audio(source="microphone", type="filepath", label="Microphone Input"),
         gr.Dropdown(choices=["transcribe", "translate"], label="Task"),
         gr.Dropdown(choices=["none", "silero-vad", "silero-vad-skip-gaps", "silero-vad-expand-into-gaps", "periodic-vad"], label="VAD"),
         gr.File(label="Download"),
         gr.Text(label="Transcription"),
         gr.Text(label="Segments")
+        gr.Text(label="Videos")
     ])
     demo.launch(share=share, server_name=server_name)
 if __name__ == '__main__':
     create_ui(DEFAULT_INPUT_AUDIO_MAX_DURATION)