Spaces:
Paused
Paused
Update app.py
Browse files
app.py
CHANGED
|
@@ -33,6 +33,7 @@ def youtube_video_downloader(url):
|
|
| 33 |
|
| 34 |
def audio_extraction(video_file, output_format):
|
| 35 |
temp_filename = video_file.name
|
|
|
|
| 36 |
video_path = f"{temp_filename}"
|
| 37 |
audio = extract_audio(
|
| 38 |
input_path=os.fspath(video_file), output_path=f"{str(video_path)[:-4]}.mp3", output_format=f"{output_format}"
|
|
@@ -51,13 +52,11 @@ def audio_processing(mp3_audio):
|
|
| 51 |
def load_asr_model():
    """Create and return the Whisper large-v3 speech-recognition pipeline."""
    return pipeline(
        task="automatic-speech-recognition",
        model="openai/whisper-large-v3",
    )
|
| 54 |
-
|
|
|
|
|
|
|
| 55 |
def transcriber_pass(processed_audio):
    """Transcribe *processed_audio* and return the transcript text.

    The ASR pipeline is expensive to build (it loads Whisper large-v3),
    so it is created on first use and cached on the function object
    instead of being re-loaded on every call, which the original did.
    The commented-out timing scaffolding was removed as dead code.
    """
    model = getattr(transcriber_pass, "_asr_model", None)
    if model is None:
        model = load_asr_model()
        transcriber_pass._asr_model = model  # cache for subsequent calls
    text_extract = model(processed_audio)
    # The pipeline returns a dict; callers only want the raw transcript string.
    return text_extract['text']
|
| 62 |
|
| 63 |
def generate_ai_summary(transcript):
|
|
@@ -80,7 +79,7 @@ with youtube_url_tab:
|
|
| 80 |
if url:
|
| 81 |
if st.button("Transcribe", key="yturl"):
|
| 82 |
with st.spinner("Transcribing..."):
|
| 83 |
-
audio = audio_extraction(
|
| 84 |
audio = audio_processing(audio)
|
| 85 |
ytvideo_transcript = transcriber_pass(audio)
|
| 86 |
st.success(f"Transcription successful")
|
|
@@ -106,7 +105,7 @@ with file_select_tab:
|
|
| 106 |
if video_file:
|
| 107 |
if st.button("Transcribe", key="vidfile"):
|
| 108 |
with st.spinner("Transcribing..."):
|
| 109 |
-
audio = audio_extraction(video_file, "mp3")
|
| 110 |
audio = audio_processing(audio)
|
| 111 |
video_transcript = transcriber_pass(audio)
|
| 112 |
st.success(f"Transcription successful")
|
|
|
|
| 33 |
|
| 34 |
def audio_extraction(video_file, output_format):
|
| 35 |
temp_filename = video_file.name
|
| 36 |
+
|
| 37 |
video_path = f"{temp_filename}"
|
| 38 |
audio = extract_audio(
|
| 39 |
input_path=os.fspath(video_file), output_path=f"{str(video_path)[:-4]}.mp3", output_format=f"{output_format}"
|
|
|
|
| 52 |
def load_asr_model():
    """Return a Hugging Face ASR pipeline backed by Whisper large-v3."""
    asr_pipeline = pipeline(
        task="automatic-speech-recognition",
        model="openai/whisper-large-v3",
    )
    return asr_pipeline
|
| 55 |
+
|
| 56 |
+
# Module-level pipeline: built once at import time so every transcription
# reuses the same Whisper model instead of re-initializing it per call.
transcriber_model = load_asr_model()
|
| 57 |
+
|
| 58 |
def transcriber_pass(processed_audio):
    """Run the module-level ASR pipeline on *processed_audio* and return its text."""
    result = transcriber_model(processed_audio)
    return result['text']
|
| 61 |
|
| 62 |
def generate_ai_summary(transcript):
|
|
|
|
| 79 |
if url:
|
| 80 |
if st.button("Transcribe", key="yturl"):
|
| 81 |
with st.spinner("Transcribing..."):
|
| 82 |
+
audio = audio_extraction(yt_video, "mp3")
|
| 83 |
audio = audio_processing(audio)
|
| 84 |
ytvideo_transcript = transcriber_pass(audio)
|
| 85 |
st.success(f"Transcription successful")
|
|
|
|
| 105 |
if video_file:
|
| 106 |
if st.button("Transcribe", key="vidfile"):
|
| 107 |
with st.spinner("Transcribing..."):
|
| 108 |
+
audio = audio_extraction(os.fspath(video_file), "mp3")
|
| 109 |
audio = audio_processing(audio)
|
| 110 |
video_transcript = transcriber_pass(audio)
|
| 111 |
st.success(f"Transcription successful")
|