Ktk

Sleeping

App Files Files Community

NeuralFalcon committed on Jan 21

Commit

78e1d58

verified ·

1 Parent(s): 852635a

Update app.py

Browse files

Files changed (1) hide show

app.py +4 -5

app.py CHANGED Viewed

@@ -44,7 +44,7 @@ def update_model(model_name):
-def text_to_speech(text, model_name="kokoro-v0_19-half.pth", voice_name="af", speed=1.0, trim=1.0, pad_between_segments=0, remove_silence=True, minimum_silence=0.20):
     """
     Converts text to speech using the specified parameters and ensures the model is updated only if necessary.
     """
@@ -129,7 +129,6 @@ with gr.Blocks() as demo1:
                 #     minimum=0, maximum=1, value=0, step=0.1,
                 #     label='🔪 Trim', info='How much to cut from both ends of each segment'
                 # )
-                trim=0.5
                 pad_between = gr.Slider(
                     minimum=0, maximum=2, value=0, step=0.1,
                     label='🔇 Pad Between', info='Silent Duration between segments [For Large Text]'
@@ -143,12 +142,12 @@ with gr.Blocks() as demo1:
     text.submit(
         text_to_speech,
-        inputs=[text, model_name,voice, speed, trim, pad_between, remove_silence, minimum_silence],
         outputs=[audio]
     )
     generate_btn.click(
         text_to_speech,
-        inputs=[text,model_name, voice, speed, trim, pad_between, remove_silence, minimum_silence],
         outputs=[audio]
     )
@@ -258,7 +257,7 @@ import time
 def your_tts(text,audio_path,actual_duration,speed=1.0):
   global srt_voice_name
   model_name="kokoro-v0_19.pth"
-  tts_path=text_to_speech(text, model_name, voice_name=srt_voice_name,speed=speed)
   print(tts_path)
   tts_audio = AudioSegment.from_file(tts_path)
   tts_duration = len(tts_audio)

+def text_to_speech(text, model_name="kokoro-v0_19-half.pth", voice_name="af", speed=1.0, trim=0.5, pad_between_segments=0, remove_silence=True, minimum_silence=0.20):
     """
     Converts text to speech using the specified parameters and ensures the model is updated only if necessary.
     """
                 #     minimum=0, maximum=1, value=0, step=0.1,
                 #     label='🔪 Trim', info='How much to cut from both ends of each segment'
                 # )
                 pad_between = gr.Slider(
                     minimum=0, maximum=2, value=0, step=0.1,
                     label='🔇 Pad Between', info='Silent Duration between segments [For Large Text]'
     text.submit(
         text_to_speech,
+        inputs=[text, model_name,voice, speed, pad_between, remove_silence, minimum_silence],
         outputs=[audio]
     )
     generate_btn.click(
         text_to_speech,
+        inputs=[text,model_name, voice, speed, pad_between, remove_silence, minimum_silence],
         outputs=[audio]
     )
 def your_tts(text,audio_path,actual_duration,speed=1.0):
   global srt_voice_name
   model_name="kokoro-v0_19.pth"
+  tts_path=text_to_speech(text, model_name, voice_name=srt_voice_name,speed=speed,trim=1.0)
   print(tts_path)
   tts_audio = AudioSegment.from_file(tts_path)
   tts_duration = len(tts_audio)