Spaces:

Blane187
/

TESTGroq-API-Chat

Paused

App Files Files Community

Nick088 committed on Jul 8, 2024

Commit

b6d6c4d

verified ·

1 Parent(s): df9a14a

Update app.py

Browse files

Files changed (1) hide show

app.py +18 -18

app.py CHANGED Viewed

@@ -256,31 +256,32 @@ def translate_audio(audio_file_path, prompt):
 # subtitles maker
-def create_srt_from_json(transcription_json):
-    """Converts Whisper JSON transcription to SRT format."""
     srt_lines = []
-    for i, segment in enumerate(transcription_json["segments"]):
-        start_time = timedelta(seconds=segment["start"])
-        end_time = timedelta(seconds=segment["end"])
-        text = segment["text"]
-        # Format SRT timestamp
-        start_timestamp = f"{start_time.seconds}:{start_time.microseconds // 1000:03}"
-        end_timestamp = f"{end_time.seconds}:{end_time.microseconds // 1000:03}"
-        srt_lines.append(f"{i+1}\n{start_timestamp} --> {end_timestamp}\n{text}\n\n")
     return "".join(srt_lines)
 def generate_subtitles(audio_file_path, prompt, language, auto_detect_language):
     # Check and process the file first
     processed_path, error_message = check_file(audio_file_path)
     # If there's an error during file check
     if error_message:
         return error_message
     with open(processed_path, "rb") as file:
         transcription_json = client.audio.transcriptions.create(
             file=(os.path.basename(processed_path), file.read()),
@@ -291,11 +292,10 @@ def generate_subtitles(audio_file_path, prompt, language, auto_detect_language):
             temperature=0.0,
         )
-    transcription_json = json.loads(transcription_json.to_json())
-    print(transcription_json)
-    srt_content = create_srt_from_json(transcription_json)
     return srt_content

 # subtitles maker
+def create_srt_from_text(transcription_text):
+    """Converts Groq text transcription to SRT format (assuming no timestamps)."""
     srt_lines = []
+    # Assuming no timestamps, we'll assign a default duration of 1 second to each line
+    duration = timedelta(seconds=1)
+    text_parts = transcription_text.split(".") # Split by periods to separate sentences
+    start_time = timedelta(seconds=0)
+    for i, text_part in enumerate(text_parts):
+        text_part = text_part.strip()
+        if text_part: # Only add lines with text
+            start_timestamp = f"{start_time.seconds}:{start_time.microseconds // 1000:03}"
+            end_timestamp = f"{(start_time + duration).seconds}:{(start_time + duration).microseconds // 1000:03}"
+            srt_lines.append(f"{i+1}\n{start_timestamp} --> {end_timestamp}\n{text_part.strip()}\n\n")
+            start_time += duration
     return "".join(srt_lines)
 def generate_subtitles(audio_file_path, prompt, language, auto_detect_language):
+    """Transcribes the checked audio file and returns the transcription text as SRT content."""
     # Check and process the file first
     processed_path, error_message = check_file(audio_file_path)
     # If there's an error during file check
     if error_message:
         return error_message
     with open(processed_path, "rb") as file:
         transcription_json = client.audio.transcriptions.create(
             file=(os.path.basename(processed_path), file.read()),
             temperature=0.0,
         )
+    # Extract the text from the Groq JSON response
+    transcription_text = transcription_json['text']
+    srt_content = create_srt_from_text(transcription_text)
     return srt_content