Spaces:
Runtime error
Runtime error
Vincent Claes
commited on
Commit
·
9fcc04d
1
Parent(s):
5aae428
first working version
Browse files- .gitignore +1 -0
- README.md +3 -0
- app.py +87 -0
- requirements.txt +4 -0
.gitignore
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
.env
|
README.md
CHANGED
|
@@ -20,4 +20,7 @@ You are a podcast editor that specialized to create a script out of a webpage.
|
|
| 20 |
[BREAKS]
|
| 21 |
- Use the <break time="1s"/> tag to add a pause in the speech. Use it after each paragraph and after a sentence when appropriate to get to a relax tone.
|
| 22 |
- Use <break time="3s"/> for longer pauses, to emphasize a point.
|
|
|
|
|
|
|
|
|
|
| 23 |
```
|
|
|
|
| 20 |
[BREAKS]
|
| 21 |
- Use the <break time="1s"/> tag to add a pause in the speech. Use it after each paragraph and after a sentence when appropriate to get to a relax tone.
|
| 22 |
- Use <break time="3s"/> for longer pauses, to emphasize a point.
|
| 23 |
+
|
| 24 |
+
[LINK]
|
| 25 |
+
{link}
|
| 26 |
```
|
app.py
ADDED
|
@@ -0,0 +1,87 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# import numpy as np
|
| 2 |
+
import gradio
|
| 3 |
+
from openai import OpenAI
|
| 4 |
+
import tempfile
|
| 5 |
+
import os
|
| 6 |
+
|
| 7 |
+
from dotenv import load_dotenv
|
| 8 |
+
load_dotenv()
|
| 9 |
+
|
| 10 |
+
import uuid
|
| 11 |
+
|
| 12 |
+
|
| 13 |
+
client = OpenAI()
|
| 14 |
+
|
| 15 |
+
DEFAULT_SYSTEM_PROMPT = """
|
| 16 |
+
You are a podcast editor that specialized to create a script out of a webpage.
|
| 17 |
+
|
| 18 |
+
[TASKS]
|
| 19 |
+
- You will receive a link to a webpage about some content.
|
| 20 |
+
- You will create a script out of the content.
|
| 21 |
+
- The script should be 1 minute long if you read it out loud.
|
| 22 |
+
- Start with an intro to peak the interest of the listener.
|
| 23 |
+
- Then, summarize the content in a way that is easy to understand. Ask questions about the the content and answer them.
|
| 24 |
+
- Conclude with the most intriguing part of the content.
|
| 25 |
+
- Refrain from adding section headers in the script like [INTRUCTION], [CONTENT], [CONCLUSION].
|
| 26 |
+
- The script should be inspiring, written in colloquialism with english words and proverbs understood around the world.
|
| 27 |
+
- Write in a relax tone.
|
| 28 |
+
- Use filler words like 'um', 'ah', 'well' etc. to make it sound more natural.
|
| 29 |
+
|
| 30 |
+
[BREAKS]
|
| 31 |
+
- Use the <break time="1s"/> tag to add a pause in the speech. Use it after each paragraph and after a sentence when appropriate to get to a relax tone.
|
| 32 |
+
- Use <break time="3s"/> for longer pauses, to emphasize a point.
|
| 33 |
+
"""
|
| 34 |
+
|
| 35 |
+
def generate_episode(system_prompt, weblink):
|
| 36 |
+
# sr = 48000
|
| 37 |
+
# a4_freq, tones_from_a4 = 440, 12 * (octave - 4) + (note - 9)
|
| 38 |
+
# frequency = a4_freq * 2 ** (tones_from_a4 / 12)
|
| 39 |
+
# duration = int(duration)
|
| 40 |
+
# audio = np.linspace(0, duration, duration * sr)
|
| 41 |
+
# audio = (20000 * np.sin(audio * (2 * np.pi * frequency))).astype(np.int16)
|
| 42 |
+
# return sr, audio
|
| 43 |
+
response = client.chat.completions.create(
|
| 44 |
+
model="gpt-4o",
|
| 45 |
+
messages=[
|
| 46 |
+
{"role": "system", "content": system_prompt},
|
| 47 |
+
{"role": "user", "content": weblink},
|
| 48 |
+
]
|
| 49 |
+
)
|
| 50 |
+
script = response.choices[0].message.content
|
| 51 |
+
response = client.audio.speech.create(
|
| 52 |
+
model="tts-1",
|
| 53 |
+
voice="fable",
|
| 54 |
+
input=script,
|
| 55 |
+
)
|
| 56 |
+
|
| 57 |
+
with tempfile.NamedTemporaryFile(suffix=".mp3", delete=False) as temp_file:
|
| 58 |
+
temp_file.write(response.content)
|
| 59 |
+
# state["mp3_file"] = temp_file.name
|
| 60 |
+
return temp_file.name
|
| 61 |
+
|
| 62 |
+
|
| 63 |
+
def cleanup(state):
|
| 64 |
+
mp3_file_name = state.get("mp3_file")
|
| 65 |
+
if mp3_file_name and os.path.exists(mp3_file_name):
|
| 66 |
+
os.remove(mp3_file_name)
|
| 67 |
+
print(f"Removed file: {mp3_file_name}")
|
| 68 |
+
else:
|
| 69 |
+
print(f"No file found to delete: {mp3_file_name}")
|
| 70 |
+
|
| 71 |
+
demo = gradio.Interface(
|
| 72 |
+
fn=generate_episode,
|
| 73 |
+
inputs=[
|
| 74 |
+
gradio.Textbox(value=DEFAULT_SYSTEM_PROMPT, label="System Prompt"),
|
| 75 |
+
gradio.Textbox(value="https://en.wikipedia.org/wiki/Mount_Tambora", label="Weblink"),
|
| 76 |
+
# gradio.State(), # State to track the mp3 file
|
| 77 |
+
|
| 78 |
+
],
|
| 79 |
+
# outputs=["audio", gradio.State()],
|
| 80 |
+
outputs="audio",
|
| 81 |
+
|
| 82 |
+
)
|
| 83 |
+
|
| 84 |
+
# demo.cleanup(cleanup)
|
| 85 |
+
|
| 86 |
+
if __name__ == "__main__":
|
| 87 |
+
demo.launch()
|
requirements.txt
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
gradio
|
| 2 |
+
numpy
|
| 3 |
+
python-dotenv
|
| 4 |
+
openai
|