TulipAIs committed on
Commit
ca4a31b
1 Parent(s): 91f4b0a

Updating Wiki tabs in AudioGen and MusicGen

Browse files
Files changed (1) hide show
  1. app.py +106 -103
app.py CHANGED
@@ -959,11 +959,12 @@ def ui_full(launch_kwargs):
959
  Welcome to Soundscapes - TulipAI’s flagship Audio Storytelling Toolkit. Designed with modern content creators in mind, our AI-driven platform generates audio sound effects in just minutes tailored to your unique needs.
960
  """
961
  )
962
- with gr.Tab("AudioGen"):
963
  with gr.Tab("Generate Sound Effects"):
964
  gr.Markdown(
965
  """
966
  ### AudioGen
 
967
  """
968
  )
969
  with gr.Row():
@@ -1052,7 +1053,7 @@ def ui_full(launch_kwargs):
1052
  send_audio_a = gr.Button("Send to Input Audio")
1053
  seed_used_a = gr.Number(label='Seed used', value=-1, interactive=False)
1054
  download_a = gr.File(label="Generated Files", interactive=False)
1055
- with gr.Tab("Wiki"):
1056
  gr.Markdown(
1057
  """
1058
  - **[Generate (button)]:**
@@ -1179,111 +1180,113 @@ def ui_full(launch_kwargs):
1179
  """
1180
  )
1181
  with gr.Tab("MusicGen"):
1182
- gr.Markdown(
1183
- """
1184
- ### MusicGen
1185
- """
1186
- )
1187
- with gr.Row():
1188
- with gr.Column():
1189
- with gr.Tab("Generation"):
1190
- with gr.Accordion("Structure Prompts", open=False):
1191
- with gr.Column():
1192
- with gr.Row():
1193
- struc_prompts = gr.Checkbox(label="Enable", value=False, interactive=True, container=False)
1194
- bpm = gr.Number(label="BPM", value=120, interactive=True, scale=1, precision=0)
1195
- key = gr.Dropdown(["C", "C#", "D", "D#", "E", "F", "F#", "G", "G#", "A", "Bb", "B"], label="Key", value="C", interactive=True)
1196
- scale = gr.Dropdown(["Major", "Minor"], label="Scale", value="Major", interactive=True)
1197
- with gr.Row():
1198
- global_prompt = gr.Text(label="Global Prompt", interactive=True, scale=3)
1199
- with gr.Row():
1200
- s = gr.Slider(1, max_textboxes, value=1, step=1, label="Prompts:", interactive=True, scale=2)
1201
- #s_mode = gr.Radio(["segmentation", "batch"], value="segmentation", interactive=True, scale=1, label="Generation Mode")
1202
- with gr.Column():
1203
- textboxes = []
1204
- prompts = []
1205
- repeats = []
1206
- calcs = []
1207
  with gr.Row():
1208
- text0 = gr.Text(label="Input Text", interactive=True, scale=4)
1209
- prompts.append(text0)
1210
- drag0 = gr.Number(label="Repeat", value=1, interactive=True, scale=1)
1211
- repeats.append(drag0)
1212
- calc0 = gr.Text(interactive=False, value="00:00 - 00:00", scale=1, label="Time")
1213
- calcs.append(calc0)
1214
- for i in range(max_textboxes):
1215
- with gr.Row(visible=False) as t:
1216
- text = gr.Text(label="Input Text", interactive=True, scale=3)
1217
- repeat = gr.Number(label="Repeat", minimum=1, value=1, interactive=True, scale=1)
1218
- calc = gr.Text(interactive=False, value="00:00 - 00:00", scale=1, label="Time")
1219
- textboxes.append(t)
1220
- prompts.append(text)
1221
- repeats.append(repeat)
1222
- calcs.append(calc)
1223
- to_calc = gr.Button("Calculate Timings", variant="secondary")
1224
- with gr.Row():
1225
- duration = gr.Slider(minimum=1, maximum=300, value=10, step=1, label="Duration", interactive=True)
1226
- with gr.Row():
1227
- overlap = gr.Slider(minimum=1, maximum=29, value=12, step=1, label="Overlap", interactive=True)
1228
- with gr.Row():
1229
- seed = gr.Number(label="Seed", value=-1, scale=4, precision=0, interactive=True)
1230
- gr.Button('\U0001f3b2\ufe0f', scale=1).click(fn=lambda: -1, outputs=[seed], queue=False)
1231
- reuse_seed = gr.Button('\u267b\ufe0f', scale=1)
1232
-
1233
- with gr.Tab("Audio"):
1234
- with gr.Row():
1235
- with gr.Column():
1236
- input_type = gr.Radio(["file", "mic"], value="file", label="Input Type (optional)", interactive=True)
1237
- mode = gr.Radio(["melody", "sample"], label="Input Audio Mode (optional)", value="sample", interactive=True)
1238
- with gr.Row():
1239
- trim_start = gr.Number(label="Trim Start", value=0, interactive=True)
1240
- trim_end = gr.Number(label="Trim End", value=0, interactive=True)
1241
- audio = gr.Audio(source="upload", type="numpy", label="Input Audio (optional)", interactive=True)
1242
-
1243
- with gr.Tab("Customization"):
1244
- with gr.Row():
1245
- with gr.Column():
1246
- background = gr.ColorPicker(value="#0f0f0f", label="background color", interactive=True, scale=0)
1247
- bar1 = gr.ColorPicker(value="#84cc16", label="bar color start", interactive=True, scale=0)
1248
- bar2 = gr.ColorPicker(value="#10b981", label="bar color end", interactive=True, scale=0)
1249
  with gr.Column():
1250
- image = gr.Image(label="Background Image", type="filepath", interactive=True, scale=4)
 
 
 
1251
  with gr.Row():
1252
- height = gr.Number(label="Height", value=512, interactive=True)
1253
- width = gr.Number(label="Width", value=768, interactive=True)
1254
-
1255
- with gr.Tab("Settings"):
1256
- with gr.Row():
1257
- channel = gr.Radio(["mono", "stereo", "stereo effect"], label="Output Audio Channels", value="stereo", interactive=True, scale=1)
1258
- sr_select = gr.Dropdown(["11025", "16000", "22050", "24000", "32000", "44100", "48000"], label="Output Audio Sample Rate", value="48000", interactive=True)
1259
- with gr.Row():
1260
- model = gr.Radio(["melody", "small", "medium", "large", "custom"], label="Model", value="large", interactive=True, scale=1)
1261
- with gr.Column():
1262
- dropdown = gr.Dropdown(choices=get_available_models(), value=("No models found" if len(get_available_models()) < 1 else get_available_models()[0]), label='Custom Model (models folder)', elem_classes='slim-dropdown', interactive=True)
1263
- ui.create_refresh_button(dropdown, lambda: None, lambda: {'choices': get_available_models()}, 'refresh-button')
1264
- basemodel = gr.Radio(["small", "medium", "melody", "large"], label="Base Model", value="medium", interactive=True, scale=1)
1265
- with gr.Row():
1266
- decoder = gr.Radio(["Default", "MultiBand_Diffusion"], label="Decoder", value="Default", interactive=True)
1267
- with gr.Row():
1268
- topk = gr.Number(label="Top-k", value=250, interactive=True)
1269
- topp = gr.Number(label="Top-p", value=0, interactive=True)
1270
- temperature = gr.Number(label="Temperature", value=1.0, interactive=True)
1271
- cfg_coef = gr.Number(label="Classifier Free Guidance", value=3.0, interactive=True)
1272
- with gr.Row():
1273
- submit = gr.Button("Generate", variant="primary")
1274
- # Adapted from https://github.com/rkfg/audiocraft/blob/long/app.py, MIT license.
1275
- _ = gr.Button("Interrupt").click(fn=interrupt, queue=False)
1276
- with gr.Column() as c:
1277
- with gr.Tab("Output"):
1278
- output = gr.Video(label="Generated Music", scale=0)
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1279
  with gr.Row():
1280
- audio_only = gr.Audio(type="numpy", label="Audio Only", interactive=False)
1281
- backup_only = gr.Audio(type="numpy", label="Backup Audio", interactive=False, visible=False)
1282
- send_audio = gr.Button("Send to Input Audio")
1283
- seed_used = gr.Number(label='Seed used', value=-1, interactive=False)
1284
- download = gr.File(label="Generated Files", interactive=False)
1285
- with gr.Tab("Wiki"):
1286
- gr.Markdown(
 
 
 
 
 
 
 
1287
  """
1288
  - **[Generate (button)]:**
1289
  Generates the music with the given settings and prompts.
 
959
  Welcome to Soundscapes - TulipAI’s flagship Audio Storytelling Toolkit. Designed with modern content creators in mind, our AI-driven platform generates audio sound effects in just minutes tailored to your unique needs.
960
  """
961
  )
962
+ with gr.Tab("## AudioGen"):
963
  with gr.Tab("Generate Sound Effects"):
964
  gr.Markdown(
965
  """
966
  ### AudioGen
967
+ Check the "Wiki" to learn how to take the most out of TulipAI Soundscapes Sound Effects Generation Tool.
968
  """
969
  )
970
  with gr.Row():
 
1053
  send_audio_a = gr.Button("Send to Input Audio")
1054
  seed_used_a = gr.Number(label='Seed used', value=-1, interactive=False)
1055
  download_a = gr.File(label="Generated Files", interactive=False)
1056
+ with gr.Tab("## Wiki"):
1057
  gr.Markdown(
1058
  """
1059
  - **[Generate (button)]:**
 
1180
  """
1181
  )
1182
  with gr.Tab("MusicGen"):
1183
+ gr.tab("## MusicGen"):
1184
+ gr.Markdown(
1185
+ """
1186
+ ### MusicGen
1187
+ Check the "Wiki" to learn how to take the most out of TulipAI Soundscapes Music Generation Tool.
1188
+ """
1189
+ )
1190
+ with gr.Row():
1191
+ with gr.Column():
1192
+ with gr.Tab("Generation"):
1193
+ with gr.Accordion("Structure Prompts", open=False):
1194
+ with gr.Column():
1195
+ with gr.Row():
1196
+ struc_prompts = gr.Checkbox(label="Enable", value=False, interactive=True, container=False)
1197
+ bpm = gr.Number(label="BPM", value=120, interactive=True, scale=1, precision=0)
1198
+ key = gr.Dropdown(["C", "C#", "D", "D#", "E", "F", "F#", "G", "G#", "A", "Bb", "B"], label="Key", value="C", interactive=True)
1199
+ scale = gr.Dropdown(["Major", "Minor"], label="Scale", value="Major", interactive=True)
1200
+ with gr.Row():
1201
+ global_prompt = gr.Text(label="Global Prompt", interactive=True, scale=3)
 
 
 
 
 
 
1202
  with gr.Row():
1203
+ s = gr.Slider(1, max_textboxes, value=1, step=1, label="Prompts:", interactive=True, scale=2)
1204
+ #s_mode = gr.Radio(["segmentation", "batch"], value="segmentation", interactive=True, scale=1, label="Generation Mode")
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1205
  with gr.Column():
1206
+ textboxes = []
1207
+ prompts = []
1208
+ repeats = []
1209
+ calcs = []
1210
  with gr.Row():
1211
+ text0 = gr.Text(label="Input Text", interactive=True, scale=4)
1212
+ prompts.append(text0)
1213
+ drag0 = gr.Number(label="Repeat", value=1, interactive=True, scale=1)
1214
+ repeats.append(drag0)
1215
+ calc0 = gr.Text(interactive=False, value="00:00 - 00:00", scale=1, label="Time")
1216
+ calcs.append(calc0)
1217
+ for i in range(max_textboxes):
1218
+ with gr.Row(visible=False) as t:
1219
+ text = gr.Text(label="Input Text", interactive=True, scale=3)
1220
+ repeat = gr.Number(label="Repeat", minimum=1, value=1, interactive=True, scale=1)
1221
+ calc = gr.Text(interactive=False, value="00:00 - 00:00", scale=1, label="Time")
1222
+ textboxes.append(t)
1223
+ prompts.append(text)
1224
+ repeats.append(repeat)
1225
+ calcs.append(calc)
1226
+ to_calc = gr.Button("Calculate Timings", variant="secondary")
1227
+ with gr.Row():
1228
+ duration = gr.Slider(minimum=1, maximum=300, value=10, step=1, label="Duration", interactive=True)
1229
+ with gr.Row():
1230
+ overlap = gr.Slider(minimum=1, maximum=29, value=12, step=1, label="Overlap", interactive=True)
1231
+ with gr.Row():
1232
+ seed = gr.Number(label="Seed", value=-1, scale=4, precision=0, interactive=True)
1233
+ gr.Button('\U0001f3b2\ufe0f', scale=1).click(fn=lambda: -1, outputs=[seed], queue=False)
1234
+ reuse_seed = gr.Button('\u267b\ufe0f', scale=1)
1235
+
1236
+ with gr.Tab("Audio"):
1237
+ with gr.Row():
1238
+ with gr.Column():
1239
+ input_type = gr.Radio(["file", "mic"], value="file", label="Input Type (optional)", interactive=True)
1240
+ mode = gr.Radio(["melody", "sample"], label="Input Audio Mode (optional)", value="sample", interactive=True)
1241
+ with gr.Row():
1242
+ trim_start = gr.Number(label="Trim Start", value=0, interactive=True)
1243
+ trim_end = gr.Number(label="Trim End", value=0, interactive=True)
1244
+ audio = gr.Audio(source="upload", type="numpy", label="Input Audio (optional)", interactive=True)
1245
+
1246
+ with gr.Tab("Customization"):
1247
+ with gr.Row():
1248
+ with gr.Column():
1249
+ background = gr.ColorPicker(value="#0f0f0f", label="background color", interactive=True, scale=0)
1250
+ bar1 = gr.ColorPicker(value="#84cc16", label="bar color start", interactive=True, scale=0)
1251
+ bar2 = gr.ColorPicker(value="#10b981", label="bar color end", interactive=True, scale=0)
1252
+ with gr.Column():
1253
+ image = gr.Image(label="Background Image", type="filepath", interactive=True, scale=4)
1254
+ with gr.Row():
1255
+ height = gr.Number(label="Height", value=512, interactive=True)
1256
+ width = gr.Number(label="Width", value=768, interactive=True)
1257
+
1258
+ with gr.Tab("Settings"):
1259
+ with gr.Row():
1260
+ channel = gr.Radio(["mono", "stereo", "stereo effect"], label="Output Audio Channels", value="stereo", interactive=True, scale=1)
1261
+ sr_select = gr.Dropdown(["11025", "16000", "22050", "24000", "32000", "44100", "48000"], label="Output Audio Sample Rate", value="48000", interactive=True)
1262
+ with gr.Row():
1263
+ model = gr.Radio(["melody", "small", "medium", "large", "custom"], label="Model", value="large", interactive=True, scale=1)
1264
+ with gr.Column():
1265
+ dropdown = gr.Dropdown(choices=get_available_models(), value=("No models found" if len(get_available_models()) < 1 else get_available_models()[0]), label='Custom Model (models folder)', elem_classes='slim-dropdown', interactive=True)
1266
+ ui.create_refresh_button(dropdown, lambda: None, lambda: {'choices': get_available_models()}, 'refresh-button')
1267
+ basemodel = gr.Radio(["small", "medium", "melody", "large"], label="Base Model", value="medium", interactive=True, scale=1)
1268
+ with gr.Row():
1269
+ decoder = gr.Radio(["Default", "MultiBand_Diffusion"], label="Decoder", value="Default", interactive=True)
1270
+ with gr.Row():
1271
+ topk = gr.Number(label="Top-k", value=250, interactive=True)
1272
+ topp = gr.Number(label="Top-p", value=0, interactive=True)
1273
+ temperature = gr.Number(label="Temperature", value=1.0, interactive=True)
1274
+ cfg_coef = gr.Number(label="Classifier Free Guidance", value=3.0, interactive=True)
1275
  with gr.Row():
1276
+ submit = gr.Button("Generate", variant="primary")
1277
+ # Adapted from https://github.com/rkfg/audiocraft/blob/long/app.py, MIT license.
1278
+ _ = gr.Button("Interrupt").click(fn=interrupt, queue=False)
1279
+ with gr.Column() as c:
1280
+ with gr.Tab("Output"):
1281
+ output = gr.Video(label="Generated Music", scale=0)
1282
+ with gr.Row():
1283
+ audio_only = gr.Audio(type="numpy", label="Audio Only", interactive=False)
1284
+ backup_only = gr.Audio(type="numpy", label="Backup Audio", interactive=False, visible=False)
1285
+ send_audio = gr.Button("Send to Input Audio")
1286
+ seed_used = gr.Number(label='Seed used', value=-1, interactive=False)
1287
+ download = gr.File(label="Generated Files", interactive=False)
1288
+ with gr.Tab("## Wiki"):
1289
+ gr.Markdown(
1290
  """
1291
  - **[Generate (button)]:**
1292
  Generates the music with the given settings and prompts.