Spaces:

ahk-d
/

VQ-VAE-Timbre-Transfer-Demo

Running

App Files Files Community

ahk-d committed on Jul 13

Commit

5f48921

verified ·

1 Parent(s): a3f80ab

Update app.py

Browse files

Files changed (1) hide show

app.py +67 -7

app.py CHANGED Viewed

@@ -1,8 +1,57 @@
-"""## Gradio Interface for Custom Audio Upload"""
-import gradio as gr
-import requests
 import tempfile
 # Preset audio URLs
 INPUT_ROOT = 'https://adasp.telecom-paris.fr/rc-ext/demos_companion-pages/vqvae_examples/'
@@ -137,7 +186,7 @@ with gr.Blocks(title="VQ-VAE Timbre Transfer", theme=gr.themes.Soft()) as demo:
     Transfer the timbre (tone/texture) from one audio source to another while preserving the musical content.
-    **Content**: Musical notes/melody that will be preserved
     **Style**: Instrument timbre/texture that will be applied
     ### How It Works:
@@ -230,5 +279,16 @@ with gr.Blocks(title="VQ-VAE Timbre Transfer", theme=gr.themes.Soft()) as demo:
         outputs=[output_audio, status_msg]
     )
-# Launch
-demo.launch(share=True, debug=True, height=1400)

+import os
 import tempfile
+import requests
+import gradio as gr
+import torch
+import librosa
+import numpy as np
+import subprocess
+import sys
+def install_dependencies():
+    """Install required packages for deployment"""
+    try:
+        if not os.path.exists('ss-vq-vae'):
+            print("Cloning ss-vq-vae repository...")
+            subprocess.run(['git', 'clone', 'https://github.com/cifkao/ss-vq-vae.git'], check=True)
+        subprocess.run([sys.executable, '-m', 'pip', 'install', './ss-vq-vae/src'], check=True)
+        print("Dependencies installed successfully!")
+    except Exception as e:
+        print(f"Error installing dependencies: {e}")
+        raise
+# Install dependencies for deployment (runs at module load, ahead of the two imports that follow)
+try:
+    install_dependencies()
+    import confugue
+    from ss_vq_vae.models.vqvae_oneshot import Experiment
+except ImportError:  # only import failures are handled here; errors re-raised by install_dependencies() propagate
+    print("ss-vq-vae not found. Please install manually or run in Colab.")
+    sys.exit(1)  # non-zero exit status: give up instead of continuing without the imports
+def download_model():
+    """Download model files if they don't exist"""
+    model_dir = 'ss-vq-vae/experiments/model'
+    os.makedirs(model_dir, exist_ok=True)
+    model_path = os.path.join(model_dir, 'model_state.pt')
+    if not os.path.exists(model_path):
+        print("Downloading model...")
+        url = 'https://adasp.telecom-paris.fr/rc-ext/demos_companion-pages/vqvae_examples/ssvqvae_model_state.pt'
+        response = requests.get(url)
+        with open(model_path, 'wb') as f:
+            f.write(response.content)
+        print("Model downloaded successfully!")
+# Initialize model (module-level code: executed once when this file is loaded)
+download_model()  # make sure model_state.pt is on disk before it is loaded below
+logdir = 'ss-vq-vae/experiments/model'  # same directory download_model() writes into
+cfg = confugue.Configuration.from_yaml_file(os.path.join(logdir, 'config.yaml'))  # config.yaml is not fetched by download_model(); presumably shipped with the cloned repo — TODO confirm
+exp = cfg.configure(Experiment, logdir=logdir, device='cpu')  # device is fixed to CPU here
+exp.model.load_state_dict(torch.load(os.path.join(logdir, 'model_state.pt'), map_location=exp.device))  # NOTE(review): torch.load unpickles the file; consider weights_only=True if the installed torch supports it
+exp.model.train(False)  # turn training mode off before serving requests
 # Preset audio URLs
 INPUT_ROOT = 'https://adasp.telecom-paris.fr/rc-ext/demos_companion-pages/vqvae_examples/'
     Transfer the timbre (tone/texture) from one audio source to another while preserving the musical content.
+    **Content**: Musical notes/melody that will be preserved
     **Style**: Instrument timbre/texture that will be applied
     ### How It Works:
         outputs=[output_audio, status_msg]
     )
+    gr.Markdown("""
+    ### 🔧 Troubleshooting
+    - **Poor transfer quality?** Try different instrument combinations or adjust max duration
+    - **Audio doesn't load?** Check internet connection or try different presets
+    - **Processing slow?** Reduce max duration or try shorter audio clips
+    ### 📖 Citation
+    Original work by Ondřej Cífka (InterDigital R&D and Télécom Paris, 2020).
+    Demo by Ali Dulaimi.
+    """)
+if __name__ == "__main__":  # start the UI only when run as a script, not when imported
+    demo.launch(share=True, debug=True, height=1400)