Spaces:

aztro
/

yebama-voice-demo

Sleeping

App Files Files Community

aztro committed 11 days ago

Commit

6bbd5b5

1 Parent(s): a4f9390

Initial commit with RVC demo

Browse files

Files changed (9) hide show

.gitattributes +1 -0
added_IVF403_Flat_nprobe_1_yebama_v2.index +3 -0
app.py +43 -0
config.json +63 -0
requirements.txt +5 -0
response_1694593941525.json +38 -0
response_1694594214307.json +36 -0
yebama.zip +3 -0
yebama_e200_s3200.pth +3 -0

.gitattributes CHANGED Viewed

@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text

 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+added_IVF403_Flat_nprobe_1_yebama_v2.index filter=lfs diff=lfs merge=lfs -text

added_IVF403_Flat_nprobe_1_yebama_v2.index ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e0fb2e3b992e0d836b5e4976b660268ecd6bfb738f0f4fae239614d0264e805c
+size 49714419

app.py ADDED Viewed

	@@ -0,0 +1,43 @@

+import gradio as gr
+import torch
+import librosa
+import numpy as np
+from huggingface_hub import hf_hub_download
+import zipfile
+import os
+# Download the model files from the "gitgato/yebama" Hugging Face repo (described by the author as their other account)
+def load_model():  # NOTE(review): no active return statement, so this returns None; it is not called anywhere in this file
+    # Download the model files (adjust the filenames to match your repository; NOTE(review): this commit adds the index as "added_IVF403_..." - confirm the name used in gitgato/yebama)
+    model_path = hf_hub_download(repo_id="gitgato/yebama", filename="yebama_e200_s3200.pth")
+    index_path = hf_hub_download(repo_id="gitgato/yebama", filename="IVF403_Flat_nprobe_1_yebama_v2.index")
+    config_path = hf_hub_download(repo_id="gitgato/yebama", filename="config.json")
+    # The code that loads the RVC model would go here (depends on your implementation)
+    # Simplified example:
+    # from rvc_inference import load_rvc_model
+    # model = load_rvc_model(model_path, config_path, index_path)
+    # return model
+def process_audio(audio_file):  # Gradio callback: receives the uploaded audio's file path, returns (sample_rate, samples)
+    # Load the audio with librosa, requesting a 44100 Hz sample rate
+    audio, sr = librosa.load(audio_file, sr=44100)
+    # The RVC inference logic would go here
+    # processed_audio = model.infer(audio)
+    # Simulating a result (replace with your real model)
+    processed_audio = audio  # Placeholder: the loaded audio is passed through unchanged
+    return sr, processed_audio
+# Gradio interface: file-path audio input -> process_audio -> audio output
+iface = gr.Interface(
+    fn=process_audio,
+    inputs=gr.Audio(type="filepath", label="Sube tu audio"),
+    outputs=gr.Audio(label="Audio convertido"),
+    title="Demo de Yebama RVC",
+    description="Convierte tu voz con el modelo Yebama RVC."
+)
+iface.launch()  # called at module level (no __main__ guard)

config.json ADDED Viewed

	@@ -0,0 +1,63 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "<s>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "1": {
+      "content": "<pad>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "2": {
+      "content": "</s>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "3": {
+      "content": "<unk>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "79": {
+      "content": "<mask>",
+      "lstrip": true,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "80": {
+      "content": "<ctc_blank>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    }
+  },
+  "bos_token": "<s>",
+  "clean_up_tokenization_spaces": true,
+  "eos_token": "</s>",
+  "mask_token": "<mask>",
+  "model_max_length": 600,
+  "normalize": false,
+  "pad_token": "<pad>",
+  "processor_class": "SpeechT5Processor",
+  "sp_model_kwargs": {},
+  "tokenizer_class": "SpeechT5Tokenizer",
+  "unk_token": "<unk>"
+}

requirements.txt ADDED Viewed

	@@ -0,0 +1,5 @@

+gradio>=3.0
+torch>=1.10
+librosa>=0.9.0
+huggingface_hub
+numpy

response_1694593941525.json ADDED Viewed

	@@ -0,0 +1,38 @@

+{
+  "stability": 0.85,
+  "similarity_boost": 0.89,
+  "style": 0.18,
+  "use_speaker_boost": true
+}
+access-control-allow-headers: *
+access-control-allow-methods: POST,OPTIONS,DELETE,GET
+access-control-allow-origin: *
+alt-svc: h3=":443"; ma=2592000,h3-29=":443"; ma=2592000  content-length: 80
+content-type: application/json
+date: Wed,13 Sep 2023 08:32:18 GMT
+server: uvicorn
+via: 1.1
+google  x-firefox-spdy: h2
+{
+  "stability": 0,
+  "similarity_boost": 0,
+  "style": 0,
+  "use_speaker_boost": true
+}
+{
+  "detail": [
+    {
+      "loc": [
+        "string",
+        0
+      ],
+      "msg": "string",
+      "type": "string"
+    }
+  ]
+}

response_1694594214307.json ADDED Viewed

	@@ -0,0 +1,36 @@

+{
+  "stability": 0.93,
+  "similarity_boost": 0.96,
+  "style": 0.23,
+  "use_speaker_boost": true
+}
+access-control-allow-headers: *
+access-control-allow-methods: POST,OPTIONS,DELETE,GET
+access-control-allow-origin: *
+alt-svc: h3=":443"; ma=2592000,h3-29=":443"; ma=2592000
+content-length: 80
+content-type: application/json
+date: Wed,13 Sep 2023 08:36:51
+GMT  server: uvicorn
+via: 1.1 google  x-firefox-spdy: h2
+{
+  "stability": 0,
+  "similarity_boost": 0,
+  "style": 0,
+  "use_speaker_boost": true
+}
+{
+  "detail": [
+    {
+      "loc": [
+        "string",
+        0
+      ],
+      "msg": "string",
+      "type": "string"
+    }
+  ]
+}

yebama.zip ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:bdba5e3d3acd56cb7ddf5d6e3d6f0867c36cef5c5cac63c4d45e2b28791e1426
+size 104943041

yebama_e200_s3200.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c280e247f5f3a05a2d0f2220248577215110ae0730d1ef7c290bff56e1a46d66
+size 55228322