Spaces:
Running
Running
Commit
·
dd6a80b
1
Parent(s):
cbfcc94
update sherpa-onnx to use piper-phonemize
Browse files
- app.py +13 -0
- model.py +2 -7
- requirements.txt +1 -1
app.py
CHANGED
|
@@ -25,6 +25,7 @@ import uuid
|
|
| 25 |
|
| 26 |
import gradio as gr
|
| 27 |
import soundfile as sf
|
|
|
|
| 28 |
|
| 29 |
from model import get_pretrained_model, language_to_models
|
| 30 |
|
|
@@ -185,7 +186,19 @@ with demo:
|
|
| 185 |
|
| 186 |
gr.Markdown(description)
|
| 187 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 188 |
if __name__ == "__main__":
|
|
|
|
| 189 |
formatter = "%(asctime)s %(levelname)s [%(filename)s:%(lineno)d] %(message)s"
|
| 190 |
|
| 191 |
logging.basicConfig(format=formatter, level=logging.INFO)
|
|
|
|
| 25 |
|
| 26 |
import gradio as gr
|
| 27 |
import soundfile as sf
|
| 28 |
+
import system
|
| 29 |
|
| 30 |
from model import get_pretrained_model, language_to_models
|
| 31 |
|
|
|
|
| 186 |
|
| 187 |
gr.Markdown(description)
|
| 188 |
|
| 189 |
+
|
| 190 |
+
def download_espeak_ng_data():
    """Download and unpack the espeak-ng data archive into /tmp.

    Runs a small shell script that changes into /tmp, fetches
    espeak-ng-data.tar.bz2 from the sherpa-onnx "tts-models" release page
    with wget, and extracts it with tar.

    The exit status of the shell script is not inspected, so a failed
    download is not reported to the caller.
    """
    # Imported locally so the function does not depend on a module-level
    # ``import os`` being present.
    import os

    # Fixed typo: the original called ``os.sytem``, which does not exist and
    # raised AttributeError before any command could run.
    os.system(
        """
    cd /tmp
    wget https://github.com/k2-fsa/sherpa-onnx/releases/download/tts-models/espeak-ng-data.tar.bz2
    tar xf espeak-ng-data.tar.bz2
    """
    )
|
| 198 |
+
|
| 199 |
+
|
| 200 |
if __name__ == "__main__":
|
| 201 |
+
download_espeak_ng_data()
|
| 202 |
formatter = "%(asctime)s %(levelname)s [%(filename)s:%(lineno)d] %(message)s"
|
| 203 |
|
| 204 |
logging.basicConfig(format=formatter, level=logging.INFO)
|
model.py
CHANGED
|
@@ -124,12 +124,6 @@ def _get_vits_piper(repo_id: str, speed: float) -> sherpa_onnx.OfflineTts:
|
|
| 124 |
subfolder=".",
|
| 125 |
)
|
| 126 |
|
| 127 |
-
lexicon = get_file(
|
| 128 |
-
repo_id=repo_id,
|
| 129 |
-
filename="lexicon.txt",
|
| 130 |
-
subfolder=".",
|
| 131 |
-
)
|
| 132 |
-
|
| 133 |
tokens = get_file(
|
| 134 |
repo_id=repo_id,
|
| 135 |
filename="tokens.txt",
|
|
@@ -140,7 +134,8 @@ def _get_vits_piper(repo_id: str, speed: float) -> sherpa_onnx.OfflineTts:
|
|
| 140 |
model=sherpa_onnx.OfflineTtsModelConfig(
|
| 141 |
vits=sherpa_onnx.OfflineTtsVitsModelConfig(
|
| 142 |
model=model,
|
| 143 |
-
lexicon=
|
|
|
|
| 144 |
tokens=tokens,
|
| 145 |
length_scale=1.0 / speed,
|
| 146 |
),
|
|
|
|
| 124 |
subfolder=".",
|
| 125 |
)
|
| 126 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 127 |
tokens = get_file(
|
| 128 |
repo_id=repo_id,
|
| 129 |
filename="tokens.txt",
|
|
|
|
| 134 |
model=sherpa_onnx.OfflineTtsModelConfig(
|
| 135 |
vits=sherpa_onnx.OfflineTtsVitsModelConfig(
|
| 136 |
model=model,
|
| 137 |
+
lexicon="",
|
| 138 |
+
data_dir="/tmp/espeak-ng-data",
|
| 139 |
tokens=tokens,
|
| 140 |
length_scale=1.0 / speed,
|
| 141 |
),
|
requirements.txt
CHANGED
|
@@ -1,4 +1,4 @@
|
|
| 1 |
-
https://huggingface.co/csukuangfj/wheels/resolve/main/sherpa_onnx-1.8.
|
| 2 |
#sherpa-onnx
|
| 3 |
|
| 4 |
soundfile
|
|
|
|
| 1 |
+
https://huggingface.co/csukuangfj/wheels/resolve/main/sherpa_onnx-1.8.11-cp38-cp38-linux_x86_64.whl
|
| 2 |
#sherpa-onnx
|
| 3 |
|
| 4 |
soundfile
|