Spaces:
Sleeping
Sleeping
Update src/speech_to_text.py
Browse files
- src/speech_to_text.py +2 -0
src/speech_to_text.py
CHANGED
@@ -32,6 +32,8 @@ def transcribe(fp:str, target_lang:str) -> str:
     processor = AutoProcessor.from_pretrained(model_id, target_lang=target_lang)
     model = Wav2Vec2ForCTC.from_pretrained(model_id, target_lang=target_lang, ignore_mismatched_sizes=True)
 
+    processor.tokenizer.set_target_lang("mos")
+
     # Process the audio
     signal, sampling_rate = librosa.load(fp, sr=16000)
     inputs = processor(signal, sampling_rate=16_000, return_tensors="pt")