anyantudre committed on
Commit
cb6b607
·
verified ·
1 Parent(s): f963ed2

Update src/speech_to_text.py

Browse files
Files changed (1) hide show
  1. src/speech_to_text.py +2 -0
src/speech_to_text.py CHANGED
@@ -32,6 +32,8 @@ def transcribe(fp:str, target_lang:str) -> str:
32
  processor = AutoProcessor.from_pretrained(model_id, target_lang=target_lang)
33
  model = Wav2Vec2ForCTC.from_pretrained(model_id, target_lang=target_lang, ignore_mismatched_sizes=True)
34
 
 
 
35
  # Process the audio
36
  signal, sampling_rate = librosa.load(fp, sr=16000)
37
  inputs = processor(signal, sampling_rate=16_000, return_tensors="pt")
 
32
  processor = AutoProcessor.from_pretrained(model_id, target_lang=target_lang)
33
  model = Wav2Vec2ForCTC.from_pretrained(model_id, target_lang=target_lang, ignore_mismatched_sizes=True)
34
 
35
+ processor.tokenizer.set_target_lang("mos")
36
+
37
  # Process the audio
38
  signal, sampling_rate = librosa.load(fp, sr=16000)
39
  inputs = processor(signal, sampling_rate=16_000, return_tensors="pt")