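# Source: "Create app.py" by SoSa123456 (commit c080f5c, 1.76 kB).
# This header replaces file-viewer residue (avatar caption, "raw" and
# "history blame" links) that was captured together with the code.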
import os
import tempfile

from flask import Flask, render_template, render_template_string, request
from speechbrain.pretrained import WhisperASR
# Flask application object; the route decorators below register on it.
app = Flask(__name__)
# Load the ASR model once, at import time, so requests reuse the same instance.
# `source` names the pretrained model to fetch and `savedir` is the local
# directory passed for storing it.
# NOTE(review): the "-fa" suffix suggests a Persian CommonVoice model - confirm.
asr_model = WhisperASR.from_hparams(
source="speechbrain/asr-whisper-large-v2-commonvoice-fa",
savedir="pretrained_models/asr-whisper-large-v2-commonvoice-fa"
)
# Jinja2 template for the single page of the app: an upload form that posts
# to /transcribe, followed by an optional error message and an optional
# transcription result. It is meant to be rendered with the optional context
# variables `error` and `transcription`.
# The file input carries id="audio_file" so that the <label for="audio_file">
# is actually associated with it (`for` matches an element id, not a name).
html_template = """
<!DOCTYPE html>
<html lang="en">
<head>
<meta charset="UTF-8">
<meta name="viewport" content="width=device-width, initial-scale=1.0">
<title>Speech Transcription</title>
</head>
<body>
<h1>Speech Transcription</h1>
<form action="/transcribe" method="post" enctype="multipart/form-data">
<label for="audio_file">Select an audio file:</label>
<input type="file" id="audio_file" name="audio_file" accept=".wav, .mp3">
<button type="submit">Transcribe</button>
</form>
{% if error %}
<p style="color: red;">{{ error }}</p>
{% endif %}
{% if transcription %}
<h2>Transcription Result:</h2>
<p>{{ transcription }}</p>
{% endif %}
</body>
</html>
"""
@app.route('/')
def index():
    """Serve the upload form.

    The page is rendered through Jinja with no context variables, so the
    conditional error/transcription sections are omitted. Returning the
    template string unrendered would send the ``{% ... %}`` and ``{{ ... }}``
    tags to the browser as literal text.

    Returns:
        The rendered HTML page as a string.
    """
    return render_template_string(html_template)
@app.route('/transcribe', methods=['POST'])
def transcribe():
    """Transcribe an uploaded audio file and render the result page.

    Expects a multipart form upload in the ``audio_file`` field. The upload is
    written to a temporary file because ``asr_model.transcribe_file`` takes a
    file path rather than an in-memory upload object; the temporary file is
    removed once transcription finishes or fails.

    Returns:
        The rendered HTML page, containing either the transcription or an
        error message ('No file part', 'No selected file', or the text of the
        exception raised during transcription).
    """
    audio_file = request.files.get('audio_file')
    if audio_file is None:
        return render_template_string(html_template, error='No file part')
    # Browsers submit an empty filename when the form is sent with no file chosen.
    if not audio_file.filename:
        return render_template_string(html_template, error='No selected file')

    # Keep the original extension so the audio loader can infer the format.
    suffix = os.path.splitext(audio_file.filename)[1]
    fd, tmp_path = tempfile.mkstemp(suffix=suffix)
    # Only the path is needed; close the descriptor so the file can be reopened.
    os.close(fd)
    try:
        audio_file.save(tmp_path)
        transcription = asr_model.transcribe_file(tmp_path)
    except Exception as e:
        # Request boundary: log the traceback and show the message to the user
        # instead of letting the request fail with a 500.
        app.logger.exception('Transcription failed')
        return render_template_string(html_template, error=f'Error during transcription: {str(e)}')
    finally:
        os.remove(tmp_path)
    return render_template_string(html_template, transcription=transcription)
# Script entry point: start Flask's built-in development server when this
# file is executed directly (not when it is imported).
# NOTE(review): debug=True enables the interactive debugger and reloader;
# this is intended for local development only.
if __name__ == "__main__":
    app.run(debug=True)