# Emmanuel08's picture
# Update app.py
# 4c9dfad verified
# raw
# history blame
# 627 Bytes
import gradio as gr
from transformers import AutoProcessor, AutoModelForCTC
import torch
import soundfile as sf
import nemo.collections.asr as nemo_asr
import gradio as gr
# Load the pretrained ASR checkpoint once at import time; the module-level
# `model` is what the transcription callback uses.
_PRETRAINED_MODEL_NAME = "nvidia/stt_en_fastconformer_hybrid_large_pc"
model = nemo_asr.models.ASRModel.from_pretrained(_PRETRAINED_MODEL_NAME)
# Function to transcribe audio
def transcribe_audio(audio_file):
    """Transcribe one audio file with the module-level ASR ``model``.

    Args:
        audio_file: Path of the audio file to transcribe. May be ``None``
            or empty when nothing was recorded or uploaded.

    Returns:
        The transcription text as a ``str``. An empty string is returned
        when no audio was supplied or the model produced no result.
    """
    # Nothing was submitted: skip the model call instead of handing it None.
    if not audio_file:
        return ""

    result = model.transcribe([audio_file])

    # NOTE(review): some NeMo releases appear to return a
    # (best_hypotheses, all_hypotheses) tuple for hybrid/transducer models;
    # unwrap it so we index into the list of best hypotheses. Confirm against
    # the installed NeMo version.
    if isinstance(result, tuple) and result and isinstance(result[0], (list, tuple)):
        result = result[0]

    if not result:
        return ""

    first = result[0]
    # NOTE(review): newer NeMo releases may return Hypothesis-like objects
    # that carry the transcript in a `.text` attribute; plain strings pass
    # through unchanged.
    text = getattr(first, "text", first)
    return text if isinstance(text, str) else str(text)
# Build the web UI: one audio input delivered to the callback as a file path,
# one plain-text output showing the transcription.
audio_input = gr.Audio(type="filepath")
iface = gr.Interface(
    fn=transcribe_audio,
    inputs=audio_input,
    outputs="text",
    title="Real-Time Transcription with FastConformer",
)

# Start serving the interface.
iface.launch()