File size: 627 Bytes
32f1cf7
 
 
 
4c9dfad
 
 
 
32f1cf7
 
 
4c9dfad
 
32f1cf7
4c9dfad
32f1cf7
 
 
 
4c9dfad
32f1cf7
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
import gradio as gr
from transformers import AutoProcessor, AutoModelForCTC
import torch
import soundfile as sf
import nemo.collections.asr as nemo_asr
import gradio as gr
# Load the pretrained FastConformer hybrid checkpoint by name. This runs once
# at import time so every request reuses the same model instance.
_PRETRAINED_MODEL_NAME = "nvidia/stt_en_fastconformer_hybrid_large_pc"
model = nemo_asr.models.ASRModel.from_pretrained(_PRETRAINED_MODEL_NAME)

# Function to transcribe audio
def transcribe_audio(audio_file):
    """Transcribe one audio file and return the recognized text.

    Args:
        audio_file: Path to the audio file, as supplied by the Gradio audio
            input configured with ``type="filepath"``. May be ``None`` or
            empty when the user submits without providing any audio.

    Returns:
        The transcript as a plain string, or ``""`` when there is no input
        or the model produced no result.
    """
    # Nothing was recorded/uploaded: return early instead of handing an
    # invalid path to the model.
    if not audio_file:
        return ""

    result = model.transcribe([audio_file])

    # NOTE(review): the return shape of `transcribe` differs across NeMo
    # releases -- confirm against the installed version. Some releases return
    # a (best_hypotheses, all_hypotheses) tuple for transducer/hybrid models;
    # in that case keep only the best hypotheses.
    if isinstance(result, tuple):
        result = result[0]
    if not result:
        return ""

    first = result[0]
    # Newer releases yield Hypothesis-like objects carrying the transcript on
    # `.text`; older ones yield plain strings.
    text = getattr(first, "text", first)
    return text if isinstance(text, str) else str(text)

# Web UI: a single audio input (delivered to the callback as a file path)
# wired to `transcribe_audio`, with the result rendered as text.
iface = gr.Interface(
    title="Real-Time Transcription with FastConformer",
    fn=transcribe_audio,
    inputs=gr.Audio(type="filepath"),
    outputs="text",
)

# Start serving the interface as soon as the script is executed.
iface.launch()