File size: 547 Bytes
9d3afd7
3a6c9ee
 
9d3afd7
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
from transformers import pipeline
import gradio as gr

# Build the Hugging Face pipeline once, at import time, so that every call to
# transcribe() reuses the same loaded model instead of reloading it.
# NOTE(review): no task is passed; presumably transformers infers automatic
# speech recognition from the model's Hub metadata -- confirm.
pipe = pipeline(model="MaximilianChen/Casper") 

def _as_pipeline_input(audio):
    """Convert a Gradio audio value into an input the ASR pipeline accepts.

    Gradio's ``type="numpy"`` audio arrives as a ``(sample_rate, samples)``
    tuple; that is repackaged as the ``{"sampling_rate", "raw"}`` dict form
    with mono float32 samples. Any other value (for example a file path) is
    returned untouched.
    """
    if not isinstance(audio, tuple):
        return audio

    sampling_rate, samples = audio
    if samples.ndim > 1:
        # Multi-channel recordings are (samples, channels); average to mono
        # because the pipeline only takes single-channel audio.
        samples = samples.mean(axis=1)
    samples = samples.astype("float32")

    # Peak-normalise integer PCM into [-1, 1]; skip empty or all-zero
    # (silent) clips to avoid dividing by zero.
    peak = float(abs(samples).max()) if samples.size else 0.0
    if peak > 0:
        samples = samples / peak

    return {"sampling_rate": sampling_rate, "raw": samples}


def transcribe(audio, mic_audio=None):
    """Transcribe speech from whichever audio input was provided.

    The interface wires two audio components to this callback, so Gradio
    calls it with two positional values. ``mic_audio`` defaults to ``None``
    so existing single-argument callers keep working.

    Args:
        audio: Value of the first (upload) input: a ``(sample_rate, samples)``
            tuple, any input the pipeline accepts directly, or ``None``.
        mic_audio: Value of the second (microphone) input, same formats.
            Only used when ``audio`` is ``None``.

    Returns:
        The recognised text, or an empty string when no audio was supplied.
    """
    chosen = audio if audio is not None else mic_audio
    if chosen is None:
        # Nothing uploaded or recorded: there is nothing to feed the model.
        return ""
    return pipe(_as_pipeline_input(chosen))["text"]

# Two audio widgets, one fed by file upload and one by the microphone; both
# are configured to deliver their value in numpy form.
_audio_inputs = [
    gr.Audio(label="Upload Speech", source="upload", type="numpy"),
    gr.Audio(label="Record Speech", source="microphone", type="numpy"),
]

_description = "Realtime demo for Catalan speech recognition using a fine-tuned Whisper small model."

# Wire the inputs to the transcription callback and show its result as text.
iface = gr.Interface(
    fn=transcribe,
    inputs=_audio_inputs,
    outputs="text",
    title="Casper",
    description=_description,
)

# Start serving the web UI.
iface.launch()