"""Gradio demo that transcribes recorded or uploaded audio with Whisper."""

import gradio as gr
from transformers import pipeline
import librosa

# Initialize the ASR model once at import time so every request reuses it.
# chunk_length_s=30 lets the pipeline split clips longer than Whisper's
# 30-second window into chunks instead of transcribing only the first window.
asr_model = pipeline(
    "automatic-speech-recognition",
    model="openai/whisper-small",
    chunk_length_s=30,
)

# Sampling rate the model's feature extractor expects (16 kHz for Whisper).
TARGET_SAMPLE_RATE = asr_model.feature_extractor.sampling_rate


def transcribe(file_path):
    """Transcribe the audio file at *file_path* and return the text.

    Args:
        file_path: Path to an audio file as supplied by the Gradio audio
            component, or ``None`` when the user submitted nothing.

    Returns:
        The transcription text, or an empty string when no audio was given.
    """
    # Gradio passes None when the form is submitted without audio.
    if not file_path:
        return ""

    # Resample while loading: a bare array handed to the pipeline is assumed
    # to already be at the model's sampling rate, so keeping the file's
    # native rate (sr=None) would distort the input for non-16 kHz audio.
    data, samplerate = librosa.load(file_path, sr=TARGET_SAMPLE_RATE)

    # Pass the sampling rate explicitly so the pipeline can verify it.
    transcription = asr_model({"raw": data, "sampling_rate": samplerate})
    return transcription["text"]


# Create the Gradio interface
iface = gr.Interface(
    fn=transcribe,
    inputs=gr.Audio(type="filepath", label="Record or Upload Audio"),
    outputs="text",
)

# Launch the interface
iface.launch()