Spaces:

Shanuka01
/

ASR-wisper-large

Running

Shanuka01 committed on Nov 3, 2023

Commit

4b68c6d

1 Parent(s): 51cfd89

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -5,7 +5,9 @@ import whisper
 model = whisper.load_model("large")
 def transcribe(audio_file):
     audio = whisper.load_audio(audio_file.name)
     audio = whisper.pad_or_trim(audio)
     # Generate a mel spectrogram
     mel = whisper.log_mel_spectrogram(audio).to(model.device)
@@ -18,7 +20,7 @@ def transcribe(audio_file):
 # Create the Gradio interface
 iface = gr.Interface(
     fn=transcribe,
-    inputs=gr.inputs.Audio(source="upload", type="file", label="Upload your audio file"),
     outputs="text",
     title="Whisper ASR",
     description="Upload an audio file and it will be transcribed using OpenAI's Whisper model."
@@ -26,4 +28,4 @@ iface = gr.Interface(
 # Launch the app
 if __name__ == "__main__":
-    iface.launch()

 model = whisper.load_model("large")
 def transcribe(audio_file):
+    # Load audio file
     audio = whisper.load_audio(audio_file.name)
+    # Pad or trim audio to the expected length
     audio = whisper.pad_or_trim(audio)
     # Generate a mel spectrogram
     mel = whisper.log_mel_spectrogram(audio).to(model.device)
 # Create the Gradio interface
 iface = gr.Interface(
     fn=transcribe,
+    inputs=gr.Audio(source="upload", type="file", label="Upload your audio file"),
     outputs="text",
     title="Whisper ASR",
     description="Upload an audio file and it will be transcribed using OpenAI's Whisper model."
 # Launch the app
 if __name__ == "__main__":
+    iface.launch()