Spaces:

ZennyKenny
/

AudioTranscribe

Running on CPU Upgrade

App Files Files Community

ZennyKenny committed 1 day ago

Commit

e4afaf8

verified ·

1 Parent(s): 55aeb9b

remove ad hoc record support

Browse files

Files changed (1) hide show

app.py +13 -38

app.py CHANGED Viewed

@@ -7,9 +7,9 @@ import os
 import uuid
 import spaces  # Ensure spaces is imported
-# Directory to save recorded audio files
 OUTPUT_DIR = os.getenv("HF_HOME", ".")  # Use dynamic path or default to current directory
-OUTPUT_DIR = os.path.join(OUTPUT_DIR, "recorded_audio_files")
 os.makedirs(OUTPUT_DIR, exist_ok=True)
 def split_audio(audio_data, sr, chunk_duration=30):
@@ -70,49 +70,30 @@ def main():
     def process_audio(audio_input):
         try:
-            # Debug input type and content
-            print(f"Input type: {type(audio_input)}, Input: {audio_input}")
-            if audio_input is None:
-                raise ValueError("No audio input received. Please record or upload an audio file.")
-            if isinstance(audio_input, tuple):  # Recorded audio
-                print("Handling recorded audio.")
-                audio_data, sr = audio_input
-                filename = f"recorded_audio_{uuid.uuid4().hex}.wav"
-                temp_path = os.path.join(OUTPUT_DIR, filename)
-                sf.write(temp_path, audio_data, sr)
-            elif isinstance(audio_input, str):  # Uploaded file path
-                print("Handling uploaded audio.")
-                if os.path.isdir(audio_input):
-                    raise ValueError("Input is a directory, not a file.")
-                temp_path = audio_input
-            else:
-                raise ValueError("Unsupported audio input format.")
-            # Transcribe the saved audio file
-            transcription = transcribe_long_audio(temp_path, transcriber, chunk_duration=30)
             summary = summarizer(transcription, max_length=50, min_length=10, do_sample=False)[0]["summary_text"]
             # Cleanup old files
             cleanup_output_dir()
-            return transcription, summary, temp_path
         except Exception as e:
             print(f"Error in process_audio: {e}")
             return f"Error processing audio: {e}", "", ""
-    def stop_microphone():
-        """Simulate stopping the microphone."""
-        print("Microphone stopped.")
-        return "Microphone stopped. Recording session has ended."
     with gr.Blocks() as interface:
         with gr.Row():
             with gr.Column():
-                # Enable recording or file upload
-                audio_input = gr.Audio(type="numpy", label="Record or Upload Audio")
                 process_button = gr.Button("Process Audio")
-                stop_button = gr.Button("Stop Recording")
             with gr.Column():
                 transcription_output = gr.Textbox(label="Full Transcription", lines=10)
                 summary_output = gr.Textbox(label="Summary", lines=5)
@@ -124,12 +105,6 @@ def main():
             outputs=[transcription_output, summary_output, audio_output]
         )
-        stop_button.click(
-            stop_microphone,
-            inputs=[],
-            outputs=[]
-        )
     interface.launch(share=False)
 if __name__ == "__main__":

 import uuid
 import spaces  # Ensure spaces is imported
+# Directory to save processed audio files
 OUTPUT_DIR = os.getenv("HF_HOME", ".")  # Use dynamic path or default to current directory
+OUTPUT_DIR = os.path.join(OUTPUT_DIR, "processed_audio_files")
 os.makedirs(OUTPUT_DIR, exist_ok=True)
 def split_audio(audio_data, sr, chunk_duration=30):
     def process_audio(audio_input):
         try:
+            print(f"Processing uploaded audio: {audio_input}")
+            if not isinstance(audio_input, str):
+                raise ValueError("Invalid input type. Please upload a valid audio file.")
+            if os.path.isdir(audio_input):
+                raise ValueError("Input is a directory, not a file.")
+            # Transcribe the uploaded audio file
+            transcription = transcribe_long_audio(audio_input, transcriber, chunk_duration=30)
             summary = summarizer(transcription, max_length=50, min_length=10, do_sample=False)[0]["summary_text"]
             # Cleanup old files
             cleanup_output_dir()
+            return transcription, summary, audio_input
         except Exception as e:
             print(f"Error in process_audio: {e}")
             return f"Error processing audio: {e}", "", ""
     with gr.Blocks() as interface:
         with gr.Row():
             with gr.Column():
+                # Only support file uploads
+                audio_input = gr.Audio(type="filepath", label="Upload Audio File")
                 process_button = gr.Button("Process Audio")
             with gr.Column():
                 transcription_output = gr.Textbox(label="Full Transcription", lines=10)
                 summary_output = gr.Textbox(label="Summary", lines=5)
             outputs=[transcription_output, summary_output, audio_output]
         )
     interface.launch(share=False)
 if __name__ == "__main__":