Spaces:

Agents-MCP-Hackathon
/

MedCodeMCP

Running

App Files Community

gpaasch committed on Jun 8

Commit

4b8e08c

1 Parent(s): 9ae574b

solved ffmpeg-related error

Browse files

Files changed (2) hide show

requirements.txt +3 -1
src/app.py +1 -15

requirements.txt CHANGED Viewed

@@ -12,8 +12,10 @@ llama-index-llms-llama-cpp
 sentence-transformers>=2.2.0
 # Audio processing
-ffmpeg-python
 librosa>=0.10.1
 # System utilities
 psutil

 sentence-transformers>=2.2.0
 # Audio processing
+ffmpeg-python>=0.2.0
+pydub>=0.25.1
 librosa>=0.10.1
+soundfile>=0.12.1
 # System utilities
 psutil

src/app.py CHANGED Viewed

@@ -264,7 +264,7 @@ def process_speech(audio_data, history):
                 sample_rate = 16000
             # Transcribe with error handling
-            try:
                 # Format dictionary correctly with required keys
                 input_features = {
                     "raw": audio_array,
@@ -304,9 +304,6 @@ def process_speech(audio_data, history):
                     })}
                 ]
-            except Exception as e:
-                print(f"Transcription error: {str(e)}")
-                return []
         else:
             print(f"Invalid audio format: {type(audio_data)}")
             return []
@@ -530,7 +527,6 @@ with gr.Blocks(
         if not audio or not isinstance(audio, tuple):
             return ""
-        try:
             sample_rate, audio_array = audio
             features = process_audio(audio_array, sample_rate)
@@ -543,10 +539,6 @@ with gr.Blocks(
             elif isinstance(result, str):
                 return result.strip()
             return ""
-        except Exception as e:
-            print(f"Transcription error: {str(e)}")
-            return ""
     microphone.stream(
         fn=update_live_transcription,
@@ -574,7 +566,6 @@ with gr.Blocks(
         if not text:
             return history
-        try:
             # Limit input length
             if len(text) > 500:
                 text = text[:500] + "..."
@@ -600,11 +591,6 @@ with gr.Blocks(
                 })}
             ]
-        except Exception as e:
-            print(f"Text processing error: {str(e)}")
-            cleanup_memory()
-            return history
     submit_btn.click(
         fn=process_text_input,
         inputs=[text_input, chatbot],

                 sample_rate = 16000
             # Transcribe with error handling
                 # Format dictionary correctly with required keys
                 input_features = {
                     "raw": audio_array,
                     })}
                 ]
         else:
             print(f"Invalid audio format: {type(audio_data)}")
             return []
         if not audio or not isinstance(audio, tuple):
             return ""
             sample_rate, audio_array = audio
             features = process_audio(audio_array, sample_rate)
             elif isinstance(result, str):
                 return result.strip()
             return ""
     microphone.stream(
         fn=update_live_transcription,
         if not text:
             return history
             # Limit input length
             if len(text) > 500:
                 text = text[:500] + "..."
                 })}
             ]
     submit_btn.click(
         fn=process_text_input,
         inputs=[text_input, chatbot],