Spaces:

mguven61
/

VoiceAI61

Running

App Files Community

mguven61 committed 14 days ago

Commit

4d86f0d

verified ·

1 Parent(s): 313da01

Update app.py

Browse files

Files changed (1) hide show

app.py +30 -20

app.py CHANGED Viewed

@@ -7,14 +7,9 @@ import os
 import warnings
 warnings.filterwarnings("ignore")
-# Load model once
 model = whisper.load_model("base")
 def translate_audio(text_input, upload_audio, mic_audio, source_lang="tr", target_lang="en"):
-    """
-    Function that handles both uploaded audio and microphone audio
-    """
-    # Determine which audio source to use
     audio_file = None
     audio_source = ""
@@ -26,13 +21,34 @@ def translate_audio(text_input, upload_audio, mic_audio, source_lang="tr", targe
         audio_file = upload_audio
         audio_source = "📁 Upload"
         print(f"Using uploaded audio: {upload_audio}")
     else:
-        return None, "❌ No audio input provided", "Please upload an audio file OR record with microphone", ""
     try:
         print(f"Processing {audio_source} audio: {audio_file}")
-        # Transcribe audio
         result = model.transcribe(audio_file, language=source_lang, fp16=False)
         original_text = result["text"].strip()
@@ -41,7 +57,6 @@ def translate_audio(text_input, upload_audio, mic_audio, source_lang="tr", targe
         print(f"Transcribed: {original_text}")
-        # Translate text
         if source_lang != target_lang:
             translator = GoogleTranslator(source=source_lang, target=target_lang)
             translated_text = translator.translate(original_text)
@@ -50,10 +65,8 @@ def translate_audio(text_input, upload_audio, mic_audio, source_lang="tr", targe
         print(f"Translated: {translated_text}")
-        # Generate speech
         tts = gTTS(text=translated_text, lang=target_lang, slow=False)
-        # Save to temporary file
         with tempfile.NamedTemporaryFile(delete=False, suffix='.mp3') as tmp_file:
             tts.save(tmp_file.name)
             return (
@@ -67,7 +80,6 @@ def translate_audio(text_input, upload_audio, mic_audio, source_lang="tr", targe
         print(f"Error: {str(e)}")
         return None, f"❌ Error: {str(e)}", "Please try again", f"Source: {audio_source}"
-# Language options
 languages = {
     "tr": "🇹🇷 Turkish",
     "en": "🇺🇸 English",
@@ -81,7 +93,6 @@ languages = {
     "zh": "🇨🇳 Chinese"
 }
-# Create Gradio interface exactly like the Clone-Your-Voice example
 demo = gr.Interface(
     fn=translate_audio,
     inputs=[
@@ -92,14 +103,13 @@ demo = gr.Interface(
         ),
         gr.Audio(
             type="filepath",
-            source="upload",
             label="📁 Upload Audio File (MP3, WAV, etc.)"
         ),
         gr.Audio(
-            source="microphone",
             label="🎤 OR Record with Microphone",
-            type="filepath",
-            optional=True
         ),
         gr.Dropdown(
             choices=list(languages.keys()),
@@ -126,6 +136,7 @@ demo = gr.Interface(
         <h3>🎯 How to Use:</h3>
         <p><strong>Option 1:</strong> 📁 Upload an audio file (recommended)</p>
         <p><strong>Option 2:</strong> 🎤 Record directly with microphone</p>
         <p><strong>Then:</strong> Select source and target languages, wait for processing!</p>
         <br>
         <p>🔧 <strong>Troubleshooting:</strong> If microphone doesn't work, use file upload instead.</p>
@@ -134,12 +145,11 @@ demo = gr.Interface(
     """,
     examples=[
-        ["", None, None, "tr", "en"],  # Example with Turkish to English
-        ["", None, None, "en", "fr"],  # Example with English to French
-        ["Hello world", None, None, "en", "es"],  # Example with text input
     ],
-    # Important: Set these flags
     allow_flagging="never",
     show_error=True
 )

 import warnings
 warnings.filterwarnings("ignore")
 model = whisper.load_model("base")
 def translate_audio(text_input, upload_audio, mic_audio, source_lang="tr", target_lang="en"):
     audio_file = None
     audio_source = ""
         audio_file = upload_audio
         audio_source = "📁 Upload"
         print(f"Using uploaded audio: {upload_audio}")
+    elif text_input and text_input.strip():
+        try:
+            original_text = text_input.strip()
+            if source_lang != target_lang:
+                translator = GoogleTranslator(source=source_lang, target=target_lang)
+                translated_text = translator.translate(original_text)
+            else:
+                translated_text = original_text
+            tts = gTTS(text=translated_text, lang=target_lang, slow=False)
+            with tempfile.NamedTemporaryFile(delete=False, suffix='.mp3') as tmp_file:
+                tts.save(tmp_file.name)
+                return (
+                    tmp_file.name,
+                    f"✅ Original: {original_text}",
+                    f"🌍 Translated: {translated_text}",
+                    f"📡 Source: 💬 Text Input"
+                )
+        except Exception as e:
+            return None, f"❌ Error: {str(e)}", "Please try again", "Source: 💬 Text Input"
     else:
+        return None, "❌ No input provided", "Please upload audio, record with microphone, OR enter text", ""
     try:
         print(f"Processing {audio_source} audio: {audio_file}")
         result = model.transcribe(audio_file, language=source_lang, fp16=False)
         original_text = result["text"].strip()
         print(f"Transcribed: {original_text}")
         if source_lang != target_lang:
             translator = GoogleTranslator(source=source_lang, target=target_lang)
             translated_text = translator.translate(original_text)
         print(f"Translated: {translated_text}")
         tts = gTTS(text=translated_text, lang=target_lang, slow=False)
         with tempfile.NamedTemporaryFile(delete=False, suffix='.mp3') as tmp_file:
             tts.save(tmp_file.name)
             return (
         print(f"Error: {str(e)}")
         return None, f"❌ Error: {str(e)}", "Please try again", f"Source: {audio_source}"
 languages = {
     "tr": "🇹🇷 Turkish",
     "en": "🇺🇸 English",
     "zh": "🇨🇳 Chinese"
 }
 demo = gr.Interface(
     fn=translate_audio,
     inputs=[
         ),
         gr.Audio(
             type="filepath",
+            sources=["upload"],
             label="📁 Upload Audio File (MP3, WAV, etc.)"
         ),
         gr.Audio(
+            sources=["microphone"],
             label="🎤 OR Record with Microphone",
+            type="filepath"
         ),
         gr.Dropdown(
             choices=list(languages.keys()),
         <h3>🎯 How to Use:</h3>
         <p><strong>Option 1:</strong> 📁 Upload an audio file (recommended)</p>
         <p><strong>Option 2:</strong> 🎤 Record directly with microphone</p>
+        <p><strong>Option 3:</strong> 💬 Type text directly</p>
         <p><strong>Then:</strong> Select source and target languages, wait for processing!</p>
         <br>
         <p>🔧 <strong>Troubleshooting:</strong> If microphone doesn't work, use file upload instead.</p>
     """,
     examples=[
+        ["", None, None, "tr", "en"],
+        ["", None, None, "en", "fr"],
+        ["Hello world", None, None, "en", "es"],
     ],
     allow_flagging="never",
     show_error=True
 )