Spaces:

darshankr
/

tts

Sleeping

App Files Community

darshankr committed on Oct 23, 2024

Commit

d6dc2d5

verified ·

1 Parent(s): c6681f6

Update app.py

Browse files

Files changed (1) hide show

app.py +16 -6

app.py CHANGED Viewed

@@ -2,19 +2,25 @@ import gradio as gr
 import subprocess
 import os
-# Define paths to the TTS model and vocoder files
 MODEL_PATH = "models/v1/hi/fastpitch/best_model.pth"
 CONFIG_PATH = "models/v1/hi/fastpitch/config.json"
 VOCODER_PATH = "models/v1/hi/hifigan/best_model.pth"
 VOCODER_CONFIG_PATH = "models/v1/hi/hifigan/config.json"
 OUTPUT_FILE = "output.mp4"
 def generate_speech(text: str) -> str:
     """
-    Run the TTS synthesis command and generate speech as an MP4 file.
-    Returns the path to the output audio file.
     """
     try:
         # Construct the command for speech synthesis
         command = [
             "python3", "-m", "TTS.bin.synthesize",
@@ -26,7 +32,7 @@ def generate_speech(text: str) -> str:
             "--speaker_idx", "female",
             "--out_path", OUTPUT_FILE
         ]
         # Run the command
         result = subprocess.run(command, capture_output=True, text=True)
@@ -34,12 +40,16 @@ def generate_speech(text: str) -> str:
         if result.returncode != 0:
             raise Exception(f"Error: {result.stderr}")
-        # Return the path to the generated output file
-        return OUTPUT_FILE
     except Exception as e:
         return str(e)
 # Create the Gradio interface
 interface = gr.Interface(
     fn=generate_speech,

 import subprocess
 import os
+# Define paths to the TTS model and vocoder files (relative to the Indic-TTS folder)
 MODEL_PATH = "models/v1/hi/fastpitch/best_model.pth"
 CONFIG_PATH = "models/v1/hi/fastpitch/config.json"
 VOCODER_PATH = "models/v1/hi/hifigan/best_model.pth"
 VOCODER_CONFIG_PATH = "models/v1/hi/hifigan/config.json"
 OUTPUT_FILE = "output.mp4"
+INDIC_TTS_FOLDER = "Indic-TTS"  # Folder where the TTS system is located
 def generate_speech(text: str) -> str:
     """
+    Navigate to the Indic-TTS folder, run the TTS synthesis command, and return to the original directory.
+    Returns the path to the output audio file or an error message.
     """
+    original_dir = os.getcwd()  # Save the current working directory
     try:
+        # Change to the Indic-TTS directory
+        os.chdir(INDIC_TTS_FOLDER)
         # Construct the command for speech synthesis
         command = [
             "python3", "-m", "TTS.bin.synthesize",
             "--speaker_idx", "female",
             "--out_path", OUTPUT_FILE
         ]
         # Run the command
         result = subprocess.run(command, capture_output=True, text=True)
         if result.returncode != 0:
             raise Exception(f"Error: {result.stderr}")
+        # Return the full path to the generated output file
+        return os.path.join(os.getcwd(), OUTPUT_FILE)
     except Exception as e:
         return str(e)
+    finally:
+        # Change back to the original directory
+        os.chdir(original_dir)
 # Create the Gradio interface
 interface = gr.Interface(
     fn=generate_speech,