neutts-air

Running

playmak3r committed on Oct 18

Commit

743b8f5

1 Parent(s): a8f789a

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,21 +1,27 @@
 import spaces
-import os
-import sys
 sys.path.append("neutts-air")
 from neuttsair.neutts import NeuTTSAir
 import numpy as np
 import gradio as gr
 SAMPLES_PATH = os.path.join(os.getcwd(), "neutts-air", "samples")
 DEFAULT_REF_TEXT = "So I'm live on radio. And I say, well, my dear friend James here clearly, and the whole room just froze. Turns out I'd completely misspoken and mentioned our other friend."
 DEFAULT_REF_PATH = os.path.join(SAMPLES_PATH, "dave.wav")
 DEFAULT_GEN_TEXT = "My name is Dave, and um, I'm from London."
 tts = NeuTTSAir(
     backbone_repo="neuphonic/neutts-air",
-    backbone_device="cuda",
     codec_repo="neuphonic/neucodec",
-    codec_device="cuda"
 )
 @spaces.GPU()
@@ -35,6 +41,7 @@ def infer(
         tuple [int, np.ndarray]: A tuple containing the sample rate (24000) and the generated audio waveform as a numpy array.
     """
     gr.Info("Starting inference request!")
     gr.Info("Encoding reference...")
     ref_codes = tts.encode_reference(ref_audio_path)

 import spaces
+import os, sys, logging
 sys.path.append("neutts-air")
 from neuttsair.neutts import NeuTTSAir
 import numpy as np
 import gradio as gr
 SAMPLES_PATH = os.path.join(os.getcwd(), "neutts-air", "samples")
 DEFAULT_REF_TEXT = "So I'm live on radio. And I say, well, my dear friend James here clearly, and the whole room just froze. Turns out I'd completely misspoken and mentioned our other friend."
 DEFAULT_REF_PATH = os.path.join(SAMPLES_PATH, "dave.wav")
 DEFAULT_GEN_TEXT = "My name is Dave, and um, I'm from London."
+logging.basicConfig(
+    level=logging.INFO,
+    format="%(asctime)s [%(levelname)s] %(message)s",
+    stream=sys.stdout
+)
 tts = NeuTTSAir(
     backbone_repo="neuphonic/neutts-air",
+    backbone_device="cpu",
     codec_repo="neuphonic/neucodec",
+    codec_device="cpu"
 )
 @spaces.GPU()
         tuple [int, np.ndarray]: A tuple containing the sample rate (24000) and the generated audio waveform as a numpy array.
     """
+    logging.info(f"Using reference: {ref_audio_path}")
     gr.Info("Starting inference request!")
     gr.Info("Encoding reference...")
     ref_codes = tts.encode_reference(ref_audio_path)