"""Demo script: synthesize one utterance with SparkTTS and save it as a WAV.

The script loads a SparkTTS model, calls ``inference`` with a target text
plus a reference recording and that recording's transcript, and writes the
result to ``output.wav`` in the same directory as this file.
"""

import os

import soundfile as sf
import torch

from SparkTTS import SparkTTS

# NOTE(review): the model directory is a relative path, so it presumably
# resolves against the current working directory -- run from the repo root.
# The second argument looks like the target device; confirm against SparkTTS.
model = SparkTTS("weclone-audio/pretrained_models/Spark-TTS-0.5B", "cuda")

# The reference clip and the generated file both live beside this script.
script_dir = os.path.dirname(__file__)
reference_wav_path = os.path.join(script_dir, "sample.wav")
generated_wav_path = os.path.join(script_dir, "output.wav")

# Text to synthesize, and the transcript passed alongside the reference clip.
target_text = "晚上好啊,小可爱们,该睡觉了哦"
reference_text = "对,这就是我万人敬仰的太乙真人,虽然有点婴儿肥,但也掩不住我逼人的帅气。"

# Gradient tracking is disabled because this is inference only.
with torch.no_grad():
    wav = model.inference(
        text=target_text,
        prompt_speech_path=reference_wav_path,
        prompt_text=reference_text,
    )

# The file is written with a declared sample rate of 16000 Hz.
# NOTE(review): presumably this matches the model's output rate -- confirm.
sf.write(generated_wav_path, wav, samplerate=16000)

print("生成成功!")