Spaces:
Running
on
Zero
Running
on
Zero
from ..llama_configs import LLAMA_CONFIGS | |
class T3Config:
    """Configuration values for a T3 TTS model.

    The only constructor argument is the size of the text-token vocabulary;
    every other setting is a fixed value assigned in ``__init__``.  Use
    :meth:`english_only` or :meth:`multilingual` to build the two named
    variants.
    """

    # Text-vocabulary sizes of the two named variants.  Kept in one place so
    # that ``is_multilingual`` and the named constructors cannot disagree.
    _ENGLISH_TEXT_VOCAB_SIZE = 704
    _MULTILINGUAL_TEXT_VOCAB_SIZE = 2352

    def __init__(self, text_tokens_dict_size: int = 704) -> None:
        """Populate the configuration.

        Args:
            text_tokens_dict_size: Size of the text-token vocabulary.  The
                default (704) matches :meth:`english_only`; 2352 is the value
                that :meth:`is_multilingual` recognises.
        """
        # Text-token settings.
        self.start_text_token = 255
        self.stop_text_token = 0
        self.text_tokens_dict_size = text_tokens_dict_size
        self.max_text_tokens = 2048

        # Speech-token settings.
        self.start_speech_token = 6561
        self.stop_speech_token = 6562
        self.speech_tokens_dict_size = 8194
        self.max_speech_tokens = 4096

        # Key into LLAMA_CONFIGS; read by ``n_channels``.
        self.llama_config_name = "Llama_520M"
        self.input_pos_emb = "learned"

        # NOTE(review): the remaining values look like conditioning /
        # speaker-encoder options -- confirm against the code that reads them.
        self.speech_cond_prompt_len = 150
        self.encoder_type = "voice_encoder"
        self.speaker_embed_size = 256
        self.use_perceiver_resampler = True
        self.emotion_adv = True

    def n_channels(self):
        """Return the ``"hidden_size"`` entry of the selected Llama config.

        Raises:
            KeyError: If ``llama_config_name`` is not a key of
                ``LLAMA_CONFIGS`` or the entry has no ``"hidden_size"``.
        """
        return LLAMA_CONFIGS[self.llama_config_name]["hidden_size"]

    def is_multilingual(self) -> bool:
        """Return True when the text vocabulary size is the multilingual one."""
        return self.text_tokens_dict_size == self._MULTILINGUAL_TEXT_VOCAB_SIZE

    @classmethod
    def english_only(cls) -> "T3Config":
        """Create configuration for English-only TTS model."""
        return cls(text_tokens_dict_size=cls._ENGLISH_TEXT_VOCAB_SIZE)

    @classmethod
    def multilingual(cls) -> "T3Config":
        """Create configuration for multilingual TTS model."""
        return cls(text_tokens_dict_size=cls._MULTILINGUAL_TEXT_VOCAB_SIZE)