File size: 856 Bytes
287c28c |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 |
# Runs main.py on the "indictts" dataset for language "ta" with the
# "fastpitch" model; results are directed to output/ta via --output_path.
# NOTE(review): the t/f values look like boolean switches parsed by main.py,
# and the epochs/lr options suggest this is a training run -- confirm against
# main.py's argument parser.
#
# One option per line. Each backslash must be the LAST character on its line:
# a backslash followed by a space escapes the space instead of continuing the
# command, which would pass options with a leading blank to main.py.
python3 main.py \
  --dataset_name indictts \
  --language ta \
  --speaker all \
  --max_audio_len 441000 \
  --max_text_len 400 \
  --audio_config without_norm \
  --model fastpitch \
  --hidden_channels 512 \
  --use_speaker_embedding t \
  --use_d_vector_file f \
  --use_speaker_encoder_as_loss f \
  --use_ssim_loss f \
  --use_aligner t \
  --use_separate_optimizers f \
  --use_pre_computed_alignments f \
  --batch_size 32 \
  --batch_size_eval 32 \
  --batch_group_size 0 \
  --epochs 2500 \
  --aligner_epochs 2500 \
  --lr 0.0001 \
  --lr_scheduler NoamLR \
  --lr_scheduler_warmup_steps 4000 \
  --lr_scheduler_step_size 500 \
  --lr_scheduler_gamma 0.1 \
  --lr_scheduler_threshold_step 500 \
  --num_workers 0 \
  --num_workers_eval 0 \
  --output_path output/ta \
  --mixed_precision t