File size: 856 Bytes
287c28c
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
# Launch main.py with a fixed set of command-line options.
#
# The option list is accumulated in the positional parameters, one logical
# group at a time, and handed to python3 in a single call at the end. The
# order of the options is the order in which they are appended below.
#
# NOTE(review): the values "t" and "f" are presumably boolean true/false
# switches -- confirm against main.py's argument parser.

# Dataset, language and speaker selection.
set -- \
  --dataset_name indictts \
  --language ta \
  --speaker all

# Length limits and audio configuration.
set -- "$@" \
  --max_audio_len 441000 \
  --max_text_len 400 \
  --audio_config without_norm

# Model selection and size.
set -- "$@" \
  --model fastpitch \
  --hidden_channels 512

# Feature switches (--use_* options).
set -- "$@" \
  --use_speaker_embedding t \
  --use_d_vector_file f \
  --use_speaker_encoder_as_loss f \
  --use_ssim_loss f \
  --use_aligner t \
  --use_separate_optimizers f \
  --use_pre_computed_alignments f

# Batch sizing.
set -- "$@" \
  --batch_size 32 \
  --batch_size_eval 32 \
  --batch_group_size 0

# Epoch counts.
set -- "$@" \
  --epochs 2500 \
  --aligner_epochs 2500

# Learning rate and scheduler options.
set -- "$@" \
  --lr 0.0001 \
  --lr_scheduler NoamLR \
  --lr_scheduler_warmup_steps 4000 \
  --lr_scheduler_step_size 500 \
  --lr_scheduler_gamma 0.1 \
  --lr_scheduler_threshold_step 500

# Worker counts.
set -- "$@" \
  --num_workers 0 \
  --num_workers_eval 0

# Output location and precision switch.
set -- "$@" \
  --output_path output/ta \
  --mixed_precision t

# Last command in the script, so its exit status becomes the script's status.
python3 main.py "$@"