CapSpeech-TTS

Running on Zero

Upload 518 files

dd9600d verified 10 days ago

658 Bytes

	# CapSpeech AgentDB data-preparation pipeline.
	#
	# Runs four Python scripts in order, all sharing the same SAVE_DIR:
	#   1. preprocess_agenttts.py
	#   2. phonemize_no_se.py
	#   3. caption.py
	#   4. filemaker_no_se.py
	#
	# Before running: set WAV_DIR below to the downloaded capspeech-agentdb
	# wav path. The script refuses to start while it is empty.

	# Stop at the first failing stage (or on use of an unset variable) so that
	# later stages never run against missing or partial output.
	set -eu

	export CUDA_VISIBLE_DEVICES=0

	SAVE_DIR='./agent_data' # to save processed data
	CACHE_DIR='./cache' # to save dataset cache
	WAV_DIR='' # downloaded capspeech-agentdb wav path
	CPUS=30
	# NOTE(review): N_WORKERS and BATCH_SIZE are not referenced by any command
	# in this script; kept in case something outside this view relies on them.
	N_WORKERS=8
	BATCH_SIZE=64
	HUB='OpenSound/CapSpeech'

	# An empty WAV_DIR previously expanded to nothing, leaving `--wav_dir`
	# without a value on the command line. Fail early with a clear message.
	if [ -z "${WAV_DIR}" ]; then
		printf '%s\n' 'error: WAV_DIR is empty; set it to the downloaded capspeech-agentdb wav path' >&2
		exit 1
	fi

	# Stage 1: preprocess the train_AgentDB and test_AgentDB splits.
	# All expansions are quoted so paths with spaces reach Python as one argument.
	python preprocess_agenttts.py \
		--hub "${HUB}" \
		--save_dir "${SAVE_DIR}" \
		--cache_dir "${CACHE_DIR}" \
		--wav_dir "${WAV_DIR}" \
		--splits train_AgentDB test_AgentDB \
		--audio_min_length 2.0 \
		--audio_max_length 20.0

	# Stage 2: phonemization over SAVE_DIR, given CPUS as --num_cpus.
	python phonemize_no_se.py \
		--save_dir "${SAVE_DIR}" \
		--num_cpus "${CPUS}"

	# Stage 3: caption step over SAVE_DIR.
	python caption.py \
		--save_dir "${SAVE_DIR}"

	# Stage 4: file-maker step over SAVE_DIR.
	python filemaker_no_se.py \
		--save_dir "${SAVE_DIR}"