# Handles processing of wav & text instructions import codecs import json import random from gxl_ai_utils.utils import utils_file import torch import os # asr+X task_names = [ "age", "gender", "style", "emotion", "caption" ] map_dict = { "