{
  "llm_model": "llm.mnn",
  "llm_weight": "llm.mnn.weight",
  "embedding_file": "embeddings_int4.bin",
  "backend_type": "cpu",
  "thread_num": 4,
  "precision": "low",
  "memory": "low",
  "mllm": {
    "backend_type": "cpu",
    "thread_num": 4,
    "precision": "low",
    "memory": "low"
  },
  "sampler_type": "mixed",
  "mixed_samplers": [
    "penalty",
    "topK",
    "topP",
    "min_p",
    "temperature"
  ],
  "penalty": 1.0,
  "temperature": 1.0,
  "topP": 0.95,
  "topK": 20,
  "min_p": 0,
  "max_new_tokens": 40960
}