{
  "llm_model": "llm.mnn",
  "llm_weight": "llm.mnn.weight",
  "embedding_file": "embeddings_int4.bin",
  "backend_type": "cpu",
  "thread_num": 4,
  "precision": "low",
  "memory": "low",
  "mllm": {
    "backend_type": "cpu",
    "thread_num": 4,
    "precision": "low",
    "memory": "low"
  },
  "sampler_type": "mixed",
  "mixed_samplers": [
    "penalty",
    "topK",
    "topP",
    "min_p",
    "temperature"
  ],
  "penalty": 1.2,
  "temperature": 0.7,
  "topP": 0.8,
  "topK": 20,
  "min_p": 0,
  "max_new_tokens": 16384
}

