# arena / api_config.yaml
# terryyz's picture
# Update api_config.yaml
# df3bf84 verified
# OpenAI entry. `endpoints: null` supplies no custom base URL or key here;
# presumably the client falls back to its default endpoint and credentials
# — TODO confirm against the config loader.
gpt-4o-mini-2024-07-18:
  model: gpt-4o-mini-2024-07-18
  endpoints: null
  api_type: openai
  max_tokens: 8192
  temperature: 0.7
  organization: OpenAI
# OpenAI entry with no explicit endpoint list (`endpoints: null`).
# NOTE(review): how a null endpoint list is resolved is decided by the
# consumer of this file — verify there.
gpt-4.1-mini-2025-04-14:
  model: gpt-4.1-mini-2025-04-14
  endpoints: null
  api_type: openai
  max_tokens: 8192
  temperature: 0.7
  organization: OpenAI
# gpt-5-mini-2025-08-07:
#   model: gpt-5-mini-2025-08-07
#   endpoints: null
#   api_type: openai
#   max_tokens: 8192
#   temperature: 0.7
#   organization: OpenAI
# Alibaba Qwen entry routed through the DashScope compatible-mode URL with
# `api_type: openai`. `${DASHSCOPE_API_KEY}` is a placeholder; presumably
# the loader substitutes it from the environment — TODO confirm.
qwen3-max-2025-09-23:
  model: qwen3-max-2025-09-23
  endpoints:
    - api_base: https://dashscope.aliyuncs.com/compatible-mode/v1
      api_key: ${DASHSCOPE_API_KEY}
  api_type: openai
  max_tokens: 8192
  temperature: 0.7
  organization: Alibaba
# Qwen3 Coder Plus via the DashScope compatible-mode endpoint.
# `api_key` belongs to the single `endpoints` list item, next to `api_base`.
qwen3-coder-plus-2025-09-23:
  model: qwen3-coder-plus-2025-09-23
  endpoints:
    - api_base: https://dashscope.aliyuncs.com/compatible-mode/v1
      api_key: ${DASHSCOPE_API_KEY}
  api_type: openai
  max_tokens: 8192
  temperature: 0.7
  organization: Alibaba
# Qwen3 Coder Flash via the DashScope compatible-mode endpoint.
# The key is given as the `${DASHSCOPE_API_KEY}` placeholder, not a literal.
qwen3-coder-flash-2025-07-28:
  model: qwen3-coder-flash-2025-07-28
  endpoints:
    - api_base: https://dashscope.aliyuncs.com/compatible-mode/v1
      api_key: ${DASHSCOPE_API_KEY}
  api_type: openai
  max_tokens: 8192
  temperature: 0.7
  organization: Alibaba
# Thinking variant of Qwen3-Next 80B: uses `api_type: openai_thinking`,
# whereas the matching instruct entry uses `openai`.
# NOTE(review): what `openai_thinking` changes in request/response handling
# is defined by the consumer — verify there.
qwen3-next-80b-a3b-thinking:
  model: qwen3-next-80b-a3b-thinking
  endpoints:
    - api_base: https://dashscope.aliyuncs.com/compatible-mode/v1
      api_key: ${DASHSCOPE_API_KEY}
  api_type: openai_thinking
  max_tokens: 8192
  temperature: 0.7
  organization: Alibaba
# Instruct variant of Qwen3-Next 80B via the DashScope compatible-mode
# endpoint, using the plain `openai` api_type.
qwen3-next-80b-a3b-instruct:
  model: qwen3-next-80b-a3b-instruct
  endpoints:
    - api_base: https://dashscope.aliyuncs.com/compatible-mode/v1
      api_key: ${DASHSCOPE_API_KEY}
  api_type: openai
  max_tokens: 8192
  temperature: 0.7
  organization: Alibaba
# Thinking variant of Qwen3 235B-A22B (2507): `api_type: openai_thinking`,
# served from the DashScope compatible-mode endpoint.
qwen3-235b-a22b-thinking-2507:
  model: qwen3-235b-a22b-thinking-2507
  endpoints:
    - api_base: https://dashscope.aliyuncs.com/compatible-mode/v1
      api_key: ${DASHSCOPE_API_KEY}
  api_type: openai_thinking
  max_tokens: 8192
  temperature: 0.7
  organization: Alibaba
# Instruct variant of Qwen3 235B-A22B (2507) via the DashScope
# compatible-mode endpoint, using the plain `openai` api_type.
qwen3-235b-a22b-instruct-2507:
  model: qwen3-235b-a22b-instruct-2507
  endpoints:
    - api_base: https://dashscope.aliyuncs.com/compatible-mode/v1
      api_key: ${DASHSCOPE_API_KEY}
  api_type: openai
  max_tokens: 8192
  temperature: 0.7
  organization: Alibaba
# Thinking variant of Qwen3 30B-A3B (2507): `api_type: openai_thinking`,
# served from the DashScope compatible-mode endpoint.
qwen3-30b-a3b-thinking-2507:
  model: qwen3-30b-a3b-thinking-2507
  endpoints:
    - api_base: https://dashscope.aliyuncs.com/compatible-mode/v1
      api_key: ${DASHSCOPE_API_KEY}
  api_type: openai_thinking
  max_tokens: 8192
  temperature: 0.7
  organization: Alibaba
# Instruct variant of Qwen3 30B-A3B (2507) via the DashScope
# compatible-mode endpoint, using the plain `openai` api_type.
qwen3-30b-a3b-instruct-2507:
  model: qwen3-30b-a3b-instruct-2507
  endpoints:
    - api_base: https://dashscope.aliyuncs.com/compatible-mode/v1
      api_key: ${DASHSCOPE_API_KEY}
  api_type: openai
  max_tokens: 8192
  temperature: 0.7
  organization: Alibaba
# DeepSeek V3.1-Terminus. Shares `model: deepseek-chat` with the
# DeepSeek-V3.2-Exp entry; only the api_base distinguishes the two.
# NOTE(review): the api_base path is literally labelled
# "expires_on_20251015", so this endpoint is presumably temporary — plan to
# remove or repoint this entry once it stops responding.
DeepSeek-V3.1-Terminus:
  model: deepseek-chat
  endpoints:
    - api_base: https://api.deepseek.com/v3.1_terminus_expires_on_20251015
      api_key: ${DEEPSEEK_API_KEY}
  api_type: openai
  max_tokens: 8192
  temperature: 0.7
  organization: DeepSeek
# DeepSeek V3.2-Exp, requested as `deepseek-chat` on the root DeepSeek API
# base URL. The display name (the key) and the `model` id sent to the API
# differ on purpose: the same model id is also used by the
# DeepSeek-V3.1-Terminus entry with a different api_base.
DeepSeek-V3.2-Exp:
  model: deepseek-chat
  endpoints:
    - api_base: https://api.deepseek.com
      api_key: ${DEEPSEEK_API_KEY}
  api_type: openai
  max_tokens: 8192
  temperature: 0.7
  organization: DeepSeek
# Zhipu AI GLM-4.6 via the z.ai endpoint with `api_type: openai`.
# This is the only active entry that sets `weight`.
# NOTE(review): presumably a relative sampling weight, with entries that
# omit it taking the consumer's default — confirm against the loader.
GLM-4.6:
  model: glm-4.6
  endpoints:
    - api_base: https://api.z.ai/api/paas/v4/
      api_key: ${Z_API_KEY}
  api_type: openai
  max_tokens: 8192
  temperature: 0.7
  organization: Zhipu AI
  weight: 3.0
# o1-2024-12-17:
#   model: o1-2024-12-17
#   endpoints: null
#   api_type: openai
#   parallel: 32
#   max_tokens: 8192
#   temperature: 0.7
#   organization: OpenAI
#   license: Proprietary
# o4-mini-2025-04-16:
#   model: o4-mini-2025-04-16
#   endpoints: null
#   api_type: openai_thinking
#   parallel: 32
#   max_tokens: 8192
#   temperature: 1.0
#   organization: OpenAI
#   license: Proprietary
# o3-mini-2025-01-31:
#   model: o3-mini-2025-01-31
#   endpoints: null
#   api_type: openai_thinking
#   parallel: 32
#   max_tokens: 8192
#   temperature: 0.7
#   organization: OpenAI
#   license: Proprietary
# gemini-2.0-flash-001:
#   model: google/gemini-2.0-flash-001
#   endpoints:
#     - api_base: https://openrouter.ai/api/v1
#       api_key: ${OPENROUTER_API_KEY}
#   api_type: openai
#   parallel: 32
#   max_tokens: 81920
#   temperature: 0.7
#   organization: Google
#   license: Proprietary
# gemini-2.5-pro:
#   model: google/gemini-2.5-pro
#   endpoints:
#     - api_base: https://openrouter.ai/api/v1
#       api_key: ${OPENROUTER_API_KEY}
#   api_type: openai
#   parallel: 32
#   max_tokens: 8192
#   temperature: 0.7
#   organization: Google
#   license: Proprietary
# gemini-2.5-flash:
#   model: google/gemini-2.5-flash
#   endpoints:
#     - api_base: https://openrouter.ai/api/v1
#       api_key: ${OPENROUTER_API_KEY}
#   api_type: openai
#   parallel: 32
#   max_tokens: 8192
#   temperature: 0.7
#   organization: Google
#   license: Proprietary
# claude35_haiku:
#   model: bedrock/anthropic.claude-3-5-haiku-20241022-v1:0
#   endpoints: null
#   api_type: litellm
#   parallel: 32
#   max_tokens: 8192
#   temperature: 0.7
#   organization: Anthropic
#   license: Proprietary
# claude35_sonnet:
#   model: bedrock/anthropic.claude-3-5-sonnet-20241022-v2:0
#   endpoints: null
#   api_type: litellm
#   parallel: 32
#   max_tokens: 8192
#   temperature: 0.7
#   organization: Anthropic
#   license: Proprietary
# claude37_sonnet:
#   model: bedrock/us.anthropic.claude-3-7-sonnet-20250219-v1:0
#   endpoints: null
#   api_type: litellm
#   parallel: 32
#   max_tokens: 8192
#   temperature: 0.7
#   organization: Anthropic
#   license: Proprietary
# qwen3-coder:
#   model: qwen/qwen3-coder
#   endpoints:
#     - api_base: https://openrouter.ai/api/v1
#       api_key: ${OPENROUTER_API_KEY}
#   api_type: openai
#   parallel: 32
#   max_tokens: 8192
#   temperature: 0.7
#   organization: Alibaba
#   license: Apache 2.0
# kimi-k2:
#   model: moonshotai/kimi-k2
#   endpoints:
#     - api_base: https://openrouter.ai/api/v1
#       api_key: ${OPENROUTER_API_KEY}
#   api_type: openai
#   parallel: 32
#   max_tokens: 8192
#   temperature: 0.7
#   organization: Moonshot
#   license: Modified MIT
# claude-4-sonnet:
#   model: bedrock/us.anthropic.claude-sonnet-4-20250514-v1:0
#   endpoints: null
#   api_type: litellm
#   parallel: 16
#   max_tokens: 8192
#   temperature: 0.7
#   organization: Anthropic
#   license: Proprietary
# claude-4-opus:
#   model: bedrock/us.anthropic.claude-opus-4-20250514-v1:0
#   endpoints: null
#   api_type: litellm
#   parallel: 16
#   max_tokens: 8192
#   temperature: 0.7
#   organization: Anthropic
#   license: Proprietary
# gpt-oss-120b:
#   model: openai/gpt-oss-120b
#   endpoints:
#     - api_base: https://openrouter.ai/api/v1
#       api_key: ${OPENROUTER_API_KEY}
#   api_type: openai_thinking
#   parallel: 32
#   max_tokens: 8192
#   temperature: 1.0
#   organization: OpenAI
#   license: MIT
# gpt-oss-20b:
#   model: openai/gpt-oss-20b
#   endpoints:
#     - api_base: https://openrouter.ai/api/v1
#       api_key: ${OPENROUTER_API_KEY}
#   api_type: openai_thinking
#   parallel: 32
#   max_tokens: 8192
#   temperature: 1.0
#   organization: OpenAI
#   license: MIT
# deepseek-chat-v3-0324:
#   model: deepseek/deepseek-chat-v3-0324
#   endpoints:
#     - api_base: https://openrouter.ai/api/v1
#       api_key: ${OPENROUTER_API_KEY}
#   api_type: openai
#   parallel: 32
#   max_tokens: 8192
#   temperature: 0.7
#   organization: DeepSeek
#   license: MIT
# deepseek-chat-v3.1:
#   model: deepseek-chat
#   endpoints:
#     - api_base: https://api.deepseek.com
#       api_key: ${DEEPSEEK_API_KEY}
#   api_type: openai
#   parallel: 32
#   max_tokens: 8192
#   temperature: 0.7
#   organization: DeepSeek
#   license: MIT
# glm-4.5:
#   model: z-ai/glm-4.5
#   endpoints:
#     - api_base: https://openrouter.ai/api/v1
#       api_key: ${OPENROUTER_API_KEY}
#   api_type: openai
#   parallel: 32
#   max_tokens: 8192
#   temperature: 0.7
#   organization: Zhipu AI
#   license: Custom
# gpt-4.1-2025-04-14:
#   model: gpt-4.1-2025-04-14
#   endpoints: null
#   api_type: openai
#   parallel: 32
#   max_tokens: 8192
#   temperature: 0.7
#   organization: OpenAI
#   license: Proprietary
# deepseek-r1-0528:
#   model: deepseek/deepseek-r1-0528
#   endpoints:
#     - api_base: https://openrouter.ai/api/v1
#       api_key: ${OPENROUTER_API_KEY}
#   api_type: openai_thinking
#   parallel: 32
#   max_tokens: 81920
#   temperature: 1.0
#   organization: DeepSeek
#   license: MIT
# gpt-5-2025-08-07:
#   model: gpt-5-2025-08-07
#   endpoints: null
#   api_type: openai_thinking
#   parallel: 32
#   max_tokens: 8192
#   temperature: 1.0
#   organization: OpenAI
#   license: Proprietary
# grok-code:
#   model: x-ai/grok-code-fast-1
#   endpoints:
#     - api_base: https://openrouter.ai/api/v1
#       api_key: ${OPENROUTER_API_KEY}
#   api_type: openai_thinking
#   parallel: 32
#   max_tokens: 8192
#   temperature: 1.0
#   organization: xAI
#   license: Proprietary