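# NOTE(review): the next three lines look like page-header residue rather than
# configuration; kept as comments so they cannot be parsed as keys.
# Spaces:
# Running
# Running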
# OpenAI gpt-4o-mini snapshot. `endpoints: null` gives no explicit
# api_base/api_key here — presumably the client's defaults are used
# (TODO confirm against the config loader).
gpt-4o-mini-2024-07-18:
  model: gpt-4o-mini-2024-07-18
  endpoints: null
  api_type: openai
  max_tokens: 8192
  temperature: 0.7
  organization: OpenAI
# OpenAI gpt-4.1-mini snapshot. `endpoints: null` gives no explicit
# api_base/api_key here — presumably the client's defaults are used
# (TODO confirm against the config loader).
gpt-4.1-mini-2025-04-14:
  model: gpt-4.1-mini-2025-04-14
  endpoints: null
  api_type: openai
  max_tokens: 8192
  temperature: 0.7
  organization: OpenAI
# gpt-5-mini-2025-08-07: | |
# model: gpt-5-mini-2025-08-07 | |
# endpoints: null | |
# api_type: openai | |
# max_tokens: 8192 | |
# temperature: 0.7 | |
# organization: OpenAI | |
# Qwen3-Max snapshot, called with api_type `openai` against the DashScope
# compatible-mode base URL. `${DASHSCOPE_API_KEY}` is a placeholder —
# presumably expanded from the environment by the loader (TODO confirm).
qwen3-max-2025-09-23:
  model: qwen3-max-2025-09-23
  endpoints:
    - api_base: https://dashscope.aliyuncs.com/compatible-mode/v1
      api_key: ${DASHSCOPE_API_KEY}
  api_type: openai
  max_tokens: 8192
  temperature: 0.7
  organization: Alibaba
# Qwen3-Coder-Plus snapshot, called with api_type `openai` against the
# DashScope compatible-mode base URL. `${DASHSCOPE_API_KEY}` is a placeholder —
# presumably expanded from the environment by the loader (TODO confirm).
qwen3-coder-plus-2025-09-23:
  model: qwen3-coder-plus-2025-09-23
  endpoints:
    - api_base: https://dashscope.aliyuncs.com/compatible-mode/v1
      api_key: ${DASHSCOPE_API_KEY}
  api_type: openai
  max_tokens: 8192
  temperature: 0.7
  organization: Alibaba
# Qwen3-Coder-Flash snapshot, called with api_type `openai` against the
# DashScope compatible-mode base URL. `${DASHSCOPE_API_KEY}` is a placeholder —
# presumably expanded from the environment by the loader (TODO confirm).
qwen3-coder-flash-2025-07-28:
  model: qwen3-coder-flash-2025-07-28
  endpoints:
    - api_base: https://dashscope.aliyuncs.com/compatible-mode/v1
      api_key: ${DASHSCOPE_API_KEY}
  api_type: openai
  max_tokens: 8192
  temperature: 0.7
  organization: Alibaba
# Qwen3-Next 80B-A3B, thinking variant, on the DashScope compatible-mode
# base URL. Uses api_type `openai_thinking` instead of `openai` — presumably
# this selects a handler for reasoning output (TODO confirm in the client code).
qwen3-next-80b-a3b-thinking:
  model: qwen3-next-80b-a3b-thinking
  endpoints:
    - api_base: https://dashscope.aliyuncs.com/compatible-mode/v1
      api_key: ${DASHSCOPE_API_KEY}
  api_type: openai_thinking
  max_tokens: 8192
  temperature: 0.7
  organization: Alibaba
# Qwen3-Next 80B-A3B, instruct variant, called with api_type `openai` against
# the DashScope compatible-mode base URL. `${DASHSCOPE_API_KEY}` is a
# placeholder — presumably expanded from the environment (TODO confirm).
qwen3-next-80b-a3b-instruct:
  model: qwen3-next-80b-a3b-instruct
  endpoints:
    - api_base: https://dashscope.aliyuncs.com/compatible-mode/v1
      api_key: ${DASHSCOPE_API_KEY}
  api_type: openai
  max_tokens: 8192
  temperature: 0.7
  organization: Alibaba
# Qwen3 235B-A22B, thinking variant (2507), on the DashScope compatible-mode
# base URL. Uses api_type `openai_thinking` instead of `openai` — presumably
# this selects a handler for reasoning output (TODO confirm in the client code).
qwen3-235b-a22b-thinking-2507:
  model: qwen3-235b-a22b-thinking-2507
  endpoints:
    - api_base: https://dashscope.aliyuncs.com/compatible-mode/v1
      api_key: ${DASHSCOPE_API_KEY}
  api_type: openai_thinking
  max_tokens: 8192
  temperature: 0.7
  organization: Alibaba
# Qwen3 235B-A22B, instruct variant (2507), called with api_type `openai`
# against the DashScope compatible-mode base URL. `${DASHSCOPE_API_KEY}` is a
# placeholder — presumably expanded from the environment (TODO confirm).
qwen3-235b-a22b-instruct-2507:
  model: qwen3-235b-a22b-instruct-2507
  endpoints:
    - api_base: https://dashscope.aliyuncs.com/compatible-mode/v1
      api_key: ${DASHSCOPE_API_KEY}
  api_type: openai
  max_tokens: 8192
  temperature: 0.7
  organization: Alibaba
# Qwen3 30B-A3B, thinking variant (2507), on the DashScope compatible-mode
# base URL. Uses api_type `openai_thinking` instead of `openai` — presumably
# this selects a handler for reasoning output (TODO confirm in the client code).
qwen3-30b-a3b-thinking-2507:
  model: qwen3-30b-a3b-thinking-2507
  endpoints:
    - api_base: https://dashscope.aliyuncs.com/compatible-mode/v1
      api_key: ${DASHSCOPE_API_KEY}
  api_type: openai_thinking
  max_tokens: 8192
  temperature: 0.7
  organization: Alibaba
# Qwen3 30B-A3B, instruct variant (2507), called with api_type `openai`
# against the DashScope compatible-mode base URL. `${DASHSCOPE_API_KEY}` is a
# placeholder — presumably expanded from the environment (TODO confirm).
qwen3-30b-a3b-instruct-2507:
  model: qwen3-30b-a3b-instruct-2507
  endpoints:
    - api_base: https://dashscope.aliyuncs.com/compatible-mode/v1
      api_key: ${DASHSCOPE_API_KEY}
  api_type: openai
  max_tokens: 8192
  temperature: 0.7
  organization: Alibaba
# DeepSeek V3.1-Terminus. The request model id is the generic `deepseek-chat`;
# this entry is distinguished by its api_base path.
# NOTE(review): the path contains `expires_on_20251015` — presumably the
# endpoint stops serving after 2025-10-15; confirm and retire this entry then.
DeepSeek-V3.1-Terminus:
  model: deepseek-chat
  endpoints:
    - api_base: https://api.deepseek.com/v3.1_terminus_expires_on_20251015
      api_key: ${DEEPSEEK_API_KEY}
  api_type: openai
  max_tokens: 8192
  temperature: 0.7
  organization: DeepSeek
# DeepSeek V3.2-Exp, addressed as the generic `deepseek-chat` model id on the
# plain https://api.deepseek.com base URL.
# NOTE(review): the entry name pins a version but the model id does not —
# verify that `deepseek-chat` on this base URL still resolves to V3.2-Exp.
DeepSeek-V3.2-Exp:
  model: deepseek-chat
  endpoints:
    - api_base: https://api.deepseek.com
      api_key: ${DEEPSEEK_API_KEY}
  api_type: openai
  max_tokens: 8192
  temperature: 0.7
  organization: DeepSeek
# GLM-4.6, called with api_type `openai` against the z.ai base URL.
# `${Z_API_KEY}` is a placeholder — presumably expanded from the environment
# by the loader (TODO confirm).
GLM-4.6:
  model: glm-4.6
  endpoints:
    - api_base: https://api.z.ai/api/paas/v4/
      api_key: ${Z_API_KEY}
  api_type: openai
  max_tokens: 8192
  temperature: 0.7
  organization: Zhipu AI
  # Extra `weight` field on this entry; presumably a relative sampling weight
  # for model selection — TODO confirm how the loader uses it.
  weight: 3.0
# o1-2024-12-17: | |
# model: o1-2024-12-17 | |
# endpoints: null | |
# api_type: openai | |
# parallel: 32 | |
# max_tokens: 8192 | |
# temperature: 0.7 | |
# organization: OpenAI | |
# license: Proprietary | |
# o4-mini-2025-04-16: | |
# model: o4-mini-2025-04-16 | |
# endpoints: null | |
# api_type: openai_thinking | |
# parallel: 32 | |
# max_tokens: 8192 | |
# temperature: 1.0 | |
# organization: OpenAI | |
# license: Proprietary | |
# o3-mini-2025-01-31: | |
# model: o3-mini-2025-01-31 | |
# endpoints: null | |
# api_type: openai_thinking | |
# parallel: 32 | |
# max_tokens: 8192 | |
# temperature: 0.7 | |
# organization: OpenAI | |
# license: Proprietary | |
# gemini-2.0-flash-001: | |
# model: google/gemini-2.0-flash-001 | |
# endpoints: | |
# - api_base: https://openrouter.ai/api/v1 | |
# api_key: ${OPENROUTER_API_KEY} | |
# api_type: openai | |
# parallel: 32 | |
# max_tokens: 81920 | |
# temperature: 0.7 | |
# organization: Google | |
# license: Proprietary | |
# gemini-2.5-pro: | |
# model: google/gemini-2.5-pro | |
# endpoints: | |
# - api_base: https://openrouter.ai/api/v1 | |
# api_key: ${OPENROUTER_API_KEY} | |
# api_type: openai | |
# parallel: 32 | |
# max_tokens: 8192 | |
# temperature: 0.7 | |
# organization: Google | |
# license: Proprietary | |
# gemini-2.5-flash: | |
# model: google/gemini-2.5-flash | |
# endpoints: | |
# - api_base: https://openrouter.ai/api/v1 | |
# api_key: ${OPENROUTER_API_KEY} | |
# api_type: openai | |
# parallel: 32 | |
# max_tokens: 8192 | |
# temperature: 0.7 | |
# organization: Google | |
# license: Proprietary | |
# claude35_haiku: | |
# model: bedrock/anthropic.claude-3-5-haiku-20241022-v1:0 | |
# endpoints: null | |
# api_type: litellm | |
# parallel: 32 | |
# max_tokens: 8192 | |
# temperature: 0.7 | |
# organization: Anthropic | |
# license: Proprietary | |
# claude35_sonnet: | |
# model: bedrock/anthropic.claude-3-5-sonnet-20241022-v2:0 | |
# endpoints: null | |
# api_type: litellm | |
# parallel: 32 | |
# max_tokens: 8192 | |
# temperature: 0.7 | |
# organization: Anthropic | |
# license: Proprietary | |
# claude37_sonnet: | |
# model: bedrock/us.anthropic.claude-3-7-sonnet-20250219-v1:0 | |
# endpoints: null | |
# api_type: litellm | |
# parallel: 32 | |
# max_tokens: 8192 | |
# temperature: 0.7 | |
# organization: Anthropic | |
# license: Proprietary | |
# qwen3-coder: | |
# model: qwen/qwen3-coder | |
# endpoints: | |
# - api_base: https://openrouter.ai/api/v1 | |
# api_key: ${OPENROUTER_API_KEY} | |
# api_type: openai | |
# parallel: 32 | |
# max_tokens: 8192 | |
# temperature: 0.7 | |
# organization: Alibaba | |
# license: Apache 2.0 | |
# kimi-k2: | |
# model: moonshotai/kimi-k2 | |
# endpoints: | |
# - api_base: https://openrouter.ai/api/v1 | |
# api_key: ${OPENROUTER_API_KEY} | |
# api_type: openai | |
# parallel: 32 | |
# max_tokens: 8192 | |
# temperature: 0.7 | |
# organization: Moonshot | |
# license: Modified MIT | |
# claude-4-sonnet: | |
# model: bedrock/us.anthropic.claude-sonnet-4-20250514-v1:0 | |
# endpoints: null | |
# api_type: litellm | |
# parallel: 16 | |
# max_tokens: 8192 | |
# temperature: 0.7 | |
# organization: Anthropic | |
# license: Proprietary | |
# claude-4-opus: | |
# model: bedrock/us.anthropic.claude-opus-4-20250514-v1:0 | |
# endpoints: null | |
# api_type: litellm | |
# parallel: 16 | |
# max_tokens: 8192 | |
# temperature: 0.7 | |
# organization: Anthropic | |
# license: Proprietary | |
# gpt-oss-120b: | |
# model: openai/gpt-oss-120b | |
# endpoints: | |
# - api_base: https://openrouter.ai/api/v1 | |
# api_key: ${OPENROUTER_API_KEY} | |
# api_type: openai_thinking | |
# parallel: 32 | |
# max_tokens: 8192 | |
# temperature: 1.0 | |
# organization: OpenAI | |
# license: MIT | |
# gpt-oss-20b: | |
# model: openai/gpt-oss-20b | |
# endpoints: | |
# - api_base: https://openrouter.ai/api/v1 | |
# api_key: ${OPENROUTER_API_KEY} | |
# api_type: openai_thinking | |
# parallel: 32 | |
# max_tokens: 8192 | |
# temperature: 1.0 | |
# organization: OpenAI | |
# license: MIT | |
# deepseek-chat-v3-0324: | |
# model: deepseek/deepseek-chat-v3-0324 | |
# endpoints: | |
# - api_base: https://openrouter.ai/api/v1 | |
# api_key: ${OPENROUTER_API_KEY} | |
# api_type: openai | |
# parallel: 32 | |
# max_tokens: 8192 | |
# temperature: 0.7 | |
# organization: DeepSeek | |
# license: MIT | |
# deepseek-chat-v3.1: | |
# model: deepseek-chat | |
# endpoints: | |
# - api_base: https://api.deepseek.com | |
# api_key: ${DEEPSEEK_API_KEY} | |
# api_type: openai | |
# parallel: 32 | |
# max_tokens: 8192 | |
# temperature: 0.7 | |
# organization: DeepSeek | |
# license: MIT | |
# glm-4.5: | |
# model: z-ai/glm-4.5 | |
# endpoints: | |
# - api_base: https://openrouter.ai/api/v1 | |
# api_key: ${OPENROUTER_API_KEY} | |
# api_type: openai | |
# parallel: 32 | |
# max_tokens: 8192 | |
# temperature: 0.7 | |
# organization: Zhipu AI | |
# license: Custom | |
# gpt-4.1-2025-04-14: | |
# model: gpt-4.1-2025-04-14 | |
# endpoints: null | |
# api_type: openai | |
# parallel: 32 | |
# max_tokens: 8192 | |
# temperature: 0.7 | |
# organization: OpenAI | |
# license: Proprietary | |
# deepseek-r1-0528: | |
# model: deepseek/deepseek-r1-0528 | |
# endpoints: | |
# - api_base: https://openrouter.ai/api/v1 | |
# api_key: ${OPENROUTER_API_KEY} | |
# api_type: openai_thinking | |
# parallel: 32 | |
# max_tokens: 81920 | |
# temperature: 1.0 | |
# organization: DeepSeek | |
# license: MIT | |
# gpt-5-2025-08-07: | |
# model: gpt-5-2025-08-07 | |
# endpoints: null | |
# api_type: openai_thinking | |
# parallel: 32 | |
# max_tokens: 8192 | |
# temperature: 1.0 | |
# organization: OpenAI | |
# license: Proprietary | |
# grok-code: | |
# model: x-ai/grok-code-fast-1 | |
# endpoints: | |
# - api_base: https://openrouter.ai/api/v1 | |
# api_key: ${OPENROUTER_API_KEY} | |
# api_type: openai_thinking | |
# parallel: 32 | |
# max_tokens: 8192 | |
# temperature: 1.0 | |
# organization: xAI | |
# license: Proprietary |