Spaces:
Running
Running
| gpt-4o-mini-2024-07-18: | |
| model: gpt-4o-mini-2024-07-18 | |
| endpoints: null | |
| api_type: openai | |
| max_tokens: 8192 | |
| temperature: 0.7 | |
| organization: OpenAI | |
| gpt-4.1-mini-2025-04-14: | |
| model: gpt-4.1-mini-2025-04-14 | |
| endpoints: null | |
| api_type: openai | |
| max_tokens: 8192 | |
| temperature: 0.7 | |
| organization: OpenAI | |
| # gpt-5-mini-2025-08-07: | |
| # model: gpt-5-mini-2025-08-07 | |
| # endpoints: null | |
| # api_type: openai | |
| # max_tokens: 8192 | |
| # temperature: 0.7 | |
| # organization: OpenAI | |
| qwen3-max-2025-09-23: | |
| model: qwen3-max-2025-09-23 | |
| endpoints: | |
| - api_base: https://dashscope.aliyuncs.com/compatible-mode/v1 | |
| api_key: ${DASHSCOPE_API_KEY} | |
| api_type: openai | |
| max_tokens: 8192 | |
| temperature: 0.7 | |
| organization: Alibaba | |
| qwen3-coder-plus-2025-09-23: | |
| model: qwen3-coder-plus-2025-09-23 | |
| endpoints: | |
| - api_base: https://dashscope.aliyuncs.com/compatible-mode/v1 | |
| api_key: ${DASHSCOPE_API_KEY} | |
| api_type: openai | |
| max_tokens: 8192 | |
| temperature: 0.7 | |
| organization: Alibaba | |
| qwen3-coder-flash-2025-07-28: | |
| model: qwen3-coder-flash-2025-07-28 | |
| endpoints: | |
| - api_base: https://dashscope.aliyuncs.com/compatible-mode/v1 | |
| api_key: ${DASHSCOPE_API_KEY} | |
| api_type: openai | |
| max_tokens: 8192 | |
| temperature: 0.7 | |
| organization: Alibaba | |
| qwen3-next-80b-a3b-thinking: | |
| model: qwen3-next-80b-a3b-thinking | |
| endpoints: | |
| - api_base: https://dashscope.aliyuncs.com/compatible-mode/v1 | |
| api_key: ${DASHSCOPE_API_KEY} | |
| api_type: openai_thinking | |
| max_tokens: 8192 | |
| temperature: 0.7 | |
| organization: Alibaba | |
| qwen3-next-80b-a3b-instruct: | |
| model: qwen3-next-80b-a3b-instruct | |
| endpoints: | |
| - api_base: https://dashscope.aliyuncs.com/compatible-mode/v1 | |
| api_key: ${DASHSCOPE_API_KEY} | |
| api_type: openai | |
| max_tokens: 8192 | |
| temperature: 0.7 | |
| organization: Alibaba | |
| qwen3-235b-a22b-thinking-2507: | |
| model: qwen3-235b-a22b-thinking-2507 | |
| endpoints: | |
| - api_base: https://dashscope.aliyuncs.com/compatible-mode/v1 | |
| api_key: ${DASHSCOPE_API_KEY} | |
| api_type: openai_thinking | |
| max_tokens: 8192 | |
| temperature: 0.7 | |
| organization: Alibaba | |
| qwen3-235b-a22b-instruct-2507: | |
| model: qwen3-235b-a22b-instruct-2507 | |
| endpoints: | |
| - api_base: https://dashscope.aliyuncs.com/compatible-mode/v1 | |
| api_key: ${DASHSCOPE_API_KEY} | |
| api_type: openai | |
| max_tokens: 8192 | |
| temperature: 0.7 | |
| organization: Alibaba | |
| qwen3-30b-a3b-thinking-2507: | |
| model: qwen3-30b-a3b-thinking-2507 | |
| endpoints: | |
| - api_base: https://dashscope.aliyuncs.com/compatible-mode/v1 | |
| api_key: ${DASHSCOPE_API_KEY} | |
| api_type: openai_thinking | |
| max_tokens: 8192 | |
| temperature: 0.7 | |
| organization: Alibaba | |
| qwen3-30b-a3b-instruct-2507: | |
| model: qwen3-30b-a3b-instruct-2507 | |
| endpoints: | |
| - api_base: https://dashscope.aliyuncs.com/compatible-mode/v1 | |
| api_key: ${DASHSCOPE_API_KEY} | |
| api_type: openai | |
| max_tokens: 8192 | |
| temperature: 0.7 | |
| organization: Alibaba | |
| DeepSeek-V3.1-Terminus: | |
| model: deepseek-chat | |
| endpoints: | |
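| # NOTE: temporary endpoint - the URL path itself states it expires on 2025-10-15; remove or repoint this entry after that date. | |
| - api_base: https://api.deepseek.com/v3.1_terminus_expires_on_20251015 | |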
| api_key: ${DEEPSEEK_API_KEY} | |
| api_type: openai | |
| max_tokens: 8192 | |
| temperature: 0.7 | |
| organization: DeepSeek | |
| DeepSeek-V3.2-Exp: | |
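| # NOTE(review): "deepseek-chat" is the same model id used by the DeepSeek-V3.1-Terminus entry; the two differ only by api_base, so this entry tracks whatever the default endpoint currently serves - confirm it is still V3.2-Exp. | |
| model: deepseek-chat | |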
| endpoints: | |
| - api_base: https://api.deepseek.com | |
| api_key: ${DEEPSEEK_API_KEY} | |
| api_type: openai | |
| max_tokens: 8192 | |
| temperature: 0.7 | |
| organization: DeepSeek | |
| GLM-4.6: | |
| model: glm-4.6 | |
| endpoints: | |
| - api_base: https://api.z.ai/api/paas/v4/ | |
| api_key: ${Z_API_KEY} | |
| api_type: openai | |
| max_tokens: 8192 | |
| temperature: 0.7 | |
| organization: Zhipu AI | |
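| # NOTE(review): only entry in this section with an explicit weight; presumably a sampling weight, with the other entries relying on the loader's default - confirm. | |
| weight: 3.0 | |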
| # o1-2024-12-17: | |
| # model: o1-2024-12-17 | |
| # endpoints: null | |
| # api_type: openai | |
| # parallel: 32 | |
| # max_tokens: 8192 | |
| # temperature: 0.7 | |
| # organization: OpenAI | |
| # license: Proprietary | |
| # o4-mini-2025-04-16: | |
| # model: o4-mini-2025-04-16 | |
| # endpoints: null | |
| # api_type: openai_thinking | |
| # parallel: 32 | |
| # max_tokens: 8192 | |
| # temperature: 1.0 | |
| # organization: OpenAI | |
| # license: Proprietary | |
| # o3-mini-2025-01-31: | |
| # model: o3-mini-2025-01-31 | |
| # endpoints: null | |
| # api_type: openai_thinking | |
| # parallel: 32 | |
| # max_tokens: 8192 | |
| # temperature: 0.7 | |
| # organization: OpenAI | |
| # license: Proprietary | |
| # gemini-2.0-flash-001: | |
| # model: google/gemini-2.0-flash-001 | |
| # endpoints: | |
| # - api_base: https://openrouter.ai/api/v1 | |
| # api_key: ${OPENROUTER_API_KEY} | |
| # api_type: openai | |
| # parallel: 32 | |
| # max_tokens: 81920 | |
| # temperature: 0.7 | |
| # organization: Google | |
| # license: Proprietary | |
| # gemini-2.5-pro: | |
| # model: google/gemini-2.5-pro | |
| # endpoints: | |
| # - api_base: https://openrouter.ai/api/v1 | |
| # api_key: ${OPENROUTER_API_KEY} | |
| # api_type: openai | |
| # parallel: 32 | |
| # max_tokens: 8192 | |
| # temperature: 0.7 | |
| # organization: Google | |
| # license: Proprietary | |
| # gemini-2.5-flash: | |
| # model: google/gemini-2.5-flash | |
| # endpoints: | |
| # - api_base: https://openrouter.ai/api/v1 | |
| # api_key: ${OPENROUTER_API_KEY} | |
| # api_type: openai | |
| # parallel: 32 | |
| # max_tokens: 8192 | |
| # temperature: 0.7 | |
| # organization: Google | |
| # license: Proprietary | |
| # claude35_haiku: | |
| # model: bedrock/anthropic.claude-3-5-haiku-20241022-v1:0 | |
| # endpoints: null | |
| # api_type: litellm | |
| # parallel: 32 | |
| # max_tokens: 8192 | |
| # temperature: 0.7 | |
| # organization: Anthropic | |
| # license: Proprietary | |
| # claude35_sonnet: | |
| # model: bedrock/anthropic.claude-3-5-sonnet-20241022-v2:0 | |
| # endpoints: null | |
| # api_type: litellm | |
| # parallel: 32 | |
| # max_tokens: 8192 | |
| # temperature: 0.7 | |
| # organization: Anthropic | |
| # license: Proprietary | |
| # claude37_sonnet: | |
| # model: bedrock/us.anthropic.claude-3-7-sonnet-20250219-v1:0 | |
| # endpoints: null | |
| # api_type: litellm | |
| # parallel: 32 | |
| # max_tokens: 8192 | |
| # temperature: 0.7 | |
| # organization: Anthropic | |
| # license: Proprietary | |
| # qwen3-coder: | |
| # model: qwen/qwen3-coder | |
| # endpoints: | |
| # - api_base: https://openrouter.ai/api/v1 | |
| # api_key: ${OPENROUTER_API_KEY} | |
| # api_type: openai | |
| # parallel: 32 | |
| # max_tokens: 8192 | |
| # temperature: 0.7 | |
| # organization: Alibaba | |
| # license: Apache 2.0 | |
| # kimi-k2: | |
| # model: moonshotai/kimi-k2 | |
| # endpoints: | |
| # - api_base: https://openrouter.ai/api/v1 | |
| # api_key: ${OPENROUTER_API_KEY} | |
| # api_type: openai | |
| # parallel: 32 | |
| # max_tokens: 8192 | |
| # temperature: 0.7 | |
| # organization: Moonshot | |
| # license: Modified MIT | |
| # claude-4-sonnet: | |
| # model: bedrock/us.anthropic.claude-sonnet-4-20250514-v1:0 | |
| # endpoints: null | |
| # api_type: litellm | |
| # parallel: 16 | |
| # max_tokens: 8192 | |
| # temperature: 0.7 | |
| # organization: Anthropic | |
| # license: Proprietary | |
| # claude-4-opus: | |
| # model: bedrock/us.anthropic.claude-opus-4-20250514-v1:0 | |
| # endpoints: null | |
| # api_type: litellm | |
| # parallel: 16 | |
| # max_tokens: 8192 | |
| # temperature: 0.7 | |
| # organization: Anthropic | |
| # license: Proprietary | |
| # gpt-oss-120b: | |
| # model: openai/gpt-oss-120b | |
| # endpoints: | |
| # - api_base: https://openrouter.ai/api/v1 | |
| # api_key: ${OPENROUTER_API_KEY} | |
| # api_type: openai_thinking | |
| # parallel: 32 | |
| # max_tokens: 8192 | |
| # temperature: 1.0 | |
| # organization: OpenAI | |
| # license: MIT | |
| # gpt-oss-20b: | |
| # model: openai/gpt-oss-20b | |
| # endpoints: | |
| # - api_base: https://openrouter.ai/api/v1 | |
| # api_key: ${OPENROUTER_API_KEY} | |
| # api_type: openai_thinking | |
| # parallel: 32 | |
| # max_tokens: 8192 | |
| # temperature: 1.0 | |
| # organization: OpenAI | |
| # license: MIT | |
| # deepseek-chat-v3-0324: | |
| # model: deepseek/deepseek-chat-v3-0324 | |
| # endpoints: | |
| # - api_base: https://openrouter.ai/api/v1 | |
| # api_key: ${OPENROUTER_API_KEY} | |
| # api_type: openai | |
| # parallel: 32 | |
| # max_tokens: 8192 | |
| # temperature: 0.7 | |
| # organization: DeepSeek | |
| # license: MIT | |
| # deepseek-chat-v3.1: | |
| # model: deepseek-chat | |
| # endpoints: | |
| # - api_base: https://api.deepseek.com | |
| # api_key: ${DEEPSEEK_API_KEY} | |
| # api_type: openai | |
| # parallel: 32 | |
| # max_tokens: 8192 | |
| # temperature: 0.7 | |
| # organization: DeepSeek | |
| # license: MIT | |
| # glm-4.5: | |
| # model: z-ai/glm-4.5 | |
| # endpoints: | |
| # - api_base: https://openrouter.ai/api/v1 | |
| # api_key: ${OPENROUTER_API_KEY} | |
| # api_type: openai | |
| # parallel: 32 | |
| # max_tokens: 8192 | |
| # temperature: 0.7 | |
| # organization: Zhipu AI | |
| # license: Custom | |
| # gpt-4.1-2025-04-14: | |
| # model: gpt-4.1-2025-04-14 | |
| # endpoints: null | |
| # api_type: openai | |
| # parallel: 32 | |
| # max_tokens: 8192 | |
| # temperature: 0.7 | |
| # organization: OpenAI | |
| # license: Proprietary | |
| # deepseek-r1-0528: | |
| # model: deepseek/deepseek-r1-0528 | |
| # endpoints: | |
| # - api_base: https://openrouter.ai/api/v1 | |
| # api_key: ${OPENROUTER_API_KEY} | |
| # api_type: openai_thinking | |
| # parallel: 32 | |
| # max_tokens: 81920 | |
| # temperature: 1.0 | |
| # organization: DeepSeek | |
| # license: MIT | |
| # gpt-5-2025-08-07: | |
| # model: gpt-5-2025-08-07 | |
| # endpoints: null | |
| # api_type: openai_thinking | |
| # parallel: 32 | |
| # max_tokens: 8192 | |
| # temperature: 1.0 | |
| # organization: OpenAI | |
| # license: Proprietary | |
| # grok-code: | |
| # model: x-ai/grok-code-fast-1 | |
| # endpoints: | |
| # - api_base: https://openrouter.ai/api/v1 | |
| # api_key: ${OPENROUTER_API_KEY} | |
| # api_type: openai_thinking | |
| # parallel: 32 | |
| # max_tokens: 8192 | |
| # temperature: 1.0 | |
| # organization: xAI | |
| # license: Proprietary |