diff --git a/conf/all_models.json b/conf/all_models.json index 8eb3ae9c9e..3916428d7b 100644 --- a/conf/all_models.json +++ b/conf/all_models.json @@ -3530,8 +3530,7 @@ { "name": "zai-org/embedding-3", "alias": [ - "embedding-3", - "Embedding-3" + "embedding-3" ], "max_tokens": 8192, "max_dimension": 2048, @@ -3548,8 +3547,7 @@ { "name": "zai-org/embedding-2", "alias": [ - "embedding-2", - "Embedding-2" + "embedding-2" ], "max_tokens": 8192, "max_dimension": 1024, @@ -3571,9 +3569,7 @@ { "name": "zai-org/scail-2", "alias": [ - "zai-org/SCAIL-2", - "SCAIL-2", - "scail-2" + "SCAIL-2" ], "model_types": [ "image_generation" @@ -3582,9 +3578,7 @@ { "name": "zai-org/glm-5.1-fp8", "alias": [ - "zai-org/GLM-5.1-FP8", - "GLM-5.1-FP8", - "glm-5.1-fp8" + "GLM-5.1-FP8" ], "max_tokens": 202752, "model_types": [ @@ -3598,13 +3592,12 @@ { "name": "zai-org/glm-5.1", "alias": [ - "zai-org/GLM-5.1", "GLM-5.1", - "glm-5.1", "z-ai/glm-5.1", "ZHIPU/GLM-5.1", "Pro/zai-org/GLM-5.1", - "Z-AI/GLM 5.1" + "Z-AI/GLM 5.1", + "GLM 5.1 FP4" ], "max_tokens": 202752, "model_types": [ @@ -3613,16 +3606,16 @@ "thinking": { "default_value": true, "clear_thinking": true - } + }, + "max_completion_tokens": 131072 }, { "name": "zai-org/glm-5", "alias": [ - "zai-org/GLM-5", "GLM-5", - "glm-5", "z-ai/glm-5", - "ZHIPU/GLM-5" + "ZHIPU/GLM-5", + "GLM 5 Fp4" ], "max_tokens": 202752, "model_types": [ @@ -3631,14 +3624,13 @@ "thinking": { "default_value": true, "clear_thinking": true - } + }, + "max_completion_tokens": 131072 }, { "name": "zai-org/glm-5-fp8", "alias": [ - "zai-org/GLM-5-FP8", - "GLM-5-FP8", - "glm-5-fp8" + "GLM-5-FP8" ], "max_tokens": 202752, "model_types": [ @@ -3652,23 +3644,22 @@ { "name": "zai-org/glm-ocr", "alias": [ - "zai-org/GLM-OCR", "GLM-OCR", - "glm-ocr" + "GLM OCR" ], "max_tokens": 655380, "model_types": [ "chat", "image2text", - "vision" - ] + "vision", + "ocr" + ], + "max_completion_tokens": 32000 }, { "name": "zai-org/glm-4.7-flash", "alias": [ - "zai-org/GLM-4.7-Flash", "GLM-4.7-Flash", - "glm-4.7-flash", "z-ai/glm-4.7-flash" ], "max_tokens": 202752, @@ -3678,14 +3669,13 @@ "thinking": { "default_value": true, "clear_thinking": true - } + }, + "max_completion_tokens": 128000 }, { "name": "zai-org/glm-image", "alias": [ - "zai-org/GLM-Image", - "GLM-Image", - "glm-image" + "GLM-Image" ], "model_types": [ "text-to-image", @@ -3695,9 +3685,8 @@ { "name": "zai-org/glm-4.7-fp8", "alias": [ - "zai-org/GLM-4.7-FP8", "GLM-4.7-FP8", - "glm-4.7-fp8" + "Glm 4.7 Fp8" ], "max_tokens": 202752, "model_types": [ @@ -3711,9 +3700,7 @@ { "name": "zai-org/glm-4.7", "alias": [ - "zai-org/GLM-4.7", "GLM-4.7", - "glm-4.7", "z-ai/glm-4.7", "Pro/zai-org/GLM-4.7", "Z-Ai/GLM 4.7" @@ -3725,14 +3712,13 @@ "thinking": { "default_value": true, "clear_thinking": true - } + }, + "max_completion_tokens": 131072 }, { "name": "zai-org/realvideo", "alias": [ - "zai-org/RealVideo", - "RealVideo", - "realvideo" + "RealVideo" ], "model_types": [ "omni" @@ -3741,9 +3727,7 @@ { "name": "zai-org/glm-tts", "alias": [ - "zai-org/GLM-TTS", - "GLM-TTS", - "glm-tts" + "GLM-TTS" ], "model_types": [ "tts" @@ -3752,9 +3736,7 @@ { "name": "zai-org/glm-asr-nano-2512", "alias": [ - "zai-org/GLM-ASR-Nano-2512", - "GLM-ASR-Nano-2512", - "glm-asr-nano-2512" + "GLM-ASR-Nano-2512" ], "max_tokens": 65536, "model_types": [ @@ -3765,23 +3747,20 @@ { "name": "zai-org/autoglm-phone-9b-multilingual", "alias": [ - "zai-org/AutoGLM-Phone-9B-Multilingual", - "AutoGLM-Phone-9B-Multilingual", - "autoglm-phone-9b-multilingual" + "AutoGLM-Phone-9B-Multilingual" ], "max_tokens": 64000, "model_types": [ "chat", "image2text", "vision" - ] + ], + "max_completion_tokens": 65536 }, { "name": "zai-org/scail-preview", "alias": [ - "zai-org/SCAIL-Preview", - "SCAIL-Preview", - "scail-preview" + "SCAIL-Preview" ], "model_types": [ "image_generation" @@ -3790,9 +3769,7 @@ { "name": "zai-org/autoglm-phone-9b", "alias": [ - "zai-org/AutoGLM-Phone-9B", - "AutoGLM-Phone-9B", - "autoglm-phone-9b" + "AutoGLM-Phone-9B" ], "max_tokens": 64000, "model_types": [ @@ -3804,9 +3781,7 @@ { "name": "zai-org/glm-4.6v-fp8", "alias": [ - "zai-org/GLM-4.6V-FP8", - "GLM-4.6V-FP8", - "glm-4.6v-fp8" + "GLM-4.6V-FP8" ], "max_tokens": 128000, "model_types": [ @@ -3822,10 +3797,9 @@ { "name": "zai-org/glm-4.6v", "alias": [ - "zai-org/GLM-4.6V", "GLM-4.6V", - "glm-4.6v", - "z-ai/glm-4.6v" + "z-ai/glm-4.6v", + "GLM 4.6V" ], "max_tokens": 128000, "model_types": [ @@ -3836,14 +3810,14 @@ "thinking": { "default_value": true, "clear_thinking": true - } + }, + "max_completion_tokens": 32768 }, { "name": "zai-org/glm-4.6v-flash", "alias": [ - "zai-org/GLM-4.6V-Flash", "GLM-4.6V-Flash", - "glm-4.6v-flash" + "glm-4.6-flash" ], "max_tokens": 128000, "model_types": [ @@ -3859,9 +3833,7 @@ { "name": "zai-org/ssvae", "alias": [ - "zai-org/SSVAE", - "SSVAE", - "ssvae" + "SSVAE" ], "model_types": [ "chat" @@ -3870,9 +3842,7 @@ { "name": "zai-org/webvia-agent", "alias": [ - "zai-org/WebVIA-Agent", - "WebVIA-Agent", - "webvia-agent" + "WebVIA-Agent" ], "max_tokens": 65536, "model_types": [ @@ -3884,9 +3854,7 @@ { "name": "zai-org/ui2code_n", "alias": [ - "zai-org/UI2Code_N", - "UI2Code_N", - "ui2code_n" + "UI2Code_N" ], "max_tokens": 65536, "model_types": [ @@ -3898,9 +3866,7 @@ { "name": "zai-org/kaleido-14b-s2v", "alias": [ - "zai-org/Kaleido-14B-S2V", - "Kaleido-14B-S2V", - "kaleido-14b-s2v" + "Kaleido-14B-S2V" ], "model_types": [ "image_generation" @@ -3909,9 +3875,7 @@ { "name": "zai-org/glyph", "alias": [ - "zai-org/Glyph", - "Glyph", - "glyph" + "Glyph" ], "max_tokens": 128000, "model_types": [ @@ -3923,11 +3887,11 @@ { "name": "zai-org/glm-4.6", "alias": [ - "zai-org/GLM-4.6", "GLM-4.6", - "glm-4.6", "z-ai/glm-4.6", - "Z-AI/GLM 4.6" + "Z-AI/GLM 4.6", + "GLM 4.6", + "GLM 4.6 Fp8" ], "max_tokens": 202752, "model_types": [ @@ -3936,14 +3900,13 @@ "thinking": { "default_value": true, "clear_thinking": true - } + }, + "max_completion_tokens": 131072 }, { "name": "zai-org/glm-4.6-fp8", "alias": [ - "zai-org/GLM-4.6-FP8", - "GLM-4.6-FP8", - "glm-4.6-fp8" + "GLM-4.6-FP8" ], "max_tokens": 202752, "model_types": [ @@ -3957,10 +3920,9 @@ { "name": "zai-org/glm-4.5v", "alias": [ - "zai-org/GLM-4.5V", "GLM-4.5V", - "glm-4.5v", - "z-ai/glm-4.5v" + "z-ai/glm-4.5v", + "GLM 4.5V" ], "max_tokens": 128000, "model_types": [ @@ -3971,14 +3933,13 @@ "thinking": { "default_value": true, "clear_thinking": true - } + }, + "max_completion_tokens": 16384 }, { "name": "zai-org/glm-4.5v-fp8", "alias": [ - "zai-org/GLM-4.5V-FP8", - "GLM-4.5V-FP8", - "glm-4.5v-fp8" + "GLM-4.5V-FP8" ], "max_tokens": 128000, "model_types": [ @@ -3994,9 +3955,7 @@ { "name": "zai-org/glm-4.5-base", "alias": [ - "zai-org/GLM-4.5-Base", - "GLM-4.5-Base", - "glm-4.5-base" + "GLM-4.5-Base" ], "max_tokens": 128000, "model_types": [ @@ -4010,9 +3969,8 @@ { "name": "zai-org/glm-4.5-air-fp8", "alias": [ - "zai-org/GLM-4.5-Air-FP8", "GLM-4.5-Air-FP8", - "glm-4.5-air-fp8" + "Glm 4.5 Air Fp8" ], "max_tokens": 128000, "model_types": [ @@ -4026,9 +3984,7 @@ { "name": "zai-org/glm-4.5-fp8", "alias": [ - "zai-org/GLM-4.5-FP8", - "GLM-4.5-FP8", - "glm-4.5-fp8" + "GLM-4.5-FP8" ], "max_tokens": 128000, "model_types": [ @@ -4042,9 +3998,7 @@ { "name": "zai-org/glm-4.5-air", "alias": [ - "zai-org/GLM-4.5-Air", "GLM-4.5-Air", - "glm-4.5-air", "z-ai/glm-4.5-air", "z-ai/glm-4.5-air:free", "GLM 4.5 Air (free)" @@ -4056,14 +4010,13 @@ "thinking": { "default_value": true, "clear_thinking": true - } + }, + "max_completion_tokens": 98304 }, { "name": "zai-org/glm-4.5", "alias": [ - "zai-org/GLM-4.5", "GLM-4.5", - "glm-4.5", "z-ai/glm-4.5", "GLM 4.5" ], @@ -4074,14 +4027,13 @@ "thinking": { "default_value": true, "clear_thinking": true - } + }, + "max_completion_tokens": 98304 }, { "name": "zai-org/glm-4.5-air-base", "alias": [ - "zai-org/GLM-4.5-Air-Base", - "GLM-4.5-Air-Base", - "glm-4.5-air-base" + "GLM-4.5-Air-Base" ], "max_tokens": 128000, "model_types": [ @@ -4095,9 +4047,7 @@ { "name": "zai-org/glm-4.1v-9b-thinking", "alias": [ - "zai-org/GLM-4.1V-9B-Thinking", - "GLM-4.1V-9B-Thinking", - "glm-4.1v-9b-thinking" + "GLM-4.1V-9B-Thinking" ], "max_tokens": 65536, "model_types": [ @@ -4113,9 +4063,7 @@ { "name": "zai-org/glm-4.1v-9b-base", "alias": [ - "zai-org/GLM-4.1V-9B-Base", - "GLM-4.1V-9B-Base", - "glm-4.1v-9b-base" + "GLM-4.1V-9B-Base" ], "max_tokens": 65536, "model_types": [ @@ -4147,9 +4095,7 @@ { "name": "zai-org/glm-z1-rumination-32b-0414", "alias": [ - "zai-org/GLM-Z1-Rumination-32B-0414", - "GLM-Z1-Rumination-32B-0414", - "glm-z1-rumination-32b-0414" + "GLM-Z1-Rumination-32B-0414" ], "max_tokens": 128000, "model_types": [ @@ -4163,9 +4109,7 @@ { "name": "zai-org/glm-z1-32b-0414", "alias": [ - "zai-org/GLM-Z1-32B-0414", - "GLM-Z1-32B-0414", - "glm-z1-32b-0414" + "GLM-Z1-32B-0414" ], "max_tokens": 128000, "model_types": [ @@ -4179,9 +4123,7 @@ { "name": "zai-org/glm-z1-9b-0414", "alias": [ - "zai-org/GLM-Z1-9B-0414", "GLM-Z1-9B-0414", - "glm-z1-9b-0414", "THUDM/GLM-Z1-9B-0414" ], "max_tokens": 128000, @@ -4196,9 +4138,7 @@ { "name": "zai-org/glm-4-32b-base-0414", "alias": [ - "zai-org/GLM-4-32B-Base-0414", - "GLM-4-32B-Base-0414", - "glm-4-32b-base-0414" + "GLM-4-32B-Base-0414" ], "max_tokens": 128000, "model_types": [ @@ -4208,22 +4148,19 @@ { "name": "zai-org/glm-4-32b-0414", "alias": [ - "zai-org/GLM-4-32B-0414", "GLM-4-32B-0414", - "glm-4-32b-0414", "THUDM/GLM-4-32B-0414" ], "max_tokens": 128000, "model_types": [ "chat" - ] + ], + "max_completion_tokens": 32000 }, { "name": "zai-org/glm-4-9b-0414", "alias": [ - "zai-org/GLM-4-9B-0414", - "GLM-4-9B-0414", - "glm-4-9b-0414" + "GLM-4-9B-0414" ], "max_tokens": 128000, "model_types": [ @@ -4233,9 +4170,7 @@ { "name": "zai-org/swe-dev-9b", "alias": [ - "zai-org/SWE-Dev-9B", - "SWE-Dev-9B", - "swe-dev-9b" + "SWE-Dev-9B" ], "max_tokens": 128000, "model_types": [ @@ -4245,9 +4180,7 @@ { "name": "zai-org/swe-dev-32b", "alias": [ - "zai-org/SWE-Dev-32B", - "SWE-Dev-32B", - "swe-dev-32b" + "SWE-Dev-32B" ], "max_tokens": 131072, "model_types": [ @@ -4257,9 +4190,7 @@ { "name": "zai-org/swe-dev-7b", "alias": [ - "zai-org/SWE-Dev-7B", - "SWE-Dev-7B", - "swe-dev-7b" + "SWE-Dev-7B" ], "max_tokens": 163840, "model_types": [ @@ -4269,9 +4200,7 @@ { "name": "zai-org/cogview4-6b", "alias": [ - "zai-org/CogView4-6B", - "CogView4-6B", - "cogview4-6b" + "CogView4-6B" ], "model_types": [ "text-to-image", @@ -4281,9 +4210,7 @@ { "name": "zai-org/visionreward-image-bf16", "alias": [ - "zai-org/VisionReward-Image-bf16", - "VisionReward-Image-bf16", - "visionreward-image-bf16" + "VisionReward-Image-bf16" ], "model_types": [ "chat", @@ -4316,9 +4243,7 @@ { "name": "zai-org/visionreward-image", "alias": [ - "zai-org/VisionReward-Image", - "VisionReward-Image", - "visionreward-image" + "VisionReward-Image" ], "model_types": [ "chat", @@ -4329,9 +4254,7 @@ { "name": "zai-org/visionreward-video", "alias": [ - "zai-org/VisionReward-Video", - "VisionReward-Video", - "visionreward-video" + "VisionReward-Video" ], "max_tokens": 2048, "model_types": [ @@ -4354,9 +4277,7 @@ { "name": "zai-org/mathglm-vision-19b", "alias": [ - "zai-org/MathGLM-Vision-19B", - "MathGLM-Vision-19B", - "mathglm-vision-19b" + "MathGLM-Vision-19B" ], "model_types": [ "chat" @@ -4365,9 +4286,7 @@ { "name": "zai-org/mathglm-vision", "alias": [ - "zai-org/MathGLM-Vision", - "MathGLM-Vision", - "mathglm-vision" + "MathGLM-Vision" ], "model_types": [ "chat" @@ -4494,9 +4413,7 @@ { "name": "zai-org/cogvideox1.5-5b-sat", "alias": [ - "zai-org/CogVideoX1.5-5B-SAT", - "CogVideoX1.5-5B-SAT", - "cogvideox1.5-5b-sat" + "CogVideoX1.5-5B-SAT" ], "model_types": [ "image_generation" @@ -4505,9 +4422,7 @@ { "name": "zai-org/cogvideox1.5-5b-i2v", "alias": [ - "zai-org/CogVideoX1.5-5B-I2V", - "CogVideoX1.5-5B-I2V", - "cogvideox1.5-5b-i2v" + "CogVideoX1.5-5B-I2V" ], "model_types": [ "image_generation" @@ -4516,9 +4431,7 @@ { "name": "zai-org/cogvideox1.5-5b", "alias": [ - "zai-org/CogVideoX1.5-5B", - "CogVideoX1.5-5B", - "cogvideox1.5-5b" + "CogVideoX1.5-5B" ], "model_types": [ "image_generation" @@ -4527,9 +4440,7 @@ { "name": "zai-org/longreward-glm4-9b-dpo", "alias": [ - "zai-org/LongReward-glm4-9b-DPO", - "LongReward-glm4-9b-DPO", - "longreward-glm4-9b-dpo" + "LongReward-glm4-9b-DPO" ], "max_tokens": 128000, "model_types": [ @@ -4587,9 +4498,7 @@ { "name": "zai-org/longreward-llama3.1-8b-dpo", "alias": [ - "zai-org/LongReward-llama3.1-8b-DPO", - "LongReward-llama3.1-8b-DPO", - "longreward-llama3.1-8b-dpo" + "LongReward-llama3.1-8b-DPO" ], "max_tokens": 65536, "model_types": [ @@ -4599,9 +4508,7 @@ { "name": "zai-org/cogview3-plus-3b", "alias": [ - "zai-org/CogView3-Plus-3B", - "CogView3-Plus-3B", - "cogview3-plus-3b" + "CogView3-Plus-3B" ], "model_types": [ "text-to-image", @@ -4623,9 +4530,7 @@ { "name": "zai-org/cogvideox-5b-i2v", "alias": [ - "zai-org/CogVideoX-5b-I2V", - "CogVideoX-5b-I2V", - "cogvideox-5b-i2v" + "CogVideoX-5b-I2V" ], "model_types": [ "image_generation" @@ -4634,9 +4539,7 @@ { "name": "zai-org/longcite-llama3.1-8b", "alias": [ - "zai-org/LongCite-llama3.1-8b", - "LongCite-llama3.1-8b", - "longcite-llama3.1-8b" + "LongCite-llama3.1-8b" ], "max_tokens": 131072, "model_types": [ @@ -4646,9 +4549,7 @@ { "name": "zai-org/longcite-glm4-9b", "alias": [ - "zai-org/LongCite-glm4-9b", - "LongCite-glm4-9b", - "longcite-glm4-9b" + "LongCite-glm4-9b" ], "max_tokens": 131072, "model_types": [ @@ -4658,9 +4559,7 @@ { "name": "zai-org/cogvideox-5b", "alias": [ - "zai-org/CogVideoX-5b", - "CogVideoX-5b", - "cogvideox-5b" + "CogVideoX-5b" ], "model_types": [ "image_generation" @@ -4669,9 +4568,7 @@ { "name": "zai-org/longwriter-glm4-9b", "alias": [ - "zai-org/LongWriter-glm4-9b", - "LongWriter-glm4-9b", - "longwriter-glm4-9b" + "LongWriter-glm4-9b" ], "max_tokens": 1048576, "model_types": [ @@ -4681,9 +4578,7 @@ { "name": "zai-org/longwriter-llama3.1-8b", "alias": [ - "zai-org/LongWriter-llama3.1-8b", - "LongWriter-llama3.1-8b", - "longwriter-llama3.1-8b" + "LongWriter-llama3.1-8b" ], "max_tokens": 131072, "model_types": [ @@ -4693,9 +4588,7 @@ { "name": "zai-org/cogvideox-2b", "alias": [ - "zai-org/CogVideoX-2b", - "CogVideoX-2b", - "cogvideox-2b" + "CogVideoX-2b" ], "model_types": [ "image_generation" @@ -4724,9 +4617,7 @@ { "name": "zai-org/codegeex4-all-9b-gguf", "alias": [ - "zai-org/codegeex4-all-9b-GGUF", - "codegeex4-all-9b-GGUF", - "codegeex4-all-9b-gguf" + "codegeex4-all-9b-GGUF" ], "max_tokens": 131072, "model_types": [ @@ -4772,9 +4663,7 @@ { "name": "zai-org/msagpt", "alias": [ - "zai-org/MSAGPT", - "MSAGPT", - "msagpt" + "MSAGPT" ], "model_types": [ "chat" @@ -4783,9 +4672,7 @@ { "name": "zai-org/cogvlm2-llama3-chat-19b-tgi", "alias": [ - "zai-org/cogvlm2-llama3-chat-19B-tgi", - "cogvlm2-llama3-chat-19B-tgi", - "cogvlm2-llama3-chat-19b-tgi" + "cogvlm2-llama3-chat-19B-tgi" ], "max_tokens": 8192, "model_types": [ @@ -4797,9 +4684,7 @@ { "name": "zai-org/cogvlm2-llama3-chinese-chat-19b-tgi", "alias": [ - "zai-org/cogvlm2-llama3-chinese-chat-19B-tgi", - "cogvlm2-llama3-chinese-chat-19B-tgi", - "cogvlm2-llama3-chinese-chat-19b-tgi" + "cogvlm2-llama3-chinese-chat-19B-tgi" ], "max_tokens": 8192, "model_types": [ @@ -4851,9 +4736,7 @@ { "name": "zai-org/cogvlm2-llama3-chinese-chat-19b-int4", "alias": [ - "zai-org/cogvlm2-llama3-chinese-chat-19B-int4", - "cogvlm2-llama3-chinese-chat-19B-int4", - "cogvlm2-llama3-chinese-chat-19b-int4" + "cogvlm2-llama3-chinese-chat-19B-int4" ], "max_tokens": 8192, "model_types": [ @@ -4865,9 +4748,7 @@ { "name": "zai-org/cogvlm2-llama3-chat-19b-int4", "alias": [ - "zai-org/cogvlm2-llama3-chat-19B-int4", - "cogvlm2-llama3-chat-19B-int4", - "cogvlm2-llama3-chat-19b-int4" + "cogvlm2-llama3-chat-19B-int4" ], "max_tokens": 8192, "model_types": [ @@ -4879,9 +4760,7 @@ { "name": "zai-org/cogvlm2-llama3-chinese-chat-19b", "alias": [ - "zai-org/cogvlm2-llama3-chinese-chat-19B", - "cogvlm2-llama3-chinese-chat-19B", - "cogvlm2-llama3-chinese-chat-19b" + "cogvlm2-llama3-chinese-chat-19B" ], "max_tokens": 8192, "model_types": [ @@ -4893,9 +4772,7 @@ { "name": "zai-org/cogvlm2-llama3-chat-19b", "alias": [ - "zai-org/cogvlm2-llama3-chat-19B", - "cogvlm2-llama3-chat-19B", - "cogvlm2-llama3-chat-19b" + "cogvlm2-llama3-chat-19B" ], "max_tokens": 8192, "model_types": [ @@ -4917,9 +4794,7 @@ { "name": "zai-org/longalign-13b-64k-base", "alias": [ - "zai-org/LongAlign-13B-64k-base", - "LongAlign-13B-64k-base", - "longalign-13b-64k-base" + "LongAlign-13B-64k-base" ], "max_tokens": 65536, "model_types": [ @@ -4929,9 +4804,7 @@ { "name": "zai-org/longalign-7b-64k-base", "alias": [ - "zai-org/LongAlign-7B-64k-base", - "LongAlign-7B-64k-base", - "longalign-7b-64k-base" + "LongAlign-7B-64k-base" ], "max_tokens": 65536, "model_types": [ @@ -4941,9 +4814,7 @@ { "name": "zai-org/longalign-6b-64k-base", "alias": [ - "zai-org/LongAlign-6B-64k-base", - "LongAlign-6B-64k-base", - "longalign-6b-64k-base" + "LongAlign-6B-64k-base" ], "max_tokens": 65536, "model_types": [ @@ -4953,9 +4824,7 @@ { "name": "zai-org/longalign-13b-64k", "alias": [ - "zai-org/LongAlign-13B-64k", - "LongAlign-13B-64k", - "longalign-13b-64k" + "LongAlign-13B-64k" ], "max_tokens": 65536, "model_types": [ @@ -4965,9 +4834,7 @@ { "name": "zai-org/longalign-6b-64k", "alias": [ - "zai-org/LongAlign-6B-64k", - "LongAlign-6B-64k", - "longalign-6b-64k" + "LongAlign-6B-64k" ], "max_tokens": 65536, "model_types": [ @@ -4977,9 +4844,7 @@ { "name": "zai-org/longalign-7b-64k", "alias": [ - "zai-org/LongAlign-7B-64k", - "LongAlign-7B-64k", - "longalign-7b-64k" + "LongAlign-7B-64k" ], "max_tokens": 65536, "model_types": [ @@ -4999,9 +4864,7 @@ { "name": "zai-org/cogagent", "alias": [ - "zai-org/CogAgent", - "CogAgent", - "cogagent" + "CogAgent" ], "model_types": [ "chat" @@ -5020,9 +4883,7 @@ { "name": "zai-org/bpo", "alias": [ - "zai-org/BPO", - "BPO", - "bpo" + "BPO" ], "max_tokens": 4096, "model_types": [ @@ -5122,9 +4983,7 @@ { "name": "zai-org/cogvlm", "alias": [ - "zai-org/CogVLM", - "CogVLM", - "cogvlm" + "CogVLM" ], "model_types": [ "chat" @@ -5153,9 +5012,7 @@ { "name": "zai-org/mathglm", "alias": [ - "zai-org/MathGLM", - "MathGLM", - "mathglm" + "MathGLM" ], "model_types": [ "chat" @@ -5224,9 +5081,7 @@ { "name": "zai-org/webglm-2b", "alias": [ - "zai-org/WebGLM-2B", - "WebGLM-2B", - "webglm-2b" + "WebGLM-2B" ], "max_tokens": 1024, "model_types": [ @@ -5236,9 +5091,7 @@ { "name": "zai-org/webglm", "alias": [ - "zai-org/WebGLM", - "WebGLM", - "webglm" + "WebGLM" ], "max_tokens": 1024, "model_types": [ @@ -5270,9 +5123,7 @@ { "name": "zai-org/imagereward", "alias": [ - "zai-org/ImageReward", - "ImageReward", - "imagereward" + "ImageReward" ], "model_types": [ "text-to-image", @@ -5362,9 +5213,7 @@ { "name": "zai-org/cogvideo", "alias": [ - "zai-org/CogVideo", - "CogVideo", - "cogvideo" + "CogVideo" ], "model_types": [ "image_generation" @@ -5373,9 +5222,7 @@ { "name": "zai-org/cogview2", "alias": [ - "zai-org/CogView2", - "CogView2", - "cogview2" + "CogView2" ], "model_types": [ "image_generation" @@ -5386,9 +5233,9 @@ "alias": [ "deepseek-chat", "deepseek-ai/DeepSeek-V4-Flash", - "deepseek-ai/deepseek-v4-flash", "deepseek/deepseek-v4-flash", - "deepseek-v4-flash-260425" + "deepseek-v4-flash-260425", + "Deepseek V4 Flash" ], "max_tokens": 1048576, "model_types": [ @@ -5397,14 +5244,14 @@ "thinking": { "default_value": true, "clear_thinking": true - } + }, + "max_completion_tokens": 393216 }, { "name": "deepseek-v4-flash-base", "alias": [ "deepseek/deepseek-v4-flash-base", - "deepseek-ai/DeepSeek-V4-Flash-Base", - "deepseek-ai/deepseek-v4-flash-base" + "deepseek-ai/DeepSeek-V4-Flash-Base" ], "max_tokens": 1048576, "model_types": [ @@ -5415,9 +5262,9 @@ "name": "deepseek-v4-pro", "alias": [ "deepseek-ai/DeepSeek-V4-Pro", - "deepseek-ai/deepseek-v4-pro", "deepseek/deepseek-v4-pro", - "deepseek-v4-pro-260425" + "deepseek-v4-pro-260425", + "Deepseek V4 Pro" ], "max_tokens": 1048576, "model_types": [ @@ -5426,14 +5273,14 @@ "thinking": { "default_value": true, "clear_thinking": true - } + }, + "max_completion_tokens": 393216 }, { "name": "deepseek-v4-pro-base", "alias": [ "deepseek/deepseek-v4-pro-base", - "deepseek-ai/DeepSeek-V4-Pro-Base", - "deepseek-ai/deepseek-v4-pro-base" + "deepseek-ai/DeepSeek-V4-Pro-Base" ], "max_tokens": 1048576, "model_types": [ @@ -5444,33 +5291,41 @@ "name": "deepseek-ocr-2", "alias": [ "deepseek-ai/DeepSeek-OCR-2", - "deepseek-ai/deepseek-ocr-2" + "Deepseek OCR 2" ], "max_tokens": 8192, "model_types": [ - "ocr" + "ocr", + "chat", + "vision", + "image2text" ] }, { "name": "deepseek-v3.2", "alias": [ "deepseek-ai/DeepSeek-V3.2", - "deepseek-ai/deepseek-v3.2", "deepseek/deepseek-v3.2", "Pro/deepseek-ai/DeepSeek-V3.2", "deepseek/deepseek-v3.2-251201", - "deepseek-v3-2-251201" + "deepseek-v3-2-251201", + "Deepseek V3.2", + "deepseek-v3-2" ], "max_tokens": 163840, "model_types": [ "chat" - ] + ], + "max_completion_tokens": 65536, + "thinking": { + "default_value": true, + "clear_thinking": true + } }, { "name": "deepseek-v3.2-speciale", "alias": [ - "deepseek-ai/DeepSeek-V3.2-Speciale", - "deepseek-ai/deepseek-v3.2-speciale" + "deepseek-ai/DeepSeek-V3.2-Speciale" ], "max_tokens": 163840, "model_types": [ @@ -5481,7 +5336,6 @@ "name": "deepseek-math-v2", "alias": [ "deepseek-ai/DeepSeek-Math-V2", - "deepseek-ai/deepseek-math-v2", "deepseek/deepseek-math-v2" ], "max_tokens": 163840, @@ -5493,31 +5347,39 @@ "name": "deepseek-ocr", "alias": [ "deepseek-ai/DeepSeek-OCR", - "deepseek-ai/deepseek-ocr" + "deepseek/deepseek-ocr" ], "max_tokens": 8192, "model_types": [ - "ocr" - ] + "ocr", + "chat", + "image2text", + "vision" + ], + "max_completion_tokens": 8192 }, { "name": "deepseek-v3.2-exp", "alias": [ "deepseek-ai/DeepSeek-V3.2-Exp", - "deepseek-ai/deepseek-v3.2-exp", "deepseek/deepseek-v3.2-exp", - "deepseek/deepseek-v3.2-exp-thinking" + "deepseek/deepseek-v3.2-exp-thinking", + "Deepseek V3.2 Exp" ], "max_tokens": 163840, "model_types": [ "chat" - ] + ], + "max_completion_tokens": 65536, + "thinking": { + "default_value": true, + "clear_thinking": true + } }, { "name": "deepseek-v3.2-exp-base", "alias": [ - "deepseek-ai/DeepSeek-V3.2-Exp-Base", - "deepseek-ai/deepseek-v3.2-exp-base" + "deepseek-ai/DeepSeek-V3.2-Exp-Base" ], "max_tokens": 163840, "model_types": [ @@ -5528,34 +5390,45 @@ "name": "deepseek-v3.1-terminus", "alias": [ "deepseek-ai/DeepSeek-V3.1-Terminus", - "deepseek-ai/deepseek-v3.1-terminus", "deepseek/deepseek-v3.1-terminus", "Pro/deepseek-ai/DeepSeek-V3.1-Terminus", - "deepseek/deepseek-v3.1-terminus-thinking" + "deepseek/deepseek-v3.1-terminus-thinking", + "Deepseek V3.1 Terminus" ], "max_tokens": 163840, "model_types": [ "chat" - ] + ], + "max_completion_tokens": 32768, + "thinking": { + "default_value": true, + "clear_thinking": true + } }, { "name": "deepseek-v3.1", "alias": [ "deepseek-ai/DeepSeek-V3.1", - "deepseek-ai/deepseek-v3.1", "deepseek/deepseek-chat-v3.1", - "deepseek-v3-1-250821" + "deepseek-v3-1-250821", + "deepseek-v3-1-terminus", + "deepseek-v3-1", + "Deepseek V3.1 NVFP4" ], "max_tokens": 163840, "model_types": [ "chat" - ] + ], + "max_completion_tokens": 32768, + "thinking": { + "default_value": true, + "clear_thinking": true + } }, { "name": "deepseek-v3.1-base", "alias": [ - "deepseek-ai/DeepSeek-V3.1-Base", - "deepseek-ai/deepseek-v3.1-base" + "deepseek-ai/DeepSeek-V3.1-Base" ], "max_tokens": 163840, "model_types": [ @@ -5566,32 +5439,39 @@ "name": "deepseek-r1-0528-qwen3-8b", "alias": [ "deepseek-ai/DeepSeek-R1-0528-Qwen3-8B", - "deepseek-ai/deepseek-r1-0528-qwen3-8b" + "deepseek/deepseek-r1-0528-qwen3-8b", + "DeepSeek R1 0528 Qwen3 8B" ], "max_tokens": 131072, "model_types": [ "chat" - ] + ], + "max_completion_tokens": 32000 }, { "name": "deepseek-r1-0528", "alias": [ "deepseek-ai/DeepSeek-R1-0528", - "deepseek-ai/deepseek-r1-0528", "deepseek/deepseek-r1-0528", "deepseek-r1-250528", - "Pro/deepseek-ai/DeepSeek-R1" + "Pro/deepseek-ai/DeepSeek-R1", + "DeepSeek R1 0528", + "DeepSeek R1 0528 NVFP4" ], "max_tokens": 163840, "model_types": [ "chat" - ] + ], + "max_completion_tokens": 32768, + "thinking": { + "default_value": true, + "clear_thinking": true + } }, { "name": "deepseek-prover-v2-671b", "alias": [ - "deepseek-ai/DeepSeek-Prover-V2-671B", - "deepseek-ai/deepseek-prover-v2-671b" + "deepseek-ai/DeepSeek-Prover-V2-671B" ], "max_tokens": 163840, "model_types": [ @@ -5601,8 +5481,7 @@ { "name": "deepseek-prover-v2-7b", "alias": [ - "deepseek-ai/DeepSeek-Prover-V2-7B", - "deepseek-ai/deepseek-prover-v2-7b" + "deepseek-ai/DeepSeek-Prover-V2-7B" ], "max_tokens": 32768, "model_types": [ @@ -5613,7 +5492,6 @@ "name": "deepseek-v3-0324", "alias": [ "deepseek-ai/DeepSeek-V3-0324", - "deepseek-ai/deepseek-v3-0324", "deepseek/deepseek-chat-v3-0324", "deepseek-v3-250324", "Pro/deepseek-ai/DeepSeek-V3" @@ -5621,40 +5499,50 @@ "max_tokens": 163840, "model_types": [ "chat" - ] + ], + "max_completion_tokens": 16384 }, { "name": "deepseek-r1", "alias": [ "deepseek-ai/DeepSeek-R1", - "deepseek-ai/deepseek-r1", "deepseek/deepseek-r1", - "DeepSeek-R1", "deepseek-r1-250120", - "deepseek-r1_32k" + "deepseek-r1_32k", + "deepseek-r1-searching", + "DeepSeek R1" ], "max_tokens": 163840, "model_types": [ "chat" - ] + ], + "max_completion_tokens": 16000, + "thinking": { + "default_value": true, + "clear_thinking": true + } }, { "name": "deepseek-r1-distill-llama-70b", "alias": [ "deepseek-ai/DeepSeek-R1-Distill-Llama-70B", - "deepseek-ai/deepseek-r1-distill-llama-70b", - "deepseek/deepseek-r1-distill-llama-70b" + "deepseek/deepseek-r1-distill-llama-70b", + "DeepSeek R1 Distill LLama 70B" ], "max_tokens": 131072, "model_types": [ "chat" - ] + ], + "max_completion_tokens": 8192, + "thinking": { + "default_value": true, + "clear_thinking": true + } }, { "name": "deepseek-r1-distill-llama-8b", "alias": [ - "deepseek-ai/DeepSeek-R1-Distill-Llama-8B", - "deepseek-ai/deepseek-r1-distill-llama-8b" + "deepseek-ai/DeepSeek-R1-Distill-Llama-8B" ], "max_tokens": 131072, "model_types": [ @@ -5665,54 +5553,73 @@ "name": "deepseek-r1-distill-qwen-1.5b", "alias": [ "deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B", - "deepseek-ai/deepseek-r1-distill-qwen-1.5b" + "DeepSeek R1 Distill Qwen 1.5B" ], "max_tokens": 131072, "model_types": [ "chat" - ] + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } }, { "name": "deepseek-r1-distill-qwen-14b", "alias": [ "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B", - "deepseek-ai/deepseek-r1-distill-qwen-14b" + "deepseek/deepseek-r1-distill-qwen-14b", + "DeepSeek R1 Distill Qwen 14B" ], "max_tokens": 131072, "model_types": [ "chat" - ] + ], + "max_completion_tokens": 16384, + "thinking": { + "default_value": true, + "clear_thinking": true + } }, { "name": "deepseek-r1-distill-qwen-32b", "alias": [ "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B", - "deepseek-ai/deepseek-r1-distill-qwen-32b", "deepseek/deepseek-r1-distill-qwen-32b", - "deepseek-r1-distill-qwen-32b-250120" + "deepseek-r1-distill-qwen-32b-250120", + "DeepSeek R1 Distill Qwen 32B" ], "max_tokens": 131072, "model_types": [ "chat" - ] + ], + "max_completion_tokens": 32000, + "thinking": { + "default_value": true, + "clear_thinking": true + } }, { "name": "deepseek-r1-distill-qwen-7b", "alias": [ "deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", - "deepseek-ai/deepseek-r1-distill-qwen-7b", - "deepseek-r1-distill-qwen-7b-250120" + "deepseek-r1-distill-qwen-7b-250120", + "DeepSeek R1 Distill Qwen 7B" ], "max_tokens": 131072, "model_types": [ "chat" - ] + ], + "thinking": { + "default_value": true, + "clear_thinking": true + }, + "max_completion_tokens": 8192 }, { "name": "deepseek-r1-zero", "alias": [ - "deepseek-ai/DeepSeek-R1-Zero", - "deepseek-ai/deepseek-r1-zero" + "deepseek-ai/DeepSeek-R1-Zero" ], "max_tokens": 163840, "model_types": [ @@ -5723,20 +5630,23 @@ "name": "deepseek-v3", "alias": [ "deepseek-ai/DeepSeek-V3", - "deepseek-ai/deepseek-v3", "deepseek/deepseek-chat", - "DeepSeek-V3" + "deepseek/deepseek_v3", + "deepseek_v3", + "DeepSeek V3", + "deepseek/deepseek-v3", + "deepseek-v3-241226" ], "max_tokens": 163840, "model_types": [ "chat" - ] + ], + "max_completion_tokens": 16000 }, { "name": "deepseek-v3-base", "alias": [ - "deepseek-ai/DeepSeek-V3-Base", - "deepseek-ai/deepseek-v3-base" + "deepseek-ai/DeepSeek-V3-Base" ], "max_tokens": 163840, "model_types": [ @@ -5776,8 +5686,7 @@ { "name": "deepseek-v2.5-1210", "alias": [ - "deepseek-ai/DeepSeek-V2.5-1210", - "deepseek-ai/deepseek-v2.5-1210" + "deepseek-ai/DeepSeek-V2.5-1210" ], "max_tokens": 163840, "model_types": [ @@ -5787,8 +5696,7 @@ { "name": "deepseek-coder-v2-instruct-0724", "alias": [ - "deepseek-ai/DeepSeek-Coder-V2-Instruct-0724", - "deepseek-ai/deepseek-coder-v2-instruct-0724" + "deepseek-ai/DeepSeek-Coder-V2-Instruct-0724" ], "max_tokens": 163840, "model_types": [ @@ -5798,8 +5706,7 @@ { "name": "deepseek-v2.5", "alias": [ - "deepseek-ai/DeepSeek-V2.5", - "deepseek-ai/deepseek-v2.5" + "deepseek-ai/DeepSeek-V2.5" ], "max_tokens": 163840, "model_types": [ @@ -5809,8 +5716,7 @@ { "name": "deepseek-prover-v1", "alias": [ - "deepseek-ai/DeepSeek-Prover-V1", - "deepseek-ai/deepseek-prover-v1" + "deepseek-ai/DeepSeek-Prover-V1" ], "max_tokens": 4096, "model_types": [ @@ -5820,8 +5726,7 @@ { "name": "deepseek-prover-v1.5-base", "alias": [ - "deepseek-ai/DeepSeek-Prover-V1.5-Base", - "deepseek-ai/deepseek-prover-v1.5-base" + "deepseek-ai/DeepSeek-Prover-V1.5-Base" ], "max_tokens": 4096, "model_types": [ @@ -5831,8 +5736,7 @@ { "name": "deepseek-prover-v1.5-rl", "alias": [ - "deepseek-ai/DeepSeek-Prover-V1.5-RL", - "deepseek-ai/deepseek-prover-v1.5-rl" + "deepseek-ai/DeepSeek-Prover-V1.5-RL" ], "max_tokens": 4096, "model_types": [ @@ -5842,8 +5746,7 @@ { "name": "deepseek-prover-v1.5-sft", "alias": [ - "deepseek-ai/DeepSeek-Prover-V1.5-SFT", - "deepseek-ai/deepseek-prover-v1.5-sft" + "deepseek-ai/DeepSeek-Prover-V1.5-SFT" ], "max_tokens": 4096, "model_types": [ @@ -5853,8 +5756,7 @@ { "name": "deepseek-v2-chat-0628", "alias": [ - "deepseek-ai/DeepSeek-V2-Chat-0628", - "deepseek-ai/deepseek-v2-chat-0628" + "deepseek-ai/DeepSeek-V2-Chat-0628" ], "max_tokens": 163840, "model_types": [ @@ -5864,8 +5766,7 @@ { "name": "deepseek-coder-v2-base", "alias": [ - "deepseek-ai/DeepSeek-Coder-V2-Base", - "deepseek-ai/deepseek-coder-v2-base" + "deepseek-ai/DeepSeek-Coder-V2-Base" ], "max_tokens": 163840, "model_types": [ @@ -5875,8 +5776,7 @@ { "name": "deepseek-coder-v2-instruct", "alias": [ - "deepseek-ai/DeepSeek-Coder-V2-Instruct", - "deepseek-ai/deepseek-coder-v2-instruct" + "deepseek-ai/DeepSeek-Coder-V2-Instruct" ], "max_tokens": 163840, "model_types": [ @@ -5886,8 +5786,7 @@ { "name": "deepseek-coder-v2-lite-base", "alias": [ - "deepseek-ai/DeepSeek-Coder-V2-Lite-Base", - "deepseek-ai/deepseek-coder-v2-lite-base" + "deepseek-ai/DeepSeek-Coder-V2-Lite-Base" ], "max_tokens": 163840, "model_types": [ @@ -5897,8 +5796,7 @@ { "name": "deepseek-coder-v2-lite-instruct", "alias": [ - "deepseek-ai/DeepSeek-Coder-V2-Lite-Instruct", - "deepseek-ai/deepseek-coder-v2-lite-instruct" + "deepseek-ai/DeepSeek-Coder-V2-Lite-Instruct" ], "max_tokens": 163840, "model_types": [ @@ -5908,8 +5806,7 @@ { "name": "deepseek-v2-lite", "alias": [ - "deepseek-ai/DeepSeek-V2-Lite", - "deepseek-ai/deepseek-v2-lite" + "deepseek-ai/DeepSeek-V2-Lite" ], "max_tokens": 163840, "model_types": [ @@ -5919,8 +5816,7 @@ { "name": "deepseek-v2-lite-chat", "alias": [ - "deepseek-ai/DeepSeek-V2-Lite-Chat", - "deepseek-ai/deepseek-v2-lite-chat" + "deepseek-ai/DeepSeek-V2-Lite-Chat" ], "max_tokens": 163840, "model_types": [ @@ -5930,8 +5826,7 @@ { "name": "deepseek-v2-chat", "alias": [ - "deepseek-ai/DeepSeek-V2-Chat", - "deepseek-ai/deepseek-v2-chat" + "deepseek-ai/DeepSeek-V2-Chat" ], "max_tokens": 163840, "model_types": [ @@ -5941,8 +5836,7 @@ { "name": "deepseek-v2", "alias": [ - "deepseek-ai/DeepSeek-V2", - "deepseek-ai/deepseek-v2" + "deepseek-ai/DeepSeek-V2" ], "max_tokens": 163840, "model_types": [ @@ -6102,7 +5996,8 @@ { "name": "deepseek-coder-33b-instruct", "alias": [ - "deepseek-ai/deepseek-coder-33b-instruct" + "deepseek-ai/deepseek-coder-33b-instruct", + "Deepseek Coder 33B Instruct" ], "max_tokens": 16384, "model_types": [ @@ -6173,12 +6068,20 @@ "name": "minimax-m3", "max_tokens": 1024000, "model_types": [ - "chat" + "chat", + "vision", + "image2text" ], "thinking": { "default_value": true, "clear_thinking": true - } + }, + "alias": [ + "minimax/minimax-m3", + "MiniMaxAI/MiniMax-M3", + "MiniMax M3" + ], + "max_completion_tokens": 131072 }, { "name": "bge-m3", @@ -6188,12 +6091,14 @@ "max_tokens": 8192, "model_types": [ "embedding" - ] + ], + "max_dimension": 1024 }, { "name": "bge-reranker-v2-m3", "alias": [ - "baai/bge-reranker-v2-m3" + "baai/bge-reranker-v2-m3", + "Pro/BAAI/bge-reranker-v2-m3" ], "max_tokens": 1024, "model_types": [ @@ -6210,7 +6115,8 @@ "name": "qwen/qwen3.7-max", "alias": [ "qwen3.7-max", - "qwen3.7-max-latest" + "qwen3.7-max-latest", + "Qwen3.7 Max" ], "max_tokens": 1000000, "model_types": [ @@ -6219,7 +6125,8 @@ "thinking": { "default_value": true, "clear_thinking": true - } + }, + "max_completion_tokens": 65536 }, { "name": "qwen/qwen3.7-max-2026-06-08", @@ -6285,7 +6192,8 @@ { "name": "qwen/qwen3-max", "alias": [ - "qwen3-max" + "qwen3-max", + "Qwen3 Max" ], "max_tokens": 262144, "model_types": [ @@ -6294,7 +6202,8 @@ "thinking": { "default_value": true, "clear_thinking": true - } + }, + "max_completion_tokens": 65536 }, { "name": "qwen/qwen3-max-2026-01-23", @@ -6449,19 +6358,22 @@ { "name": "qwen/qwen3.6-plus", "alias": [ - "qwen3.6-plus" + "qwen3.6-plus", + "Qwen3.6 Plus" ], "max_tokens": 1000000, "model_types": [ "chat", "image2text", "vision", - "video_understanding" + "video_understanding", + "ocr" ], "thinking": { "default_value": true, "clear_thinking": true - } + }, + "max_completion_tokens": 65536 }, { "name": "qwen/qwen3.6-plus-2026-04-02", @@ -6497,7 +6409,8 @@ "thinking": { "default_value": true, "clear_thinking": true - } + }, + "max_completion_tokens": 65536 }, { "name": "qwen/qwen3.5-plus-2026-02-15", @@ -7016,7 +6929,8 @@ "chat", "image2text", "vision", - "video_understanding" + "video_understanding", + "ocr" ], "thinking": { "default_value": true, @@ -7064,7 +6978,8 @@ "chat", "image2text", "vision", - "video_understanding" + "video_understanding", + "video_generation" ], "thinking": { "default_value": true, @@ -8084,11 +7999,14 @@ { "name": "qwen/qwen-mt-plus", "alias": [ - "qwen-mt-plus" + "qwen-mt-plus", + "Qwen MT Plus" ], "model_types": [ "chat" - ] + ], + "max_tokens": 16384, + "max_completion_tokens": 8192 }, { "name": "qwen/qwen-mt-turbo", @@ -8126,17 +8044,22 @@ "chat", "image2text", "vision", - "video_understanding" + "video_understanding", + "text-to-image", + "image_generation" ] }, { "name": "qwen/qwen-image-2.0-pro", "alias": [ - "qwen-image-2.0-pro" + "qwen-image-2.0-pro", + "Qwen Image 2.0 Pro" ], "model_types": [ "text-to-image", - "image_generation" + "image_generation", + "image", + "image_edit" ] }, { @@ -8152,11 +8075,14 @@ { "name": "qwen/qwen-image-2.0", "alias": [ - "qwen-image-2.0" + "qwen-image-2.0", + "Qwen Image 2.0" ], "model_types": [ "text-to-image", - "image_generation" + "image_generation", + "image", + "image_edit" ] }, { @@ -8166,7 +8092,9 @@ ], "model_types": [ "text-to-image", - "image_generation" + "image_generation", + "image", + "image_edit" ] }, { @@ -8217,7 +8145,8 @@ "model_types": [ "image_edit", "image_generation", - "image_understanding" + "image_understanding", + "text-to-image" ] }, { @@ -8239,7 +8168,8 @@ "model_types": [ "image_edit", "image_generation", - "image_understanding" + "image_understanding", + "text-to-image" ] }, { @@ -8303,7 +8233,6 @@ { "name": "qwen/sae-res-qwen3.5-35b-a3b-base-w128k-l0_100", "alias": [ - "Qwen/SAE-Res-Qwen3.5-35B-A3B-Base-W128K-L0_100", "sae-res-qwen3.5-35b-a3b-base-w128k-l0_100" ], "model_types": [ @@ -8313,7 +8242,6 @@ { "name": "qwen/sae-res-qwen3.5-35b-a3b-base-w32k-l0_50", "alias": [ - "Qwen/SAE-Res-Qwen3.5-35B-A3B-Base-W32K-L0_50", "sae-res-qwen3.5-35b-a3b-base-w32k-l0_50" ], "model_types": [ @@ -8323,7 +8251,6 @@ { "name": "qwen/sae-res-qwen3-30b-a3b-base-w128k-l0_100", "alias": [ - "Qwen/SAE-Res-Qwen3-30B-A3B-Base-W128K-L0_100", "sae-res-qwen3-30b-a3b-base-w128k-l0_100" ], "model_types": [ @@ -8333,7 +8260,6 @@ { "name": "qwen/sae-res-qwen3-30b-a3b-base-w32k-l0_50", "alias": [ - "Qwen/SAE-Res-Qwen3-30B-A3B-Base-W32K-L0_50", "sae-res-qwen3-30b-a3b-base-w32k-l0_50" ], "model_types": [ @@ -8343,7 +8269,6 @@ { "name": "qwen/sae-res-qwen3.5-27b-w80k-l0_100", "alias": [ - "Qwen/SAE-Res-Qwen3.5-27B-W80K-L0_100", "sae-res-qwen3.5-27b-w80k-l0_100" ], "model_types": [ @@ -8353,7 +8278,6 @@ { "name": "qwen/sae-res-qwen3.5-27b-w80k-l0_50", "alias": [ - "Qwen/SAE-Res-Qwen3.5-27B-W80K-L0_50", "sae-res-qwen3.5-27b-w80k-l0_50" ], "model_types": [ @@ -8363,7 +8287,6 @@ { "name": "qwen/sae-res-qwen3.5-9b-base-w64k-l0_100", "alias": [ - "Qwen/SAE-Res-Qwen3.5-9B-Base-W64K-L0_100", "sae-res-qwen3.5-9b-base-w64k-l0_100" ], "model_types": [ @@ -8373,7 +8296,6 @@ { "name": "qwen/sae-res-qwen3.5-2b-base-w32k-l0_100", "alias": [ - "Qwen/SAE-Res-Qwen3.5-2B-Base-W32K-L0_100", "sae-res-qwen3.5-2b-base-w32k-l0_100" ], "model_types": [ @@ -8383,7 +8305,6 @@ { "name": "qwen/sae-res-qwen3.5-9b-base-w64k-l0_50", "alias": [ - "Qwen/SAE-Res-Qwen3.5-9B-Base-W64K-L0_50", "sae-res-qwen3.5-9b-base-w64k-l0_50" ], "model_types": [ @@ -8393,7 +8314,6 @@ { "name": "qwen/sae-res-qwen3.5-2b-base-w32k-l0_50", "alias": [ - "Qwen/SAE-Res-Qwen3.5-2B-Base-W32K-L0_50", "sae-res-qwen3.5-2b-base-w32k-l0_50" ], "model_types": [ @@ -8403,7 +8323,6 @@ { "name": "qwen/sae-res-qwen3-8b-base-w64k-l0_100", "alias": [ - "Qwen/SAE-Res-Qwen3-8B-Base-W64K-L0_100", "sae-res-qwen3-8b-base-w64k-l0_100" ], "model_types": [ @@ -8413,7 +8332,6 @@ { "name": "qwen/sae-res-qwen3-8b-base-w64k-l0_50", "alias": [ - "Qwen/SAE-Res-Qwen3-8B-Base-W64K-L0_50", "sae-res-qwen3-8b-base-w64k-l0_50" ], "model_types": [ @@ -8423,7 +8341,6 @@ { "name": "qwen/sae-res-qwen3-1.7b-base-w32k-l0_100", "alias": [ - "Qwen/SAE-Res-Qwen3-1.7B-Base-W32K-L0_100", "sae-res-qwen3-1.7b-base-w32k-l0_100" ], "model_types": [ @@ -8433,7 +8350,6 @@ { "name": "qwen/sae-res-qwen3-1.7b-base-w32k-l0_50", "alias": [ - "Qwen/SAE-Res-Qwen3-1.7B-Base-W32K-L0_50", "sae-res-qwen3-1.7b-base-w32k-l0_50" ], "model_types": [ @@ -8443,7 +8359,6 @@ { "name": "qwen/qwen3.6-27b-fp8", "alias": [ - "Qwen/Qwen3.6-27B-FP8", "qwen3.6-27b-fp8" ], "max_tokens": 262144, @@ -8461,7 +8376,6 @@ { "name": "qwen/qwen3.6-27b", "alias": [ - "Qwen/Qwen3.6-27B", "qwen3.6-27b", "qwen/qwen3.6-27b-20260422" ], @@ -8470,18 +8384,20 @@ "chat", "image2text", "vision", - "video_understanding" + "video_understanding", + "video_generation" ], "thinking": { "default_value": true, "clear_thinking": true - } + }, + "max_completion_tokens": 65536 }, { "name": "qwen/qwen3.6-35b-a3b-fp8", "alias": [ - "Qwen/Qwen3.6-35B-A3B-FP8", - "qwen3.6-35b-a3b-fp8" + "qwen3.6-35b-a3b-fp8", + "Qwen3.6 35B A3b Fp8" ], "max_tokens": 262144, "model_types": [ @@ -8498,7 +8414,6 @@ { "name": "qwen/qwen3.6-35b-a3b", "alias": [ - "Qwen/Qwen3.6-35B-A3B", "qwen3.6-35b-a3b", "qwen/qwen3.6-35b-a3b-20260415" ], @@ -8512,12 +8427,12 @@ "thinking": { "default_value": true, "clear_thinking": true - } + }, + "max_completion_tokens": 65536 }, { "name": "qwen/qwen3.5-35b-a3b-gptq-int4", "alias": [ - "Qwen/Qwen3.5-35B-A3B-GPTQ-Int4", "qwen3.5-35b-a3b-gptq-int4" ], "max_tokens": 262144, @@ -8535,7 +8450,6 @@ { "name": "qwen/qwen3.5-27b-gptq-int4", "alias": [ - "Qwen/Qwen3.5-27B-GPTQ-Int4", "qwen3.5-27b-gptq-int4" ], "max_tokens": 262144, @@ -8553,7 +8467,6 @@ { "name": "qwen/qwen3.5-397b-a17b-gptq-int4", "alias": [ - "Qwen/Qwen3.5-397B-A17B-GPTQ-Int4", "qwen3.5-397b-a17b-gptq-int4" ], "max_tokens": 262144, @@ -8571,7 +8484,6 @@ { "name": "qwen/qwen3.5-122b-a10b-gptq-int4", "alias": [ - "Qwen/Qwen3.5-122B-A10B-GPTQ-Int4", "qwen3.5-122b-a10b-gptq-int4" ], "max_tokens": 262144, @@ -8589,7 +8501,6 @@ { "name": "qwen/qwen3.5-0.8b-base", "alias": [ - "Qwen/Qwen3.5-0.8B-Base", "qwen3.5-0.8b-base" ], "max_tokens": 262144, @@ -8607,7 +8518,6 @@ { "name": "qwen/qwen3.5-2b-base", "alias": [ - "Qwen/Qwen3.5-2B-Base", "qwen3.5-2b-base" ], "max_tokens": 262144, @@ -8625,7 +8535,6 @@ { "name": "qwen/qwen3.5-0.8b", "alias": [ - "Qwen/Qwen3.5-0.8B", "qwen3.5-0.8b" ], "max_tokens": 262144, @@ -8643,7 +8552,6 @@ { "name": "qwen/qwen3.5-2b", "alias": [ - "Qwen/Qwen3.5-2B", "qwen3.5-2b" ], "max_tokens": 262144, @@ -8661,7 +8569,6 @@ { "name": "qwen/qwen3.5-4b", "alias": [ - "Qwen/Qwen3.5-4B", "qwen3.5-4b" ], "max_tokens": 262144, @@ -8679,7 +8586,6 @@ { "name": "qwen/qwen3.5-4b-base", "alias": [ - "Qwen/Qwen3.5-4B-Base", "qwen3.5-4b-base" ], "max_tokens": 262144, @@ -8697,9 +8603,9 @@ { "name": "qwen/qwen3.5-9b", "alias": [ - "Qwen/Qwen3.5-9B", "qwen3.5-9b", - "qwen/qwen3.5-9b-20260310" + "qwen/qwen3.5-9b-20260310", + "Qwen3.5 9B FP8" ], "max_tokens": 262144, "model_types": [ @@ -8716,7 +8622,6 @@ { "name": "qwen/qwen3.5-9b-base", "alias": [ - "Qwen/Qwen3.5-9B-Base", "qwen3.5-9b-base" ], "max_tokens": 262144, @@ -8734,7 +8639,6 @@ { "name": "qwen/qwen3.5-35b-a3b-fp8", "alias": [ - "Qwen/Qwen3.5-35B-A3B-FP8", "qwen3.5-35b-a3b-fp8" ], "max_tokens": 262144, @@ -8752,7 +8656,6 @@ { "name": "qwen/qwen3.5-27b-fp8", "alias": [ - "Qwen/Qwen3.5-27B-FP8", "qwen3.5-27b-fp8" ], "max_tokens": 262144, @@ -8770,8 +8673,8 @@ { "name": "qwen/qwen3.5-122b-a10b-fp8", "alias": [ - "Qwen/Qwen3.5-122B-A10B-FP8", - "qwen3.5-122b-a10b-fp8" + "qwen3.5-122b-a10b-fp8", + "Qwen3.5 122B A10b Fp8" ], "max_tokens": 262144, "model_types": [ @@ -8788,7 +8691,6 @@ { "name": "qwen/qwen3.5-122b-a10b", "alias": [ - "Qwen/Qwen3.5-122B-A10B", "qwen3.5-122b-a10b", "qwen/qwen3.5-122b-a10b-20260224" ], @@ -8802,12 +8704,12 @@ "thinking": { "default_value": true, "clear_thinking": true - } + }, + "max_completion_tokens": 65536 }, { "name": "qwen/qwen3.5-35b-a3b-base", "alias": [ - "Qwen/Qwen3.5-35B-A3B-Base", "qwen3.5-35b-a3b-base" ], "max_tokens": 262144, @@ -8825,7 +8727,6 @@ { "name": "qwen/qwen3.5-27b", "alias": [ - "Qwen/Qwen3.5-27B", "qwen3.5-27b", "qwen/qwen3.5-27b-20260224" ], @@ -8839,14 +8740,15 @@ "thinking": { "default_value": true, "clear_thinking": true - } + }, + "max_completion_tokens": 65536 }, { "name": "qwen/qwen3.5-35b-a3b", "alias": [ - "Qwen/Qwen3.5-35B-A3B", "qwen3.5-35b-a3b", - "qwen/qwen3.5-35b-a3b-20260224" + "qwen/qwen3.5-35b-a3b-20260224", + "Qwen3.5 35B A3b" ], "max_tokens": 262144, "model_types": [ @@ -8858,12 +8760,12 @@ "thinking": { "default_value": true, "clear_thinking": true - } + }, + "max_completion_tokens": 65536 }, { "name": "qwen/qwen3.5-397b-a17b-fp8", "alias": [ - "Qwen/Qwen3.5-397B-A17B-FP8", "qwen3.5-397b-a17b-fp8" ], "max_tokens": 262144, @@ -8881,26 +8783,27 @@ { "name": "qwen/qwen3.5-397b-a17b", "alias": [ - "Qwen/Qwen3.5-397B-A17B", "qwen3.5-397b-a17b", - "qwen/qwen3.5-397b-a17b-20260216" + "qwen/qwen3.5-397b-a17b-20260216", + "Qwen3.5 397B A17b" ], "max_tokens": 262144, "model_types": [ "chat", "image2text", "vision", - "video_understanding" + "video_understanding", + "video_generation" ], "thinking": { "default_value": true, "clear_thinking": true - } + }, + "max_completion_tokens": 65536 }, { "name": "qwen/webworld-32b", "alias": [ - "Qwen/WebWorld-32B", "webworld-32b" ], "max_tokens": 40960, @@ -8911,7 +8814,6 @@ { "name": "qwen/webworld-14b", "alias": [ - "Qwen/WebWorld-14B", "webworld-14b" ], "max_tokens": 40960, @@ -8922,7 +8824,6 @@ { "name": "qwen/webworld-8b", "alias": [ - "Qwen/WebWorld-8B", "webworld-8b" ], "max_tokens": 40960, @@ -8933,7 +8834,6 @@ { "name": "qwen/qwen3-coder-next-gguf", "alias": [ - "Qwen/Qwen3-Coder-Next-GGUF", "qwen3-coder-next-gguf" ], "model_types": [ @@ -8944,7 +8844,6 @@ { "name": "qwen/qwen3-coder-next-base", "alias": [ - "Qwen/Qwen3-Coder-Next-Base", "qwen3-coder-next-base" ], "max_tokens": 262144, @@ -8955,8 +8854,8 @@ { "name": "qwen/qwen3-coder-next-fp8", "alias": [ - "Qwen/Qwen3-Coder-Next-FP8", - "qwen3-coder-next-fp8" + "qwen3-coder-next-fp8", + "Qwen3 Coder Next Fp8" ], "max_tokens": 262144, "model_types": [ @@ -8966,19 +8865,19 @@ { "name": "qwen/qwen3-coder-next", "alias": [ - "Qwen/Qwen3-Coder-Next", "qwen3-coder-next", - "qwen/qwen3-coder-next-2025-02-03" + "qwen/qwen3-coder-next-2025-02-03", + "Qwen3 Coder Next" ], "max_tokens": 262144, "model_types": [ "chat" - ] + ], + "max_completion_tokens": 65536 }, { "name": "qwen/qwen3-forcedaligner-0.6b", "alias": [ - "Qwen/Qwen3-ForcedAligner-0.6B", "qwen3-forcedaligner-0.6b" ], "max_tokens": 8192, @@ -8989,7 +8888,6 @@ { "name": "qwen/qwen3-asr-1.7b", "alias": [ - "Qwen/Qwen3-ASR-1.7B", "qwen3-asr-1.7b" ], "max_tokens": 65536, @@ -9000,7 +8898,6 @@ { "name": "qwen/qwen3-asr-0.6b", "alias": [ - "Qwen/Qwen3-ASR-0.6B", "qwen3-asr-0.6b" ], "max_tokens": 65536, @@ -9011,7 +8908,6 @@ { "name": "qwen/qwen3-tts-12hz-0.6b-base", "alias": [ - "Qwen/Qwen3-TTS-12Hz-0.6B-Base", "qwen3-tts-12hz-0.6b-base" ], "max_tokens": 65536, @@ -9022,7 +8918,6 @@ { "name": "qwen/qwen3-tts-12hz-0.6b-customvoice", "alias": [ - "Qwen/Qwen3-TTS-12Hz-0.6B-CustomVoice", "qwen3-tts-12hz-0.6b-customvoice" ], "max_tokens": 65536, @@ -9033,7 +8928,6 @@ { "name": "qwen/qwen3-tts-12hz-1.7b-base", "alias": [ - "Qwen/Qwen3-TTS-12Hz-1.7B-Base", "qwen3-tts-12hz-1.7b-base" ], "max_tokens": 65536, @@ -9044,7 +8938,6 @@ { "name": "qwen/qwen3-tts-12hz-1.7b-customvoice", "alias": [ - "Qwen/Qwen3-TTS-12Hz-1.7B-CustomVoice", "qwen3-tts-12hz-1.7b-customvoice" ], "max_tokens": 65536, @@ -9055,7 +8948,6 @@ { "name": "qwen/qwen3-tts-tokenizer-12hz", "alias": [ - "Qwen/Qwen3-TTS-Tokenizer-12Hz", "qwen3-tts-tokenizer-12hz" ], "max_tokens": 8000, @@ -9066,7 +8958,6 @@ { "name": "qwen/qwen3-tts-12hz-1.7b-voicedesign", "alias": [ - "Qwen/Qwen3-TTS-12Hz-1.7B-VoiceDesign", "qwen3-tts-12hz-1.7b-voicedesign" ], "max_tokens": 65536, @@ -9077,7 +8968,6 @@ { "name": "qwen/qwen3-vl-reranker-8b", "alias": [ - "Qwen/Qwen3-VL-Reranker-8B", "qwen3-vl-reranker-8b" ], "max_tokens": 32768, @@ -9088,7 +8978,6 @@ { "name": "qwen/qwen3-vl-reranker-2b", "alias": [ - "Qwen/Qwen3-VL-Reranker-2B", "qwen3-vl-reranker-2b" ], "max_tokens": 32768, @@ -9099,7 +8988,6 @@ { "name": "qwen/qwen3-vl-embedding-2b", "alias": [ - "Qwen/Qwen3-VL-Embedding-2B", "qwen3-vl-embedding-2b" ], "max_tokens": 32768, @@ -9111,7 +8999,6 @@ { "name": "qwen/qwen3-vl-embedding-8b", "alias": [ - "Qwen/Qwen3-VL-Embedding-8B", "qwen3-vl-embedding-8b" ], "max_tokens": 32768, @@ -9123,7 +9010,6 @@ { "name": "qwen/qwen-image-2512", "alias": [ - "Qwen/Qwen-Image-2512", "qwen-image-2512" ], "model_types": [ @@ -9136,7 +9022,6 @@ { "name": "qwen/qwen-image-layered", "alias": [ - "Qwen/Qwen-Image-Layered", "qwen-image-layered" ], "model_types": [ @@ -9148,7 +9033,6 @@ { "name": "qwen/qwen-image-edit-2511", "alias": [ - "Qwen/Qwen-Image-Edit-2511", "qwen-image-edit-2511" ], "model_types": [ @@ -9160,7 +9044,6 @@ { "name": "qwen/qwen3-next-80b-a3b-thinking-gguf", "alias": [ - "Qwen/Qwen3-Next-80B-A3B-Thinking-GGUF", "qwen3-next-80b-a3b-thinking-gguf" ], "model_types": [ @@ -9174,7 +9057,6 @@ { "name": "qwen/qwen3-next-80b-a3b-instruct-gguf", "alias": [ - "Qwen/Qwen3-Next-80B-A3B-Instruct-GGUF", "qwen3-next-80b-a3b-instruct-gguf" ], "model_types": [ @@ -9184,7 +9066,6 @@ { "name": "qwen/qwen3-vl-235b-a22b-thinking-gguf", "alias": [ - "Qwen/Qwen3-VL-235B-A22B-Thinking-GGUF", "qwen3-vl-235b-a22b-thinking-gguf" ], "model_types": [ @@ -9199,7 +9080,6 @@ { "name": "qwen/qwen3-vl-30b-a3b-thinking-gguf", "alias": [ - "Qwen/Qwen3-VL-30B-A3B-Thinking-GGUF", "qwen3-vl-30b-a3b-thinking-gguf" ], "model_types": [ @@ -9214,7 +9094,6 @@ { "name": "qwen/qwen3-vl-235b-a22b-instruct-gguf", "alias": [ - "Qwen/Qwen3-VL-235B-A22B-Instruct-GGUF", "qwen3-vl-235b-a22b-instruct-gguf" ], "model_types": [ @@ -9229,7 +9108,6 @@ { "name": "qwen/qwen3-vl-30b-a3b-instruct-gguf", "alias": [ - "Qwen/Qwen3-VL-30B-A3B-Instruct-GGUF", "qwen3-vl-30b-a3b-instruct-gguf" ], "model_types": [ @@ -9244,7 +9122,6 @@ { "name": "qwen/qwen3-vl-2b-thinking-gguf", "alias": [ - "Qwen/Qwen3-VL-2B-Thinking-GGUF", "qwen3-vl-2b-thinking-gguf" ], "model_types": [ @@ -9259,7 +9136,6 @@ { "name": "qwen/qwen3-vl-4b-thinking-gguf", "alias": [ - "Qwen/Qwen3-VL-4B-Thinking-GGUF", "qwen3-vl-4b-thinking-gguf" ], "model_types": [ @@ -9274,7 +9150,6 @@ { "name": "qwen/qwen3-vl-8b-thinking-gguf", "alias": [ - "Qwen/Qwen3-VL-8B-Thinking-GGUF", "qwen3-vl-8b-thinking-gguf" ], "model_types": [ @@ -9289,7 +9164,6 @@ { "name": "qwen/qwen3-vl-32b-thinking-gguf", "alias": [ - "Qwen/Qwen3-VL-32B-Thinking-GGUF", "qwen3-vl-32b-thinking-gguf" ], "model_types": [ @@ -9304,7 +9178,6 @@ { "name": "qwen/qwen3-vl-32b-instruct-gguf", "alias": [ - "Qwen/Qwen3-VL-32B-Instruct-GGUF", "qwen3-vl-32b-instruct-gguf" ], "model_types": [ @@ -9319,7 +9192,6 @@ { "name": "qwen/qwen3-vl-8b-instruct-gguf", "alias": [ - "Qwen/Qwen3-VL-8B-Instruct-GGUF", "qwen3-vl-8b-instruct-gguf" ], "model_types": [ @@ -9334,7 +9206,6 @@ { "name": "qwen/qwen3-vl-4b-instruct-gguf", "alias": [ - "Qwen/Qwen3-VL-4B-Instruct-GGUF", "qwen3-vl-4b-instruct-gguf" ], "model_types": [ @@ -9349,7 +9220,6 @@ { "name": "qwen/qwen3-vl-2b-instruct-gguf", "alias": [ - "Qwen/Qwen3-VL-2B-Instruct-GGUF", "qwen3-vl-2b-instruct-gguf" ], "model_types": [ @@ -9364,7 +9234,6 @@ { "name": "qwen/qwen3-vl-2b-thinking-fp8", "alias": [ - "Qwen/Qwen3-VL-2B-Thinking-FP8", "qwen3-vl-2b-thinking-fp8" ], "max_tokens": 262144, @@ -9379,7 +9248,6 @@ { "name": "qwen/qwen3-vl-2b-thinking", "alias": [ - "Qwen/Qwen3-VL-2B-Thinking", "qwen3-vl-2b-thinking" ], "max_tokens": 262144, @@ -9394,7 +9262,6 @@ { "name": "qwen/qwen3-vl-2b-instruct-fp8", "alias": [ - "Qwen/Qwen3-VL-2B-Instruct-FP8", "qwen3-vl-2b-instruct-fp8" ], "max_tokens": 262144, @@ -9409,7 +9276,6 @@ { "name": "qwen/qwen3-vl-2b-instruct", "alias": [ - "Qwen/Qwen3-VL-2B-Instruct", "qwen3-vl-2b-instruct" ], "max_tokens": 262144, @@ -9424,7 +9290,6 @@ { "name": "qwen/qwen3-vl-32b-instruct-fp8", "alias": [ - "Qwen/Qwen3-VL-32B-Instruct-FP8", "qwen3-vl-32b-instruct-fp8" ], "max_tokens": 262144, @@ -9439,7 +9304,6 @@ { "name": "qwen/qwen3-vl-32b-thinking-fp8", "alias": [ - "Qwen/Qwen3-VL-32B-Thinking-FP8", "qwen3-vl-32b-thinking-fp8" ], "max_tokens": 262144, @@ -9454,12 +9318,12 @@ { "name": "qwen/qwen3-vl-32b-thinking", "alias": [ - "Qwen/Qwen3-VL-32B-Thinking", "qwen3-vl-32b-thinking" ], "max_tokens": 262144, "model_types": [ - "chat" + "chat", + "video_generation" ], "thinking": { "default_value": true, @@ -9469,12 +9333,13 @@ { "name": "qwen/qwen3-vl-32b-instruct", "alias": [ - "Qwen/Qwen3-VL-32B-Instruct", "qwen3-vl-32b-instruct" ], "max_tokens": 262144, "model_types": [ - "chat" + "chat", + "vision", + "image2text" ], "thinking": { "default_value": true, @@ -9484,7 +9349,6 @@ { "name": "qwen/qwen3-vl-8b-instruct-fp8", "alias": [ - "Qwen/Qwen3-VL-8B-Instruct-FP8", "qwen3-vl-8b-instruct-fp8" ], "max_tokens": 262144, @@ -9499,7 +9363,6 @@ { "name": "qwen/qwen3-vl-8b-thinking-fp8", "alias": [ - "Qwen/Qwen3-VL-8B-Thinking-FP8", "qwen3-vl-8b-thinking-fp8" ], "max_tokens": 262144, @@ -9514,7 +9377,6 @@ { "name": "qwen/qwen3-vl-4b-thinking-fp8", "alias": [ - "Qwen/Qwen3-VL-4B-Thinking-FP8", "qwen3-vl-4b-thinking-fp8" ], "max_tokens": 262144, @@ -9529,7 +9391,6 @@ { "name": "qwen/qwen3-vl-4b-instruct-fp8", "alias": [ - "Qwen/Qwen3-VL-4B-Instruct-FP8", "qwen3-vl-4b-instruct-fp8" ], "max_tokens": 262144, @@ -9544,12 +9405,14 @@ { "name": "qwen/qwen3-vl-8b-thinking", "alias": [ - "Qwen/Qwen3-VL-8B-Thinking", "qwen3-vl-8b-thinking" ], "max_tokens": 262144, "model_types": [ - "chat" + "chat", + "image2text", + "vision", + "video_generation" ], "thinking": { "default_value": true, @@ -9559,12 +9422,13 @@ { "name": "qwen/qwen3-vl-4b-thinking", "alias": [ - "Qwen/Qwen3-VL-4B-Thinking", "qwen3-vl-4b-thinking" ], "max_tokens": 262144, "model_types": [ - "chat" + "chat", + "image2text", + "vision" ], "thinking": { "default_value": true, @@ -9574,27 +9438,31 @@ { "name": "qwen/qwen3-vl-8b-instruct", "alias": [ - "Qwen/Qwen3-VL-8B-Instruct", "qwen3-vl-8b-instruct" ], "max_tokens": 262144, "model_types": [ - "chat" + "chat", + "image2text", + "vision", + "video_generation" ], "thinking": { "default_value": true, "clear_thinking": true - } + }, + "max_completion_tokens": 32768 }, { "name": "qwen/qwen3-vl-4b-instruct", "alias": [ - "Qwen/Qwen3-VL-4B-Instruct", "qwen3-vl-4b-instruct" ], "max_tokens": 262144, "model_types": [ - "chat" + "chat", + "image2text", + "vision" ], "thinking": { "default_value": true, @@ -9604,7 +9472,6 @@ { "name": "qwen/qwen3-vl-30b-a3b-thinking-fp8", "alias": [ - "Qwen/Qwen3-VL-30B-A3B-Thinking-FP8", "qwen3-vl-30b-a3b-thinking-fp8" ], "max_tokens": 262144, @@ -9619,7 +9486,6 @@ { "name": "qwen/qwen3-vl-30b-a3b-instruct-fp8", "alias": [ - "Qwen/Qwen3-VL-30B-A3B-Instruct-FP8", "qwen3-vl-30b-a3b-instruct-fp8" ], "max_tokens": 262144, @@ -9634,7 +9500,6 @@ { "name": "qwen/qwen3-vl-235b-a22b-thinking-fp8", "alias": [ - "Qwen/Qwen3-VL-235B-A22B-Thinking-FP8", "qwen3-vl-235b-a22b-thinking-fp8" ], "max_tokens": 262144, @@ -9649,12 +9514,13 @@ { "name": "qwen/qwen3-vl-235b-a22b-instruct-fp8", "alias": [ - "Qwen/Qwen3-VL-235B-A22B-Instruct-FP8", "qwen3-vl-235b-a22b-instruct-fp8" ], "max_tokens": 262144, "model_types": [ - "chat" + "chat", + "vision", + "image2text" ], "thinking": { "default_value": true, @@ -9664,37 +9530,43 @@ { "name": "qwen/qwen3-vl-30b-a3b-thinking", "alias": [ - "Qwen/Qwen3-VL-30B-A3B-Thinking", "qwen3-vl-30b-a3b-thinking" ], "max_tokens": 262144, "model_types": [ - "chat" + "chat", + "image2text", + "vision", + "video_generation" ], "thinking": { "default_value": true, "clear_thinking": true - } + }, + "max_completion_tokens": 32768 }, { "name": "qwen/qwen3-vl-30b-a3b-instruct", "alias": [ - "Qwen/Qwen3-VL-30B-A3B-Instruct", "qwen3-vl-30b-a3b-instruct" ], "max_tokens": 262144, "model_types": [ - "chat" + "chat", + "image2text", + "vision", + "ocr", + "video_generation" ], "thinking": { "default_value": true, "clear_thinking": true - } + }, + "max_completion_tokens": 32768 }, { "name": "qwen/qwen3-4b-saferl", "alias": [ - "Qwen/Qwen3-4B-SafeRL", "qwen3-4b-saferl" ], "max_tokens": 40960, @@ -9705,7 +9577,6 @@ { "name": "qwen/qwen3guard-stream-8b", "alias": [ - "Qwen/Qwen3Guard-Stream-8B", "qwen3guard-stream-8b" ], "max_tokens": 8192, @@ -9716,7 +9587,6 @@ { "name": "qwen/qwen3guard-stream-4b", "alias": [ - "Qwen/Qwen3Guard-Stream-4B", "qwen3guard-stream-4b" ], "max_tokens": 8192, @@ -9727,7 +9597,6 @@ { "name": "qwen/qwen3guard-stream-0.6b", "alias": [ - "Qwen/Qwen3Guard-Stream-0.6B", "qwen3guard-stream-0.6b" ], "max_tokens": 8192, @@ -9738,7 +9607,6 @@ { "name": "qwen/qwen3guard-gen-8b", "alias": [ - "Qwen/Qwen3Guard-Gen-8B", "qwen3guard-gen-8b" ], "max_tokens": 32768, @@ -9749,7 +9617,6 @@ { "name": "qwen/qwen3guard-gen-4b", "alias": [ - "Qwen/Qwen3Guard-Gen-4B", "qwen3guard-gen-4b" ], "max_tokens": 32768, @@ -9760,7 +9627,6 @@ { "name": "qwen/qwen3guard-gen-0.6b", "alias": [ - "Qwen/Qwen3Guard-Gen-0.6B", "qwen3guard-gen-0.6b" ], "max_tokens": 32768, @@ -9771,49 +9637,55 @@ { "name": "qwen/qwen-image-edit-2509", "alias": [ - "Qwen/Qwen-Image-Edit-2509", "qwen-image-edit-2509" ], "model_types": [ "image_edit", "image_generation", - "image_understanding" + "image_understanding", + "image" ] }, { "name": "qwen/qwen3-vl-235b-a22b-thinking", "alias": [ - "Qwen/Qwen3-VL-235B-A22B-Thinking", - "qwen3-vl-235b-a22b-thinking" + "qwen3-vl-235b-a22b-thinking", + "Qwen3 VL 235B A22B Thinking" ], "max_tokens": 262144, "model_types": [ - "chat" + "chat", + "image2text", + "vision" ], "thinking": { "default_value": true, "clear_thinking": true - } + }, + "max_completion_tokens": 32768 }, { "name": "qwen/qwen3-vl-235b-a22b-instruct", "alias": [ - "Qwen/Qwen3-VL-235B-A22B-Instruct", - "qwen3-vl-235b-a22b-instruct" + "qwen3-vl-235b-a22b-instruct", + "Qwen3 VL 235B A22B Instruct" ], "max_tokens": 262144, "model_types": [ - "chat" + "chat", + "image2text", + "vision", + "ocr" ], "thinking": { "default_value": true, "clear_thinking": true - } + }, + "max_completion_tokens": 32768 }, { "name": "qwen/qwen3-next-80b-a3b-thinking-fp8", "alias": [ - "Qwen/Qwen3-Next-80B-A3B-Thinking-FP8", "qwen3-next-80b-a3b-thinking-fp8" ], "max_tokens": 262144, @@ -9828,8 +9700,8 @@ { "name": "qwen/qwen3-next-80b-a3b-instruct-fp8", "alias": [ - "Qwen/Qwen3-Next-80B-A3B-Instruct-FP8", - "qwen3-next-80b-a3b-instruct-fp8" + "qwen3-next-80b-a3b-instruct-fp8", + "Qwen3 Next 80B A3b Instruct Fp8" ], "max_tokens": 262144, "model_types": [ @@ -9839,8 +9711,8 @@ { "name": "qwen/qwen3-omni-30b-a3b-instruct", "alias": [ - "Qwen/Qwen3-Omni-30B-A3B-Instruct", - "qwen3-omni-30b-a3b-instruct" + "qwen3-omni-30b-a3b-instruct", + "Qwen3 Omni 30B A3B Instruct" ], "max_tokens": 65536, "model_types": [ @@ -9853,13 +9725,14 @@ "speech2text", "audio_understanding", "tts" - ] + ], + "max_completion_tokens": 16384 }, { "name": "qwen/qwen3-omni-30b-a3b-thinking", "alias": [ - "Qwen/Qwen3-Omni-30B-A3B-Thinking", - "qwen3-omni-30b-a3b-thinking" + "qwen3-omni-30b-a3b-thinking", + "Qwen3 Omni 30B A3B Thinking" ], "max_tokens": 65536, "model_types": [ @@ -9875,12 +9748,12 @@ "thinking": { "default_value": true, "clear_thinking": true - } + }, + "max_completion_tokens": 16384 }, { "name": "qwen/qwen3-omni-30b-a3b-captioner", "alias": [ - "Qwen/Qwen3-Omni-30B-A3B-Captioner", "qwen3-omni-30b-a3b-captioner" ], "max_tokens": 65536, @@ -9888,15 +9761,16 @@ "audio_caption", "audio2text", "audio_understanding", - "caption" + "caption", + "chat" ] }, { "name": "qwen/qwen3-next-80b-a3b-thinking", "alias": [ - "Qwen/Qwen3-Next-80B-A3B-Thinking", "qwen3-next-80b-a3b-thinking", - "qwen/qwen3-next-80b-a3b-thinking-2509" + "qwen/qwen3-next-80b-a3b-thinking-2509", + "Qwen3 Next 80B A3B Thinking" ], "max_tokens": 262144, "model_types": [ @@ -9905,26 +9779,31 @@ "thinking": { "default_value": true, "clear_thinking": true - } + }, + "max_completion_tokens": 32768 }, { "name": "qwen/qwen3-next-80b-a3b-instruct", "alias": [ - "Qwen/Qwen3-Next-80B-A3B-Instruct", "qwen3-next-80b-a3b-instruct", "qwen/qwen3-next-80b-a3b-instruct-2509", "qwen/qwen3-next-80b-a3b-instruct-2509:free", - "qwen/qwen3-next-80b-a3b-instruct:free" + "qwen/qwen3-next-80b-a3b-instruct:free", + "Qwen3 Next 80B A3B Instruct" ], "max_tokens": 262144, "model_types": [ "chat" - ] + ], + "max_completion_tokens": 32768, + "thinking": { + "default_value": true, + "clear_thinking": true + } }, { "name": "qwen/qwen-image-bench", "alias": [ - "Qwen/Qwen-Image-Bench", "qwen-image-bench" ], "model_types": [ @@ -9937,19 +9816,18 @@ { "name": "qwen/qwen-image-edit", "alias": [ - "Qwen/Qwen-Image-Edit", "qwen-image-edit" ], "model_types": [ "image_edit", "image_generation", - "image_understanding" + "image_understanding", + "text-to-image" ] }, { "name": "qwen/qwen3-4b-instruct-2507-fp8", "alias": [ - "Qwen/Qwen3-4B-Instruct-2507-FP8", "qwen3-4b-instruct-2507-fp8" ], "max_tokens": 262144, @@ -9960,7 +9838,6 @@ { "name": "qwen/qwen3-4b-thinking-2507-fp8", "alias": [ - "Qwen/Qwen3-4B-Thinking-2507-FP8", "qwen3-4b-thinking-2507-fp8" ], "max_tokens": 262144, @@ -9975,7 +9852,6 @@ { "name": "qwen/qwen3-4b-thinking-2507", "alias": [ - "Qwen/Qwen3-4B-Thinking-2507", "qwen3-4b-thinking-2507" ], "max_tokens": 262144, @@ -9990,8 +9866,8 @@ { "name": "qwen/qwen3-4b-instruct-2507", "alias": [ - "Qwen/Qwen3-4B-Instruct-2507", - "qwen3-4b-instruct-2507" + "qwen3-4b-instruct-2507", + "Qwen3 4B Instruct 2507" ], "max_tokens": 262144, "model_types": [ @@ -10001,8 +9877,8 @@ { "name": "qwen/qwen-image", "alias": [ - "Qwen/Qwen-Image", - "qwen-image" + "qwen-image", + "Qwen Image" ], "model_types": [ "text-to-image", @@ -10014,7 +9890,6 @@ { "name": "qwen/qwen3-coder-30b-a3b-instruct-fp8", "alias": [ - "Qwen/Qwen3-Coder-30B-A3B-Instruct-FP8", "qwen3-coder-30b-a3b-instruct-fp8" ], "max_tokens": 262144, @@ -10025,18 +9900,18 @@ { "name": "qwen/qwen3-coder-30b-a3b-instruct", "alias": [ - "Qwen/Qwen3-Coder-30B-A3B-Instruct", - "qwen3-coder-30b-a3b-instruct" + "qwen3-coder-30b-a3b-instruct", + "Qwen3 Coder 30b A3B Instruct" ], "max_tokens": 262144, "model_types": [ "chat" - ] + ], + "max_completion_tokens": 32768 }, { "name": "qwen/qwen3-30b-a3b-thinking-2507-fp8", "alias": [ - "Qwen/Qwen3-30B-A3B-Thinking-2507-FP8", "qwen3-30b-a3b-thinking-2507-fp8" ], "max_tokens": 262144, @@ -10051,7 +9926,6 @@ { "name": "qwen/qwen3-30b-a3b-thinking-2507", "alias": [ - "Qwen/Qwen3-30B-A3B-Thinking-2507", "qwen3-30b-a3b-thinking-2507" ], "max_tokens": 262144, @@ -10066,7 +9940,6 @@ { "name": "qwen/qwen3-30b-a3b-instruct-2507-fp8", "alias": [ - "Qwen/Qwen3-30B-A3B-Instruct-2507-FP8", "qwen3-30b-a3b-instruct-2507-fp8" ], "max_tokens": 262144, @@ -10077,7 +9950,6 @@ { "name": "qwen/qwen3-30b-a3b-instruct-2507", "alias": [ - "Qwen/Qwen3-30B-A3B-Instruct-2507", "qwen3-30b-a3b-instruct-2507" ], "max_tokens": 262144, @@ -10088,7 +9960,6 @@ { "name": "qwen/qwen3-235b-a22b-thinking-2507-fp8", "alias": [ - "Qwen/Qwen3-235B-A22B-Thinking-2507-FP8", "qwen3-235b-a22b-thinking-2507-fp8" ], "max_tokens": 262144, @@ -10103,8 +9974,8 @@ { "name": "qwen/qwen3-235b-a22b-thinking-2507", "alias": [ - "Qwen/Qwen3-235B-A22B-Thinking-2507", - "qwen3-235b-a22b-thinking-2507" + "qwen3-235b-a22b-thinking-2507", + "Qwen3 235B A22b Thinking 2507" ], "max_tokens": 262144, "model_types": [ @@ -10113,13 +9984,14 @@ "thinking": { "default_value": true, "clear_thinking": true - } + }, + "max_completion_tokens": 32768 }, { "name": "qwen/qwen3-coder-480b-a35b-instruct-fp8", "alias": [ - "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8", - "qwen3-coder-480b-a35b-instruct-fp8" + "qwen3-coder-480b-a35b-instruct-fp8", + "Qwen3 Coder 480B A35B Instruct Fp8" ], "max_tokens": 262144, "model_types": [ @@ -10129,7 +10001,6 @@ { "name": "qwen/qwen3-coder-480b-a35b-instruct", "alias": [ - "Qwen/Qwen3-Coder-480B-A35B-Instruct", "qwen3-coder-480b-a35b-instruct", "qwen3-coder-480b", "qwen/qwen3-coder", @@ -10138,18 +10009,20 @@ "qwen/qwen3-coder-480b-a35b-07-25:free", "qwen/qwen3-coder-480b-a35b-instruct-maas", "qwen.qwen3-coder-480b-a35b-instruct", - "qwen.qwen3-coder-480b-a35b-v1:0" + "qwen.qwen3-coder-480b-a35b-v1:0", + "Qwen3 Coder 480B A35B Instruct" ], "max_tokens": 262144, "model_types": [ "chat" - ] + ], + "max_completion_tokens": 65536 }, { "name": "qwen/qwen3-235b-a22b-instruct-2507-fp8", "alias": [ - "Qwen/Qwen3-235B-A22B-Instruct-2507-FP8", - "qwen3-235b-a22b-instruct-2507-fp8" + "qwen3-235b-a22b-instruct-2507-fp8", + "Qwen3 235B A22b Instruct 2507 Fp8" ], "max_tokens": 262144, "model_types": [ @@ -10159,22 +10032,22 @@ { "name": "qwen/qwen3-235b-a22b-instruct-2507", "alias": [ - "Qwen/Qwen3-235B-A22B-Instruct-2507", "qwen3-235b-a22b-instruct-2507", "qwen/qwen3-235b-a22b-07-25", "qwen/qwen3-235b-a22b-2507", "qwen.qwen3-235b-a22b-2507", - "qwen.qwen3-235b-a22b-2507-v1:0" + "qwen.qwen3-235b-a22b-2507-v1:0", + "Qwen3 235B A22B Instruct 2507" ], "max_tokens": 262144, "model_types": [ "chat" - ] + ], + "max_completion_tokens": 16384 }, { "name": "qwen/qwen3-14b-mlx-bf16", "alias": [ - "Qwen/Qwen3-14B-MLX-bf16", "qwen3-14b-mlx-bf16" ], "max_tokens": 32768, @@ -10185,7 +10058,6 @@ { "name": "qwen/qwen3-235b-a22b-mlx-8bit", "alias": [ - "Qwen/Qwen3-235B-A22B-MLX-8bit", "qwen3-235b-a22b-mlx-8bit" ], "max_tokens": 32768, @@ -10196,7 +10068,6 @@ { "name": "qwen/qwen3-235b-a22b-mlx-6bit", "alias": [ - "Qwen/Qwen3-235B-A22B-MLX-6bit", "qwen3-235b-a22b-mlx-6bit" ], "max_tokens": 32768, @@ -10207,7 +10078,6 @@ { "name": "qwen/qwen3-235b-a22b-mlx-4bit", "alias": [ - "Qwen/Qwen3-235B-A22B-MLX-4bit", "qwen3-235b-a22b-mlx-4bit" ], "max_tokens": 32768, @@ -10218,7 +10088,6 @@ { "name": "qwen/qwen3-235b-a22b-mlx-bf16", "alias": [ - "Qwen/Qwen3-235B-A22B-MLX-bf16", "qwen3-235b-a22b-mlx-bf16" ], "max_tokens": 32768, @@ -10229,7 +10098,6 @@ { "name": "qwen/qwen3-30b-a3b-mlx-4bit", "alias": [ - "Qwen/Qwen3-30B-A3B-MLX-4bit", "qwen3-30b-a3b-mlx-4bit" ], "max_tokens": 32768, @@ -10240,7 +10108,6 @@ { "name": "qwen/qwen3-30b-a3b-mlx-6bit", "alias": [ - "Qwen/Qwen3-30B-A3B-MLX-6bit", "qwen3-30b-a3b-mlx-6bit" ], "max_tokens": 32768, @@ -10251,7 +10118,6 @@ { "name": "qwen/qwen3-30b-a3b-mlx-8bit", "alias": [ - "Qwen/Qwen3-30B-A3B-MLX-8bit", "qwen3-30b-a3b-mlx-8bit" ], "max_tokens": 32768, @@ -10262,7 +10128,6 @@ { "name": "qwen/qwen3-30b-a3b-mlx-bf16", "alias": [ - "Qwen/Qwen3-30B-A3B-MLX-bf16", "qwen3-30b-a3b-mlx-bf16" ], "max_tokens": 32768, @@ -10273,7 +10138,6 @@ { "name": "qwen/qwen3-32b-mlx-4bit", "alias": [ - "Qwen/Qwen3-32B-MLX-4bit", "qwen3-32b-mlx-4bit" ], "max_tokens": 32768, @@ -10284,7 +10148,6 @@ { "name": "qwen/qwen3-32b-mlx-6bit", "alias": [ - "Qwen/Qwen3-32B-MLX-6bit", "qwen3-32b-mlx-6bit" ], "max_tokens": 32768, @@ -10295,7 +10158,6 @@ { "name": "qwen/qwen3-32b-mlx-8bit", "alias": [ - "Qwen/Qwen3-32B-MLX-8bit", "qwen3-32b-mlx-8bit" ], "max_tokens": 32768, @@ -10306,7 +10168,6 @@ { "name": "qwen/qwen3-32b-mlx-bf16", "alias": [ - "Qwen/Qwen3-32B-MLX-bf16", "qwen3-32b-mlx-bf16" ], "max_tokens": 32768, @@ -10317,7 +10178,6 @@ { "name": "qwen/qwen3-embedding-0.6b-gguf", "alias": [ - "Qwen/Qwen3-Embedding-0.6B-GGUF", "qwen3-embedding-0.6b-gguf" ], "max_tokens": 32768, @@ -10329,7 +10189,6 @@ { "name": "qwen/qwen3-embedding-4b-gguf", "alias": [ - "Qwen/Qwen3-Embedding-4B-GGUF", "qwen3-embedding-4b-gguf" ], "max_tokens": 32768, @@ -10341,7 +10200,6 @@ { "name": "qwen/qwen3-embedding-8b-gguf", "alias": [ - "Qwen/Qwen3-Embedding-8B-GGUF", "qwen3-embedding-8b-gguf" ], "max_tokens": 32768, @@ -10353,9 +10211,7 @@ { "name": "qwen/qwen3-reranker-4b", "alias": [ - "Qwen/Qwen3-Reranker-4B", - "qwen3-reranker-4b", - "Qwen3-Reranker-4B" + "qwen3-reranker-4b" ], "max_tokens": 32768, "model_types": [ @@ -10365,9 +10221,7 @@ { "name": "qwen/qwen3-embedding-8b", "alias": [ - "Qwen/Qwen3-Embedding-8B", - "qwen3-embedding-8b", - "Qwen3-Embedding-8B" + "qwen3-embedding-8b" ], "max_tokens": 32768, "max_dimension": 4096, @@ -10378,9 +10232,7 @@ { "name": "qwen/qwen3-embedding-4b", "alias": [ - "Qwen/Qwen3-Embedding-4B", - "qwen3-embedding-4b", - "Qwen3-Embedding-4B" + "qwen3-embedding-4b" ], "max_tokens": 32768, "max_dimension": 2560, @@ -10391,9 +10243,7 @@ { "name": "qwen/qwen3-embedding-0.6b", "alias": [ - "Qwen/Qwen3-Embedding-0.6B", - "qwen3-embedding-0.6b", - "Qwen3-Embedding-0.6B" + "qwen3-embedding-0.6b" ], "max_tokens": 32768, "max_dimension": 1024, @@ -10404,9 +10254,7 @@ { "name": "qwen/qwen3-reranker-0.6b", "alias": [ - "Qwen/Qwen3-Reranker-0.6B", - "qwen3-reranker-0.6b", - "Qwen3-Reranker-0.6B" + "qwen3-reranker-0.6b" ], "max_tokens": 32768, "model_types": [ @@ -10416,9 +10264,7 @@ { "name": "qwen/qwen3-reranker-8b", "alias": [ - "Qwen/Qwen3-Reranker-8B", - "qwen3-reranker-8b", - "Qwen3-Reranker-8B" + "qwen3-reranker-8b" ], "max_tokens": 32768, "model_types": [ @@ -10428,7 +10274,6 @@ { "name": "qwen/qwen3-14b-mlx-4bit", "alias": [ - "Qwen/Qwen3-14B-MLX-4bit", "qwen3-14b-mlx-4bit" ], "max_tokens": 32768, @@ -10439,7 +10284,6 @@ { "name": "qwen/qwen3-4b-mlx-4bit", "alias": [ - "Qwen/Qwen3-4B-MLX-4bit", "qwen3-4b-mlx-4bit" ], "max_tokens": 32768, @@ -10450,7 +10294,6 @@ { "name": "qwen/qwen3-4b-mlx-6bit", "alias": [ - "Qwen/Qwen3-4B-MLX-6bit", "qwen3-4b-mlx-6bit" ], "max_tokens": 32768, @@ -10461,7 +10304,6 @@ { "name": "qwen/qwen3-14b-mlx-6bit", "alias": [ - "Qwen/Qwen3-14B-MLX-6bit", "qwen3-14b-mlx-6bit" ], "max_tokens": 32768, @@ -10472,7 +10314,6 @@ { "name": "qwen/qwen3-4b-mlx-8bit", "alias": [ - "Qwen/Qwen3-4B-MLX-8bit", "qwen3-4b-mlx-8bit" ], "max_tokens": 32768, @@ -10483,7 +10324,6 @@ { "name": "qwen/qwen3-14b-mlx-8bit", "alias": [ - "Qwen/Qwen3-14B-MLX-8bit", "qwen3-14b-mlx-8bit" ], "max_tokens": 32768, @@ -10494,7 +10334,6 @@ { "name": "qwen/qwen3-4b-mlx-bf16", "alias": [ - "Qwen/Qwen3-4B-MLX-bf16", "qwen3-4b-mlx-bf16" ], "max_tokens": 32768, @@ -10505,7 +10344,6 @@ { "name": "qwen/qwen3-8b-mlx-bf16", "alias": [ - "Qwen/Qwen3-8B-MLX-bf16", "qwen3-8b-mlx-bf16" ], "max_tokens": 32768, @@ -10516,7 +10354,6 @@ { "name": "qwen/qwen3-8b-mlx-8bit", "alias": [ - "Qwen/Qwen3-8B-MLX-8bit", "qwen3-8b-mlx-8bit" ], "max_tokens": 32768, @@ -10527,7 +10364,6 @@ { "name": "qwen/qwen3-8b-mlx-4bit", "alias": [ - "Qwen/Qwen3-8B-MLX-4bit", "qwen3-8b-mlx-4bit" ], "max_tokens": 32768, @@ -10538,7 +10374,6 @@ { "name": "qwen/qwen3-1.7b-mlx-4bit", "alias": [ - "Qwen/Qwen3-1.7B-MLX-4bit", "qwen3-1.7b-mlx-4bit" ], "max_tokens": 32768, @@ -10549,7 +10384,6 @@ { "name": "qwen/qwen3-1.7b-mlx-8bit", "alias": [ - "Qwen/Qwen3-1.7B-MLX-8bit", "qwen3-1.7b-mlx-8bit" ], "max_tokens": 32768, @@ -10560,7 +10394,6 @@ { "name": "qwen/qwen3-1.7b-mlx-6bit", "alias": [ - "Qwen/Qwen3-1.7B-MLX-6bit", "qwen3-1.7b-mlx-6bit" ], "max_tokens": 32768, @@ -10571,7 +10404,6 @@ { "name": "qwen/qwen3-8b-mlx-6bit", "alias": [ - "Qwen/Qwen3-8B-MLX-6bit", "qwen3-8b-mlx-6bit" ], "max_tokens": 32768, @@ -10582,7 +10414,6 @@ { "name": "qwen/qwen3-1.7b-mlx-bf16", "alias": [ - "Qwen/Qwen3-1.7B-MLX-bf16", "qwen3-1.7b-mlx-bf16" ], "max_tokens": 32768, @@ -10593,7 +10424,6 @@ { "name": "qwen/qwen3-0.6b-mlx-8bit", "alias": [ - "Qwen/Qwen3-0.6B-MLX-8bit", "qwen3-0.6b-mlx-8bit" ], "max_tokens": 32768, @@ -10604,7 +10434,6 @@ { "name": "qwen/qwen3-0.6b-mlx-bf16", "alias": [ - "Qwen/Qwen3-0.6B-MLX-bf16", "qwen3-0.6b-mlx-bf16" ], "max_tokens": 32768, @@ -10615,7 +10444,6 @@ { "name": "qwen/qwen3-0.6b-mlx-6bit", "alias": [ - "Qwen/Qwen3-0.6B-MLX-6bit", "qwen3-0.6b-mlx-6bit" ], "max_tokens": 32768, @@ -10626,7 +10454,6 @@ { "name": "qwen/qwen3-0.6b-mlx-4bit", "alias": [ - "Qwen/Qwen3-0.6B-MLX-4bit", "qwen3-0.6b-mlx-4bit" ], "max_tokens": 32768, @@ -10637,7 +10464,6 @@ { "name": "qwen/worldpm-72b-rlhflow", "alias": [ - "Qwen/WorldPM-72B-RLHFLow", "worldpm-72b-rlhflow" ], "model_types": [ @@ -10647,7 +10473,6 @@ { "name": "qwen/worldpm-72b-ultrafeedback", "alias": [ - "Qwen/WorldPM-72B-UltraFeedback", "worldpm-72b-ultrafeedback" ], "max_tokens": 2048, @@ -10658,7 +10483,6 @@ { "name": "qwen/worldpm-72b-helpsteer2", "alias": [ - "Qwen/WorldPM-72B-HelpSteer2", "worldpm-72b-helpsteer2" ], "max_tokens": 2048, @@ -10669,7 +10493,6 @@ { "name": "qwen/worldpm-72b", "alias": [ - "Qwen/WorldPM-72B", "worldpm-72b" ], "max_tokens": 2048, @@ -10680,7 +10503,6 @@ { "name": "qwen/qwen2.5-omni-7b-gptq-int4", "alias": [ - "Qwen/Qwen2.5-Omni-7B-GPTQ-Int4", "qwen2.5-omni-7b-gptq-int4" ], "max_tokens": 32768, @@ -10699,7 +10521,6 @@ { "name": "qwen/qwen2.5-omni-7b-awq", "alias": [ - "Qwen/Qwen2.5-Omni-7B-AWQ", "qwen2.5-omni-7b-awq" ], "max_tokens": 32768, @@ -10718,7 +10539,6 @@ { "name": "qwen/qwen3-235b-a22b-gguf", "alias": [ - "Qwen/Qwen3-235B-A22B-GGUF", "qwen3-235b-a22b-gguf" ], "model_types": [ @@ -10729,7 +10549,6 @@ { "name": "qwen/qwen3-235b-a22b-gptq-int4", "alias": [ - "Qwen/Qwen3-235B-A22B-GPTQ-Int4", "qwen3-235b-a22b-gptq-int4" ], "max_tokens": 32768, @@ -10740,7 +10559,6 @@ { "name": "qwen/qwen3-0.6b-gptq-int8", "alias": [ - "Qwen/Qwen3-0.6B-GPTQ-Int8", "qwen3-0.6b-gptq-int8" ], "max_tokens": 32768, @@ -10751,7 +10569,6 @@ { "name": "qwen/qwen3-1.7b-gptq-int8", "alias": [ - "Qwen/Qwen3-1.7B-GPTQ-Int8", "qwen3-1.7b-gptq-int8" ], "max_tokens": 32768, @@ -10762,7 +10579,6 @@ { "name": "qwen/qwen3-4b-awq", "alias": [ - "Qwen/Qwen3-4B-AWQ", "qwen3-4b-awq" ], "max_tokens": 32768, @@ -10773,7 +10589,6 @@ { "name": "qwen/qwen3-0.6b-gguf", "alias": [ - "Qwen/Qwen3-0.6B-GGUF", "qwen3-0.6b-gguf" ], "model_types": [ @@ -10784,7 +10599,6 @@ { "name": "qwen/qwen3-1.7b-gguf", "alias": [ - "Qwen/Qwen3-1.7B-GGUF", "qwen3-1.7b-gguf" ], "model_types": [ @@ -10795,7 +10609,6 @@ { "name": "qwen/qwen3-30b-a3b-gptq-int4", "alias": [ - "Qwen/Qwen3-30B-A3B-GPTQ-Int4", "qwen3-30b-a3b-gptq-int4" ], "max_tokens": 32768, @@ -10806,7 +10619,6 @@ { "name": "qwen/qwen3-4b-gguf", "alias": [ - "Qwen/Qwen3-4B-GGUF", "qwen3-4b-gguf" ], "model_types": [ @@ -10817,7 +10629,6 @@ { "name": "qwen/qwen3-30b-a3b-gguf", "alias": [ - "Qwen/Qwen3-30B-A3B-GGUF", "qwen3-30b-a3b-gguf" ], "model_types": [ @@ -10828,7 +10639,6 @@ { "name": "qwen/qwen3-8b-gguf", "alias": [ - "Qwen/Qwen3-8B-GGUF", "qwen3-8b-gguf" ], "model_types": [ @@ -10839,7 +10649,6 @@ { "name": "qwen/qwen3-8b-awq", "alias": [ - "Qwen/Qwen3-8B-AWQ", "qwen3-8b-awq" ], "max_tokens": 32768, @@ -10850,7 +10659,6 @@ { "name": "qwen/qwen3-14b-awq", "alias": [ - "Qwen/Qwen3-14B-AWQ", "qwen3-14b-awq" ], "max_tokens": 32768, @@ -10861,7 +10669,6 @@ { "name": "qwen/qwen3-32b-awq", "alias": [ - "Qwen/Qwen3-32B-AWQ", "qwen3-32b-awq" ], "max_tokens": 32768, @@ -10872,7 +10679,6 @@ { "name": "qwen/qwen3-14b-gguf", "alias": [ - "Qwen/Qwen3-14B-GGUF", "qwen3-14b-gguf" ], "model_types": [ @@ -10883,7 +10689,6 @@ { "name": "qwen/qwen3-32b-gguf", "alias": [ - "Qwen/Qwen3-32B-GGUF", "qwen3-32b-gguf" ], "model_types": [ @@ -10894,7 +10699,6 @@ { "name": "qwen/qwen2.5-omni-3b", "alias": [ - "Qwen/Qwen2.5-Omni-3B", "qwen2.5-omni-3b" ], "max_tokens": 32768, @@ -10913,40 +10717,54 @@ { "name": "qwen/qwen3-235b-a22b-fp8", "alias": [ - "Qwen/Qwen3-235B-A22B-FP8", - "qwen3-235b-a22b-fp8" + "qwen3-235b-a22b-fp8", + "Qwen3 235B A22B" ], "max_tokens": 32768, "model_types": [ "chat" - ] + ], + "max_completion_tokens": 20000, + "thinking": { + "default_value": true, + "clear_thinking": true + } }, { "name": "qwen/qwen3-30b-a3b-fp8", "alias": [ - "Qwen/Qwen3-30B-A3B-FP8", - "qwen3-30b-a3b-fp8" + "qwen3-30b-a3b-fp8", + "Qwen3 30B A3B" ], "max_tokens": 32768, "model_types": [ "chat" - ] + ], + "max_completion_tokens": 20000, + "thinking": { + "default_value": true, + "clear_thinking": true + } }, { "name": "qwen/qwen3-32b-fp8", "alias": [ - "Qwen/Qwen3-32B-FP8", - "qwen3-32b-fp8" + "qwen3-32b-fp8", + "Qwen3 32B" ], "max_tokens": 32768, "model_types": [ "chat" - ] + ], + "max_completion_tokens": 20000, + "thinking": { + "default_value": true, + "clear_thinking": true + } }, { "name": "qwen/qwen3-14b-fp8", "alias": [ - "Qwen/Qwen3-14B-FP8", "qwen3-14b-fp8" ], "max_tokens": 32768, @@ -10957,29 +10775,34 @@ { "name": "qwen/qwen3-8b-fp8", "alias": [ - "Qwen/Qwen3-8B-FP8", - "qwen3-8b-fp8" + "qwen3-8b-fp8", + "Qwen3 8B" ], "max_tokens": 32768, "model_types": [ "chat" - ] + ], + "max_completion_tokens": 20000 }, { "name": "qwen/qwen3-4b-fp8", "alias": [ - "Qwen/Qwen3-4B-FP8", - "qwen3-4b-fp8" + "qwen3-4b-fp8", + "Qwen3 4B" ], "max_tokens": 32768, "model_types": [ "chat" - ] + ], + "max_completion_tokens": 8192, + "thinking": { + "default_value": true, + "clear_thinking": true + } }, { "name": "qwen/qwen3-1.7b-fp8", "alias": [ - "Qwen/Qwen3-1.7B-FP8", "qwen3-1.7b-fp8" ], "max_tokens": 32768, @@ -10990,7 +10813,6 @@ { "name": "qwen/qwen3-0.6b-fp8", "alias": [ - "Qwen/Qwen3-0.6B-FP8", "qwen3-0.6b-fp8" ], "max_tokens": 32768, @@ -11001,8 +10823,8 @@ { "name": "qwen/qwen3-0.6b-base", "alias": [ - "Qwen/Qwen3-0.6B-Base", - "qwen3-0.6b-base" + "qwen3-0.6b-base", + "Qwen3 0.6B Base" ], "max_tokens": 32768, "model_types": [ @@ -11012,8 +10834,8 @@ { "name": "qwen/qwen3-14b-base", "alias": [ - "Qwen/Qwen3-14B-Base", - "qwen3-14b-base" + "qwen3-14b-base", + "Qwen3 14B Base" ], "max_tokens": 32768, "model_types": [ @@ -11023,8 +10845,8 @@ { "name": "qwen/qwen3-1.7b-base", "alias": [ - "Qwen/Qwen3-1.7B-Base", - "qwen3-1.7b-base" + "qwen3-1.7b-base", + "Qwen3 1.7B Base" ], "max_tokens": 32768, "model_types": [ @@ -11034,8 +10856,8 @@ { "name": "qwen/qwen3-4b-base", "alias": [ - "Qwen/Qwen3-4B-Base", - "qwen3-4b-base" + "qwen3-4b-base", + "Qwen3 4B Base" ], "max_tokens": 32768, "model_types": [ @@ -11045,8 +10867,8 @@ { "name": "qwen/qwen3-8b-base", "alias": [ - "Qwen/Qwen3-8B-Base", - "qwen3-8b-base" + "qwen3-8b-base", + "Qwen3 8B Base" ], "max_tokens": 32768, "model_types": [ @@ -11056,8 +10878,8 @@ { "name": "qwen/qwen3-30b-a3b-base", "alias": [ - "Qwen/Qwen3-30B-A3B-Base", - "qwen3-30b-a3b-base" + "qwen3-30b-a3b-base", + "Qwen3 30B A3b Base" ], "max_tokens": 32768, "model_types": [ @@ -11067,9 +10889,7 @@ { "name": "qwen/qwen3-235b-a22b", "alias": [ - "Qwen/Qwen3-235B-A22B", - "qwen3-235b-a22b", - "Qwen3-235B-A22B" + "qwen3-235b-a22b" ], "max_tokens": 32768, "model_types": [ @@ -11079,23 +10899,21 @@ { "name": "qwen/qwen3-32b", "alias": [ - "Qwen/Qwen3-32B", "qwen3-32b", - "Qwen3-32B", "qwen.qwen3-32b", - "qwen.qwen3-32b-v1:0" + "qwen.qwen3-32b-v1:0", + "qwen3-32b-20250429" ], "max_tokens": 32768, "model_types": [ "chat" - ] + ], + "max_completion_tokens": 40960 }, { "name": "qwen/qwen3-30b-a3b", "alias": [ - "Qwen/Qwen3-30B-A3B", - "qwen3-30b-a3b", - "Qwen3-30B-A3B" + "qwen3-30b-a3b" ], "max_tokens": 32768, "model_types": [ @@ -11105,9 +10923,9 @@ { "name": "qwen/qwen3-14b", "alias": [ - "Qwen/Qwen3-14B", "qwen3-14b", - "Qwen3-14B" + "Qwen3 14B", + "qwen3-14b-20250429" ], "max_tokens": 32768, "model_types": [ @@ -11117,9 +10935,8 @@ { "name": "qwen/qwen3-8b", "alias": [ - "Qwen/Qwen3-8B", "qwen3-8b", - "Qwen3-8B" + "qwen3-8b-20250429" ], "max_tokens": 32768, "model_types": [ @@ -11129,9 +10946,7 @@ { "name": "qwen/qwen3-4b", "alias": [ - "Qwen/Qwen3-4B", - "qwen3-4b", - "Qwen3-4B" + "qwen3-4b" ], "max_tokens": 32768, "model_types": [ @@ -11141,8 +10956,8 @@ { "name": "qwen/qwen3-1.7b", "alias": [ - "Qwen/Qwen3-1.7B", - "qwen3-1.7b" + "qwen3-1.7b", + "Qwen3 1.7B" ], "max_tokens": 32768, "model_types": [ @@ -11152,9 +10967,8 @@ { "name": "qwen/qwen3-0.6b", "alias": [ - "Qwen/Qwen3-0.6B", "qwen3-0.6b", - "Qwen3-0.6B" + "Qwen3 0.6B" ], "max_tokens": 32768, "model_types": [ @@ -11164,7 +10978,6 @@ { "name": "qwen/qwen2.5-vl-32b-instruct-awq", "alias": [ - "Qwen/Qwen2.5-VL-32B-Instruct-AWQ", "qwen2.5-vl-32b-instruct-awq" ], "max_tokens": 128000, @@ -11175,7 +10988,6 @@ { "name": "qwen/qwen2.5-omni-7b", "alias": [ - "Qwen/Qwen2.5-Omni-7B", "qwen2.5-omni-7b" ], "max_tokens": 32768, @@ -11194,20 +11006,20 @@ { "name": "qwen/qwen2.5-vl-32b-instruct", "alias": [ - "Qwen/Qwen2.5-VL-32B-Instruct", "qwen2.5-vl-32b-instruct", - "Qwen2.5-VL-32B", - "Qwen2.5-VL-32B-Instruct" + "Qwen2.5-VL-32B" ], "max_tokens": 128000, "model_types": [ - "chat" + "chat", + "image2text", + "vision", + "ocr" ] }, { "name": "qwen/qwq-32b-gguf", "alias": [ - "Qwen/QwQ-32B-GGUF", "qwq-32b-gguf" ], "model_types": [ @@ -11222,9 +11034,8 @@ { "name": "qwen/qwq-32b", "alias": [ - "Qwen/QwQ-32B", "qwq-32b", - "QwQ-32B" + "Qwen QwQ-32B" ], "max_tokens": 131072, "model_types": [ @@ -11238,7 +11049,6 @@ { "name": "qwen/qwq-32b-awq", "alias": [ - "Qwen/QwQ-32B-AWQ", "qwq-32b-awq" ], "max_tokens": 131072, @@ -11253,7 +11063,6 @@ { "name": "qwen/qwen2.5-vl-7b-instruct-awq", "alias": [ - "Qwen/Qwen2.5-VL-7B-Instruct-AWQ", "qwen2.5-vl-7b-instruct-awq" ], "max_tokens": 128000, @@ -11264,7 +11073,6 @@ { "name": "qwen/qwen2.5-vl-72b-instruct-awq", "alias": [ - "Qwen/Qwen2.5-VL-72B-Instruct-AWQ", "qwen2.5-vl-72b-instruct-awq" ], "max_tokens": 128000, @@ -11275,7 +11083,6 @@ { "name": "qwen/qwen2.5-vl-3b-instruct-awq", "alias": [ - "Qwen/Qwen2.5-VL-3B-Instruct-AWQ", "qwen2.5-vl-3b-instruct-awq" ], "max_tokens": 128000, @@ -11286,23 +11093,26 @@ { "name": "qwen/qwen2.5-vl-72b-instruct", "alias": [ - "Qwen/Qwen2.5-VL-72B-Instruct", "qwen2.5-vl-72b-instruct", "qwen-2.5-vl-72b-instruct", "Qwen2.5-VL-72B", - "qwen2.5-vl-72b" + "Qwen2.5 VL 72B Instruct", + "Qwen2.5-VL (72B) Instruct" ], "max_tokens": 128000, "model_types": [ - "chat" - ] + "chat", + "vision", + "image2text" + ], + "max_completion_tokens": 32768 }, { "name": "qwen/qwen2.5-vl-7b-instruct", "alias": [ - "Qwen/Qwen2.5-VL-7B-Instruct", "qwen2.5-vl-7b-instruct", - "qwen-2.5-vl-7b-instruct" + "qwen-2.5-vl-7b-instruct", + "Qwen2.5-VL-7b" ], "max_tokens": 128000, "model_types": [ @@ -11312,8 +11122,8 @@ { "name": "qwen/qwen2.5-vl-3b-instruct", "alias": [ - "Qwen/Qwen2.5-VL-3B-Instruct", - "qwen2.5-vl-3b-instruct" + "qwen2.5-vl-3b-instruct", + "Qwen2.5-VL-3b" ], "max_tokens": 128000, "model_types": [ @@ -11323,7 +11133,6 @@ { "name": "qwen/qwen2.5-7b-instruct-1m", "alias": [ - "Qwen/Qwen2.5-7B-Instruct-1M", "qwen2.5-7b-instruct-1m" ], "max_tokens": 131072, @@ -11334,7 +11143,6 @@ { "name": "qwen/qwen2.5-14b-instruct-1m", "alias": [ - "Qwen/Qwen2.5-14B-Instruct-1M", "qwen2.5-14b-instruct-1m" ], "max_tokens": 131072, @@ -11345,7 +11153,6 @@ { "name": "qwen/qwen2.5-math-prm-7b", "alias": [ - "Qwen/Qwen2.5-Math-PRM-7B", "qwen2.5-math-prm-7b" ], "max_tokens": 4096, @@ -11356,7 +11163,6 @@ { "name": "qwen/qwen2.5-math-prm-72b", "alias": [ - "Qwen/Qwen2.5-Math-PRM-72B", "qwen2.5-math-prm-72b" ], "max_tokens": 4096, @@ -11367,7 +11173,6 @@ { "name": "qwen/qwen2.5-math-7b-prm800k", "alias": [ - "Qwen/Qwen2.5-Math-7B-PRM800K", "qwen2.5-math-7b-prm800k" ], "max_tokens": 4096, @@ -11378,18 +11183,18 @@ { "name": "qwen/qvq-72b-preview", "alias": [ - "Qwen/QVQ-72B-Preview", "qvq-72b-preview" ], "max_tokens": 128000, "model_types": [ - "chat" + "chat", + "image2text", + "vision" ] }, { "name": "qwen/qwen2-vl-72b", "alias": [ - "Qwen/Qwen2-VL-72B", "qwen2-vl-72b" ], "max_tokens": 32768, @@ -11400,7 +11205,6 @@ { "name": "qwen/qwq-32b-preview", "alias": [ - "Qwen/QwQ-32B-Preview", "qwq-32b-preview" ], "max_tokens": 32768, @@ -11415,7 +11219,6 @@ { "name": "qwen/qwen2.5-coder-0.5b-instruct-gguf", "alias": [ - "Qwen/Qwen2.5-Coder-0.5B-Instruct-GGUF", "qwen2.5-coder-0.5b-instruct-gguf" ], "model_types": [ @@ -11425,7 +11228,6 @@ { "name": "qwen/qwen2.5-coder-0.5b-instruct-awq", "alias": [ - "Qwen/Qwen2.5-Coder-0.5B-Instruct-AWQ", "qwen2.5-coder-0.5b-instruct-awq" ], "max_tokens": 32768, @@ -11436,7 +11238,6 @@ { "name": "qwen/qwen2.5-coder-3b-instruct-gguf", "alias": [ - "Qwen/Qwen2.5-Coder-3B-Instruct-GGUF", "qwen2.5-coder-3b-instruct-gguf" ], "model_types": [ @@ -11446,7 +11247,6 @@ { "name": "qwen/qwen2.5-coder-3b-instruct-awq", "alias": [ - "Qwen/Qwen2.5-Coder-3B-Instruct-AWQ", "qwen2.5-coder-3b-instruct-awq" ], "max_tokens": 32768, @@ -11457,7 +11257,6 @@ { "name": "qwen/qwen2.5-coder-14b-instruct-gguf", "alias": [ - "Qwen/Qwen2.5-Coder-14B-Instruct-GGUF", "qwen2.5-coder-14b-instruct-gguf" ], "model_types": [ @@ -11467,7 +11266,6 @@ { "name": "qwen/qwen2.5-coder-14b-instruct-awq", "alias": [ - "Qwen/Qwen2.5-Coder-14B-Instruct-AWQ", "qwen2.5-coder-14b-instruct-awq" ], "max_tokens": 32768, @@ -11478,7 +11276,6 @@ { "name": "qwen/qwen2.5-coder-32b-instruct-gguf", "alias": [ - "Qwen/Qwen2.5-Coder-32B-Instruct-GGUF", "qwen2.5-coder-32b-instruct-gguf" ], "model_types": [ @@ -11488,7 +11285,6 @@ { "name": "qwen/qwen2.5-coder-32b-instruct-awq", "alias": [ - "Qwen/Qwen2.5-Coder-32B-Instruct-AWQ", "qwen2.5-coder-32b-instruct-awq" ], "max_tokens": 32768, @@ -11499,7 +11295,6 @@ { "name": "qwen/qwen2.5-coder-32b-instruct-gptq-int4", "alias": [ - "Qwen/Qwen2.5-Coder-32B-Instruct-GPTQ-Int4", "qwen2.5-coder-32b-instruct-gptq-int4" ], "max_tokens": 32768, @@ -11510,7 +11305,6 @@ { "name": "qwen/qwen2.5-coder-32b-instruct-gptq-int8", "alias": [ - "Qwen/Qwen2.5-Coder-32B-Instruct-GPTQ-Int8", "qwen2.5-coder-32b-instruct-gptq-int8" ], "max_tokens": 32768, @@ -11521,7 +11315,6 @@ { "name": "qwen/qwen2.5-coder-14b-instruct-gptq-int4", "alias": [ - "Qwen/Qwen2.5-Coder-14B-Instruct-GPTQ-Int4", "qwen2.5-coder-14b-instruct-gptq-int4" ], "max_tokens": 32768, @@ -11532,7 +11325,6 @@ { "name": "qwen/qwen2.5-coder-14b-instruct-gptq-int8", "alias": [ - "Qwen/Qwen2.5-Coder-14B-Instruct-GPTQ-Int8", "qwen2.5-coder-14b-instruct-gptq-int8" ], "max_tokens": 32768, @@ -11543,7 +11335,6 @@ { "name": "qwen/qwen2.5-coder-3b-instruct-gptq-int4", "alias": [ - "Qwen/Qwen2.5-Coder-3B-Instruct-GPTQ-Int4", "qwen2.5-coder-3b-instruct-gptq-int4" ], "max_tokens": 32768, @@ -11554,7 +11345,6 @@ { "name": "qwen/qwen2.5-coder-3b-instruct-gptq-int8", "alias": [ - "Qwen/Qwen2.5-Coder-3B-Instruct-GPTQ-Int8", "qwen2.5-coder-3b-instruct-gptq-int8" ], "max_tokens": 32768, @@ -11565,7 +11355,6 @@ { "name": "qwen/qwen2.5-coder-0.5b-instruct-gptq-int4", "alias": [ - "Qwen/Qwen2.5-Coder-0.5B-Instruct-GPTQ-Int4", "qwen2.5-coder-0.5b-instruct-gptq-int4" ], "max_tokens": 32768, @@ -11576,7 +11365,6 @@ { "name": "qwen/qwen2.5-coder-0.5b-instruct-gptq-int8", "alias": [ - "Qwen/Qwen2.5-Coder-0.5B-Instruct-GPTQ-Int8", "qwen2.5-coder-0.5b-instruct-gptq-int8" ], "max_tokens": 32768, @@ -11587,7 +11375,6 @@ { "name": "qwen/qwen2.5-coder-32b", "alias": [ - "Qwen/Qwen2.5-Coder-32B", "qwen2.5-coder-32b" ], "max_tokens": 32768, @@ -11598,7 +11385,6 @@ { "name": "qwen/qwen2.5-coder-14b", "alias": [ - "Qwen/Qwen2.5-Coder-14B", "qwen2.5-coder-14b" ], "max_tokens": 32768, @@ -11609,7 +11395,6 @@ { "name": "qwen/qwen2.5-coder-3b", "alias": [ - "Qwen/Qwen2.5-Coder-3B", "qwen2.5-coder-3b" ], "max_tokens": 32768, @@ -11620,7 +11405,6 @@ { "name": "qwen/qwen2.5-coder-0.5b", "alias": [ - "Qwen/Qwen2.5-Coder-0.5B", "qwen2.5-coder-0.5b" ], "max_tokens": 32768, @@ -11631,8 +11415,8 @@ { "name": "qwen/qwen2.5-coder-32b-instruct", "alias": [ - "Qwen/Qwen2.5-Coder-32B-Instruct", - "qwen2.5-coder-32b-instruct" + "qwen2.5-coder-32b-instruct", + "Qwen 2.5 Coder 32B Instruct" ], "max_tokens": 32768, "model_types": [ @@ -11642,7 +11426,6 @@ { "name": "qwen/qwen2.5-coder-14b-instruct", "alias": [ - "Qwen/Qwen2.5-Coder-14B-Instruct", "qwen2.5-coder-14b-instruct" ], "max_tokens": 32768, @@ -11653,7 +11436,6 @@ { "name": "qwen/qwen2.5-coder-3b-instruct", "alias": [ - "Qwen/Qwen2.5-Coder-3B-Instruct", "qwen2.5-coder-3b-instruct" ], "max_tokens": 32768, @@ -11664,7 +11446,6 @@ { "name": "qwen/qwen2.5-coder-0.5b-instruct", "alias": [ - "Qwen/Qwen2.5-Coder-0.5B-Instruct", "qwen2.5-coder-0.5b-instruct" ], "max_tokens": 32768, @@ -11675,7 +11456,6 @@ { "name": "qwen/qwen2.5-coder-1.5b-instruct-awq", "alias": [ - "Qwen/Qwen2.5-Coder-1.5B-Instruct-AWQ", "qwen2.5-coder-1.5b-instruct-awq" ], "max_tokens": 32768, @@ -11686,7 +11466,6 @@ { "name": "qwen/qwen2.5-coder-7b-instruct-awq", "alias": [ - "Qwen/Qwen2.5-Coder-7B-Instruct-AWQ", "qwen2.5-coder-7b-instruct-awq" ], "max_tokens": 32768, @@ -11697,7 +11476,6 @@ { "name": "qwen/qwen2.5-coder-7b-instruct-gptq-int8", "alias": [ - "Qwen/Qwen2.5-Coder-7B-Instruct-GPTQ-Int8", "qwen2.5-coder-7b-instruct-gptq-int8" ], "max_tokens": 32768, @@ -11708,7 +11486,6 @@ { "name": "qwen/qwen2.5-coder-7b-instruct-gptq-int4", "alias": [ - "Qwen/Qwen2.5-Coder-7B-Instruct-GPTQ-Int4", "qwen2.5-coder-7b-instruct-gptq-int4" ], "max_tokens": 32768, @@ -11719,7 +11496,6 @@ { "name": "qwen/qwen2.5-coder-1.5b-instruct-gptq-int8", "alias": [ - "Qwen/Qwen2.5-Coder-1.5B-Instruct-GPTQ-Int8", "qwen2.5-coder-1.5b-instruct-gptq-int8" ], "max_tokens": 32768, @@ -11730,7 +11506,6 @@ { "name": "qwen/qwen2.5-coder-1.5b-instruct-gptq-int4", "alias": [ - "Qwen/Qwen2.5-Coder-1.5B-Instruct-GPTQ-Int4", "qwen2.5-coder-1.5b-instruct-gptq-int4" ], "max_tokens": 32768, @@ -11741,7 +11516,6 @@ { "name": "qwen/qwen2.5-math-7b-instruct", "alias": [ - "Qwen/Qwen2.5-Math-7B-Instruct", "qwen2.5-math-7b-instruct" ], "max_tokens": 4096, @@ -11752,7 +11526,6 @@ { "name": "qwen/qwen2.5-coder-1.5b-instruct-gguf", "alias": [ - "Qwen/Qwen2.5-Coder-1.5B-Instruct-GGUF", "qwen2.5-coder-1.5b-instruct-gguf" ], "model_types": [ @@ -11762,7 +11535,6 @@ { "name": "qwen/qwen2.5-coder-7b-instruct-gguf", "alias": [ - "Qwen/Qwen2.5-Coder-7B-Instruct-GGUF", "qwen2.5-coder-7b-instruct-gguf" ], "model_types": [ @@ -11772,7 +11544,6 @@ { "name": "qwen/qwen2.5-coder-1.5b-instruct", "alias": [ - "Qwen/Qwen2.5-Coder-1.5B-Instruct", "qwen2.5-coder-1.5b-instruct" ], "max_tokens": 32768, @@ -11783,7 +11554,6 @@ { "name": "qwen/qwen2.5-coder-1.5b", "alias": [ - "Qwen/Qwen2.5-Coder-1.5B", "qwen2.5-coder-1.5b" ], "max_tokens": 32768, @@ -11794,7 +11564,6 @@ { "name": "qwen/qwen2-7b-instruct-mlx", "alias": [ - "Qwen/Qwen2-7B-Instruct-MLX", "qwen2-7b-instruct-mlx" ], "max_tokens": 32768, @@ -11805,8 +11574,8 @@ { "name": "qwen/qwen2.5-1.5b-instruct", "alias": [ - "Qwen/Qwen2.5-1.5B-Instruct", - "qwen2.5-1.5b-instruct" + "qwen2.5-1.5b-instruct", + "Qwen2.5 1.5B Instruct" ], "max_tokens": 32768, "model_types": [ @@ -11816,8 +11585,8 @@ { "name": "qwen/qwen2.5-3b-instruct", "alias": [ - "Qwen/Qwen2.5-3B-Instruct", - "qwen2.5-3b-instruct" + "qwen2.5-3b-instruct", + "Qwen2.5 3B Instruct" ], "max_tokens": 32768, "model_types": [ @@ -11827,7 +11596,6 @@ { "name": "qwen/qwen2.5-72b-instruct-gguf", "alias": [ - "Qwen/Qwen2.5-72B-Instruct-GGUF", "qwen2.5-72b-instruct-gguf" ], "model_types": [ @@ -11838,7 +11606,6 @@ { "name": "qwen/qwen2.5-32b-instruct-gguf", "alias": [ - "Qwen/Qwen2.5-32B-Instruct-GGUF", "qwen2.5-32b-instruct-gguf" ], "model_types": [ @@ -11849,7 +11616,6 @@ { "name": "qwen/qwen2.5-14b-instruct-gguf", "alias": [ - "Qwen/Qwen2.5-14B-Instruct-GGUF", "qwen2.5-14b-instruct-gguf" ], "model_types": [ @@ -11860,7 +11626,6 @@ { "name": "qwen/qwen2.5-7b-instruct-gguf", "alias": [ - "Qwen/Qwen2.5-7B-Instruct-GGUF", "qwen2.5-7b-instruct-gguf" ], "model_types": [ @@ -11871,7 +11636,6 @@ { "name": "qwen/qwen2.5-3b-instruct-gguf", "alias": [ - "Qwen/Qwen2.5-3B-Instruct-GGUF", "qwen2.5-3b-instruct-gguf" ], "model_types": [ @@ -11881,7 +11645,6 @@ { "name": "qwen/qwen2.5-1.5b-instruct-gguf", "alias": [ - "Qwen/Qwen2.5-1.5B-Instruct-GGUF", "qwen2.5-1.5b-instruct-gguf" ], "model_types": [ @@ -11891,7 +11654,6 @@ { "name": "qwen/qwen2.5-0.5b-instruct-gguf", "alias": [ - "Qwen/Qwen2.5-0.5B-Instruct-GGUF", "qwen2.5-0.5b-instruct-gguf" ], "model_types": [ @@ -11901,7 +11663,6 @@ { "name": "qwen/qwen2.5-72b-instruct-awq", "alias": [ - "Qwen/Qwen2.5-72B-Instruct-AWQ", "qwen2.5-72b-instruct-awq" ], "max_tokens": 131072, @@ -11912,7 +11673,6 @@ { "name": "qwen/qwen2.5-32b-instruct-awq", "alias": [ - "Qwen/Qwen2.5-32B-Instruct-AWQ", "qwen2.5-32b-instruct-awq" ], "max_tokens": 131072, @@ -11923,7 +11683,6 @@ { "name": "qwen/qwen2.5-14b-instruct-awq", "alias": [ - "Qwen/Qwen2.5-14B-Instruct-AWQ", "qwen2.5-14b-instruct-awq" ], "max_tokens": 131072, @@ -11934,7 +11693,6 @@ { "name": "qwen/qwen2.5-7b-instruct-awq", "alias": [ - "Qwen/Qwen2.5-7B-Instruct-AWQ", "qwen2.5-7b-instruct-awq" ], "max_tokens": 131072, @@ -11945,7 +11703,6 @@ { "name": "qwen/qwen2.5-3b-instruct-awq", "alias": [ - "Qwen/Qwen2.5-3B-Instruct-AWQ", "qwen2.5-3b-instruct-awq" ], "max_tokens": 32768, @@ -11956,7 +11713,6 @@ { "name": "qwen/qwen2.5-1.5b-instruct-awq", "alias": [ - "Qwen/Qwen2.5-1.5B-Instruct-AWQ", "qwen2.5-1.5b-instruct-awq" ], "max_tokens": 32768, @@ -11967,7 +11723,6 @@ { "name": "qwen/qwen2.5-0.5b-instruct-awq", "alias": [ - "Qwen/Qwen2.5-0.5B-Instruct-AWQ", "qwen2.5-0.5b-instruct-awq" ], "max_tokens": 32768, @@ -11978,7 +11733,6 @@ { "name": "qwen/qwen2.5-coder-7b-instruct", "alias": [ - "Qwen/Qwen2.5-Coder-7B-Instruct", "qwen2.5-coder-7b-instruct" ], "max_tokens": 32768, @@ -11989,7 +11743,6 @@ { "name": "qwen/qwen2.5-72b-instruct-gptq-int8", "alias": [ - "Qwen/Qwen2.5-72B-Instruct-GPTQ-Int8", "qwen2.5-72b-instruct-gptq-int8" ], "max_tokens": 131072, @@ -12000,7 +11753,6 @@ { "name": "qwen/qwen2.5-72b-instruct-gptq-int4", "alias": [ - "Qwen/Qwen2.5-72B-Instruct-GPTQ-Int4", "qwen2.5-72b-instruct-gptq-int4" ], "max_tokens": 131072, @@ -12011,7 +11763,6 @@ { "name": "qwen/qwen2.5-32b-instruct-gptq-int8", "alias": [ - "Qwen/Qwen2.5-32B-Instruct-GPTQ-Int8", "qwen2.5-32b-instruct-gptq-int8" ], "max_tokens": 131072, @@ -12022,7 +11773,6 @@ { "name": "qwen/qwen2.5-32b-instruct-gptq-int4", "alias": [ - "Qwen/Qwen2.5-32B-Instruct-GPTQ-Int4", "qwen2.5-32b-instruct-gptq-int4" ], "max_tokens": 131072, @@ -12033,7 +11783,6 @@ { "name": "qwen/qwen2.5-14b-instruct-gptq-int8", "alias": [ - "Qwen/Qwen2.5-14B-Instruct-GPTQ-Int8", "qwen2.5-14b-instruct-gptq-int8" ], "max_tokens": 131072, @@ -12044,7 +11793,6 @@ { "name": "qwen/qwen2.5-14b-instruct-gptq-int4", "alias": [ - "Qwen/Qwen2.5-14B-Instruct-GPTQ-Int4", "qwen2.5-14b-instruct-gptq-int4" ], "max_tokens": 131072, @@ -12055,7 +11803,6 @@ { "name": "qwen/qwen2.5-7b-instruct-gptq-int8", "alias": [ - "Qwen/Qwen2.5-7B-Instruct-GPTQ-Int8", "qwen2.5-7b-instruct-gptq-int8" ], "max_tokens": 131072, @@ -12066,7 +11813,6 @@ { "name": "qwen/qwen2.5-7b-instruct-gptq-int4", "alias": [ - "Qwen/Qwen2.5-7B-Instruct-GPTQ-Int4", "qwen2.5-7b-instruct-gptq-int4" ], "max_tokens": 131072, @@ -12077,7 +11823,6 @@ { "name": "qwen/qwen2.5-3b-instruct-gptq-int8", "alias": [ - "Qwen/Qwen2.5-3B-Instruct-GPTQ-Int8", "qwen2.5-3b-instruct-gptq-int8" ], "max_tokens": 32768, @@ -12088,7 +11833,6 @@ { "name": "qwen/qwen2.5-3b-instruct-gptq-int4", "alias": [ - "Qwen/Qwen2.5-3B-Instruct-GPTQ-Int4", "qwen2.5-3b-instruct-gptq-int4" ], "max_tokens": 32768, @@ -12099,7 +11843,6 @@ { "name": "qwen/qwen2.5-1.5b-instruct-gptq-int8", "alias": [ - "Qwen/Qwen2.5-1.5B-Instruct-GPTQ-Int8", "qwen2.5-1.5b-instruct-gptq-int8" ], "max_tokens": 32768, @@ -12110,7 +11853,6 @@ { "name": "qwen/qwen2.5-1.5b-instruct-gptq-int4", "alias": [ - "Qwen/Qwen2.5-1.5B-Instruct-GPTQ-Int4", "qwen2.5-1.5b-instruct-gptq-int4" ], "max_tokens": 32768, @@ -12121,7 +11863,6 @@ { "name": "qwen/qwen2.5-0.5b-instruct-gptq-int8", "alias": [ - "Qwen/Qwen2.5-0.5B-Instruct-GPTQ-Int8", "qwen2.5-0.5b-instruct-gptq-int8" ], "max_tokens": 32768, @@ -12132,7 +11873,6 @@ { "name": "qwen/qwen2.5-0.5b-instruct-gptq-int4", "alias": [ - "Qwen/Qwen2.5-0.5B-Instruct-GPTQ-Int4", "qwen2.5-0.5b-instruct-gptq-int4" ], "max_tokens": 32768, @@ -12143,7 +11883,6 @@ { "name": "qwen/qwen2-math-rm-72b", "alias": [ - "Qwen/Qwen2-Math-RM-72B", "qwen2-math-rm-72b" ], "max_tokens": 4096, @@ -12154,7 +11893,6 @@ { "name": "qwen/qwen2.5-math-rm-72b", "alias": [ - "Qwen/Qwen2.5-Math-RM-72B", "qwen2.5-math-rm-72b" ], "max_tokens": 4096, @@ -12165,7 +11903,6 @@ { "name": "qwen/qwen2-vl-72b-instruct-gptq-int8", "alias": [ - "Qwen/Qwen2-VL-72B-Instruct-GPTQ-Int8", "qwen2-vl-72b-instruct-gptq-int8" ], "max_tokens": 32768, @@ -12176,7 +11913,6 @@ { "name": "qwen/qwen2-vl-72b-instruct-gptq-int4", "alias": [ - "Qwen/Qwen2-VL-72B-Instruct-GPTQ-Int4", "qwen2-vl-72b-instruct-gptq-int4" ], "max_tokens": 32768, @@ -12187,7 +11923,6 @@ { "name": "qwen/qwen2-vl-72b-instruct-awq", "alias": [ - "Qwen/Qwen2-VL-72B-Instruct-AWQ", "qwen2-vl-72b-instruct-awq" ], "max_tokens": 32768, @@ -12198,31 +11933,35 @@ { "name": "qwen/qwen2-vl-72b-instruct", "alias": [ - "Qwen/Qwen2-VL-72B-Instruct", "qwen2-vl-72b-instruct", - "qwen/qwen-2-vl-72b-instruct" + "qwen/qwen-2-vl-72b-instruct", + "qwen-2-vl-72b-instruct", + "Qwen 2 VL 72B Instruct", + "Qwen2-VL (72B) Instruct" ], "max_tokens": 32768, "model_types": [ - "chat" - ] + "chat", + "vision", + "image2text" + ], + "max_completion_tokens": 120000 }, { "name": "qwen/qwen2.5-32b-instruct", "alias": [ - "Qwen/Qwen2.5-32B-Instruct", "qwen2.5-32b-instruct", - "Qwen2.5-32B-Instruct" + "Qwen2.5 32B Instruct" ], "max_tokens": 131072, "model_types": [ "chat" - ] + ], + "max_completion_tokens": 32000 }, { "name": "qwen/qwen2.5-math-72b-instruct", "alias": [ - "Qwen/Qwen2.5-Math-72B-Instruct", "qwen2.5-math-72b-instruct" ], "max_tokens": 4096, @@ -12233,7 +11972,6 @@ { "name": "qwen/qwen2.5-math-72b", "alias": [ - "Qwen/Qwen2.5-Math-72B", "qwen2.5-math-72b" ], "max_tokens": 4096, @@ -12244,7 +11982,6 @@ { "name": "qwen/qwen2.5-math-7b", "alias": [ - "Qwen/Qwen2.5-Math-7B", "qwen2.5-math-7b" ], "max_tokens": 4096, @@ -12255,7 +11992,6 @@ { "name": "qwen/qwen2.5-math-1.5b-instruct", "alias": [ - "Qwen/Qwen2.5-Math-1.5B-Instruct", "qwen2.5-math-1.5b-instruct" ], "max_tokens": 4096, @@ -12266,7 +12002,6 @@ { "name": "qwen/qwen2.5-math-1.5b", "alias": [ - "Qwen/Qwen2.5-Math-1.5B", "qwen2.5-math-1.5b" ], "max_tokens": 4096, @@ -12277,7 +12012,6 @@ { "name": "qwen/qwen2.5-coder-7b", "alias": [ - "Qwen/Qwen2.5-Coder-7B", "qwen2.5-coder-7b" ], "max_tokens": 32768, @@ -12288,22 +12022,23 @@ { "name": "qwen/qwen2.5-72b-instruct", "alias": [ - "Qwen/Qwen2.5-72B-Instruct", "qwen2.5-72b-instruct", "qwen/qwen-2.5-72b-instruct", - "Qwen2.5-72B-Instruct" + "qwen-2.5-72b-instruct", + "Qwen 2.5 72B Instruct", + "Qwen2.5 72B Instruct" ], "max_tokens": 131072, "model_types": [ "chat" - ] + ], + "max_completion_tokens": 8192 }, { "name": "qwen/qwen2.5-14b-instruct", "alias": [ - "Qwen/Qwen2.5-14B-Instruct", "qwen2.5-14b-instruct", - "Qwen2.5-14B-Instruct" + "Qwen 2.5 14B Instruct" ], "max_tokens": 131072, "model_types": [ @@ -12313,19 +12048,18 @@ { "name": "qwen/qwen2.5-7b-instruct", "alias": [ - "Qwen/Qwen2.5-7B-Instruct", "qwen2.5-7b-instruct", - "Qwen2.5-7B-Instruct" + "Qwen2.5 7B Instruct" ], "max_tokens": 131072, "model_types": [ "chat" - ] + ], + "max_completion_tokens": 8192 }, { "name": "qwen/qwen2.5-0.5b-instruct", "alias": [ - "Qwen/Qwen2.5-0.5B-Instruct", "qwen2.5-0.5b-instruct" ], "max_tokens": 32768, @@ -12336,9 +12070,8 @@ { "name": "qwen/qwen2.5-72b", "alias": [ - "Qwen/Qwen2.5-72B", "qwen2.5-72b", - "Qwen2.5-72B" + "Qwen2.5 72B" ], "max_tokens": 131072, "model_types": [ @@ -12348,8 +12081,8 @@ { "name": "qwen/qwen2.5-32b", "alias": [ - "Qwen/Qwen2.5-32B", - "qwen2.5-32b" + "qwen2.5-32b", + "Qwen2.5 32B" ], "max_tokens": 131072, "model_types": [ @@ -12359,8 +12092,8 @@ { "name": "qwen/qwen2.5-14b", "alias": [ - "Qwen/Qwen2.5-14B", - "qwen2.5-14b" + "qwen2.5-14b", + "Qwen2.5 14B" ], "max_tokens": 131072, "model_types": [ @@ -12370,8 +12103,8 @@ { "name": "qwen/qwen2.5-7b", "alias": [ - "Qwen/Qwen2.5-7B", - "qwen2.5-7b" + "qwen2.5-7b", + "Qwen2.5 7B" ], "max_tokens": 131072, "model_types": [ @@ -12381,7 +12114,6 @@ { "name": "qwen/qwen2.5-3b", "alias": [ - "Qwen/Qwen2.5-3B", "qwen2.5-3b" ], "max_tokens": 32768, @@ -12392,8 +12124,8 @@ { "name": "qwen/qwen2.5-1.5b", "alias": [ - "Qwen/Qwen2.5-1.5B", - "qwen2.5-1.5b" + "qwen2.5-1.5b", + "Qwen2.5 1.5B" ], "max_tokens": 131072, "model_types": [ @@ -12403,7 +12135,6 @@ { "name": "qwen/qwen2.5-0.5b", "alias": [ - "Qwen/Qwen2.5-0.5B", "qwen2.5-0.5b" ], "max_tokens": 32768, @@ -12414,7 +12145,6 @@ { "name": "qwen/qwen2-vl-7b", "alias": [ - "Qwen/Qwen2-VL-7B", "qwen2-vl-7b" ], "max_tokens": 32768, @@ -12425,7 +12155,6 @@ { "name": "qwen/qwen2-vl-2b", "alias": [ - "Qwen/Qwen2-VL-2B", "qwen2-vl-2b" ], "max_tokens": 32768, @@ -12436,7 +12165,6 @@ { "name": "qwen/qwen2-vl-2b-instruct-gptq-int8", "alias": [ - "Qwen/Qwen2-VL-2B-Instruct-GPTQ-Int8", "qwen2-vl-2b-instruct-gptq-int8" ], "max_tokens": 32768, @@ -12447,7 +12175,6 @@ { "name": "qwen/qwen2-vl-2b-instruct-gptq-int4", "alias": [ - "Qwen/Qwen2-VL-2B-Instruct-GPTQ-Int4", "qwen2-vl-2b-instruct-gptq-int4" ], "max_tokens": 32768, @@ -12458,7 +12185,6 @@ { "name": "qwen/qwen2-vl-2b-instruct-awq", "alias": [ - "Qwen/Qwen2-VL-2B-Instruct-AWQ", "qwen2-vl-2b-instruct-awq" ], "max_tokens": 32768, @@ -12469,7 +12195,6 @@ { "name": "qwen/qwen2-vl-7b-instruct-gptq-int8", "alias": [ - "Qwen/Qwen2-VL-7B-Instruct-GPTQ-Int8", "qwen2-vl-7b-instruct-gptq-int8" ], "max_tokens": 32768, @@ -12480,7 +12205,6 @@ { "name": "qwen/qwen2-vl-7b-instruct-gptq-int4", "alias": [ - "Qwen/Qwen2-VL-7B-Instruct-GPTQ-Int4", "qwen2-vl-7b-instruct-gptq-int4" ], "max_tokens": 32768, @@ -12491,7 +12215,6 @@ { "name": "qwen/qwen2-vl-7b-instruct-awq", "alias": [ - "Qwen/Qwen2-VL-7B-Instruct-AWQ", "qwen2-vl-7b-instruct-awq" ], "max_tokens": 32768, @@ -12502,7 +12225,6 @@ { "name": "qwen/qwen2-vl-7b-instruct", "alias": [ - "Qwen/Qwen2-VL-7B-Instruct", "qwen2-vl-7b-instruct" ], "max_tokens": 32768, @@ -12513,7 +12235,6 @@ { "name": "qwen/qwen2-vl-2b-instruct", "alias": [ - "Qwen/Qwen2-VL-2B-Instruct", "qwen2-vl-2b-instruct" ], "max_tokens": 32768, @@ -12524,7 +12245,6 @@ { "name": "qwen/qwen2-math-1.5b", "alias": [ - "Qwen/Qwen2-Math-1.5B", "qwen2-math-1.5b" ], "max_tokens": 4096, @@ -12535,7 +12255,6 @@ { "name": "qwen/qwen2-math-7b", "alias": [ - "Qwen/Qwen2-Math-7B", "qwen2-math-7b" ], "max_tokens": 4096, @@ -12546,7 +12265,6 @@ { "name": "qwen/qwen2-math-72b", "alias": [ - "Qwen/Qwen2-Math-72B", "qwen2-math-72b" ], "max_tokens": 4096, @@ -12557,7 +12275,6 @@ { "name": "qwen/qwen2-math-1.5b-instruct", "alias": [ - "Qwen/Qwen2-Math-1.5B-Instruct", "qwen2-math-1.5b-instruct" ], "max_tokens": 4096, @@ -12568,7 +12285,6 @@ { "name": "qwen/qwen2-math-7b-instruct", "alias": [ - "Qwen/Qwen2-Math-7B-Instruct", "qwen2-math-7b-instruct" ], "max_tokens": 4096, @@ -12579,7 +12295,6 @@ { "name": "qwen/qwen2-math-72b-instruct", "alias": [ - "Qwen/Qwen2-Math-72B-Instruct", "qwen2-math-72b-instruct" ], "max_tokens": 4096, @@ -12590,9 +12305,7 @@ { "name": "qwen/qwen2-audio-7b-instruct", "alias": [ - "Qwen/Qwen2-Audio-7B-Instruct", - "qwen2-audio-7b-instruct", - "Qwen2-Audio-7B-Instruct" + "qwen2-audio-7b-instruct" ], "max_tokens": 8192, "model_types": [ @@ -12605,7 +12318,6 @@ { "name": "qwen/qwen2-audio-7b", "alias": [ - "Qwen/Qwen2-Audio-7B", "qwen2-audio-7b" ], "max_tokens": 8192, @@ -12618,7 +12330,6 @@ { "name": "qwen/qwen2-57b-a14b-instruct-gguf", "alias": [ - "Qwen/Qwen2-57B-A14B-Instruct-GGUF", "qwen2-57b-a14b-instruct-gguf" ], "model_types": [ @@ -12628,7 +12339,6 @@ { "name": "qwen/qwen2-1.5b-instruct-gguf", "alias": [ - "Qwen/Qwen2-1.5B-Instruct-GGUF", "qwen2-1.5b-instruct-gguf" ], "model_types": [ @@ -12638,7 +12348,6 @@ { "name": "qwen/qwen2-7b-instruct-gguf", "alias": [ - "Qwen/Qwen2-7B-Instruct-GGUF", "qwen2-7b-instruct-gguf" ], "model_types": [ @@ -12648,7 +12357,6 @@ { "name": "qwen/qwen2-72b-instruct-gguf", "alias": [ - "Qwen/Qwen2-72B-Instruct-GGUF", "qwen2-72b-instruct-gguf" ], "model_types": [ @@ -12658,7 +12366,6 @@ { "name": "qwen/qwen2-1.5b-instruct-mlx", "alias": [ - "Qwen/Qwen2-1.5B-Instruct-MLX", "qwen2-1.5b-instruct-mlx" ], "max_tokens": 32768, @@ -12669,7 +12376,6 @@ { "name": "qwen/qwen2-0.5b-instruct-gguf", "alias": [ - "Qwen/Qwen2-0.5B-Instruct-GGUF", "qwen2-0.5b-instruct-gguf" ], "model_types": [ @@ -12679,7 +12385,6 @@ { "name": "qwen/qwen2-0.5b-instruct-mlx", "alias": [ - "Qwen/Qwen2-0.5B-Instruct-MLX", "qwen2-0.5b-instruct-mlx" ], "max_tokens": 32768, @@ -12690,7 +12395,6 @@ { "name": "qwen/qwen2-0.5b-instruct-awq", "alias": [ - "Qwen/Qwen2-0.5B-Instruct-AWQ", "qwen2-0.5b-instruct-awq" ], "max_tokens": 32768, @@ -12701,7 +12405,6 @@ { "name": "qwen/qwen2-0.5b-instruct-gptq-int8", "alias": [ - "Qwen/Qwen2-0.5B-Instruct-GPTQ-Int8", "qwen2-0.5b-instruct-gptq-int8" ], "max_tokens": 32768, @@ -12712,7 +12415,6 @@ { "name": "qwen/qwen2-0.5b-instruct-gptq-int4", "alias": [ - "Qwen/Qwen2-0.5B-Instruct-GPTQ-Int4", "qwen2-0.5b-instruct-gptq-int4" ], "max_tokens": 32768, @@ -12723,7 +12425,6 @@ { "name": "qwen/qwen2-7b-instruct-awq", "alias": [ - "Qwen/Qwen2-7B-Instruct-AWQ", "qwen2-7b-instruct-awq" ], "max_tokens": 32768, @@ -12734,7 +12435,6 @@ { "name": "qwen/qwen2-7b-instruct-gptq-int8", "alias": [ - "Qwen/Qwen2-7B-Instruct-GPTQ-Int8", "qwen2-7b-instruct-gptq-int8" ], "max_tokens": 32768, @@ -12745,7 +12445,6 @@ { "name": "qwen/qwen2-7b-instruct-gptq-int4", "alias": [ - "Qwen/Qwen2-7B-Instruct-GPTQ-Int4", "qwen2-7b-instruct-gptq-int4" ], "max_tokens": 32768, @@ -12756,7 +12455,6 @@ { "name": "qwen/qwen2-1.5b-instruct-awq", "alias": [ - "Qwen/Qwen2-1.5B-Instruct-AWQ", "qwen2-1.5b-instruct-awq" ], "max_tokens": 32768, @@ -12767,7 +12465,6 @@ { "name": "qwen/qwen2-1.5b-instruct-gptq-int8", "alias": [ - "Qwen/Qwen2-1.5B-Instruct-GPTQ-Int8", "qwen2-1.5b-instruct-gptq-int8" ], "max_tokens": 32768, @@ -12778,7 +12475,6 @@ { "name": "qwen/qwen2-1.5b-instruct-gptq-int4", "alias": [ - "Qwen/Qwen2-1.5B-Instruct-GPTQ-Int4", "qwen2-1.5b-instruct-gptq-int4" ], "max_tokens": 32768, @@ -12789,7 +12485,6 @@ { "name": "qwen/qwen2-57b-a14b-instruct-gptq-int4", "alias": [ - "Qwen/Qwen2-57B-A14B-Instruct-GPTQ-Int4", "qwen2-57b-a14b-instruct-gptq-int4" ], "max_tokens": 32768, @@ -12800,8 +12495,8 @@ { "name": "qwen/qwen2-7b", "alias": [ - "Qwen/Qwen2-7B", - "qwen2-7b" + "qwen2-7b", + "Qwen 2 (7B)" ], "max_tokens": 131072, "model_types": [ @@ -12811,20 +12506,20 @@ { "name": "qwen/qwen2-7b-instruct", "alias": [ - "Qwen/Qwen2-7B-Instruct", "qwen2-7b-instruct", "qwen/qwen-2-7b-instruct", - "Qwen2-7B-Instruct" + "qwen-2-7b-instruct", + "Qwen 2 7B Instruct" ], "max_tokens": 32768, "model_types": [ "chat" - ] + ], + "max_completion_tokens": 32768 }, { "name": "qwen/qwen2-57b-a14b-instruct", "alias": [ - "Qwen/Qwen2-57B-A14B-Instruct", "qwen2-57b-a14b-instruct" ], "max_tokens": 32768, @@ -12835,7 +12530,6 @@ { "name": "qwen/qwen2-72b-instruct-awq", "alias": [ - "Qwen/Qwen2-72B-Instruct-AWQ", "qwen2-72b-instruct-awq" ], "max_tokens": 32768, @@ -12846,7 +12540,6 @@ { "name": "qwen/qwen2-72b-instruct-gptq-int8", "alias": [ - "Qwen/Qwen2-72B-Instruct-GPTQ-Int8", "qwen2-72b-instruct-gptq-int8" ], "max_tokens": 32768, @@ -12857,7 +12550,6 @@ { "name": "qwen/qwen2-72b-instruct-gptq-int4", "alias": [ - "Qwen/Qwen2-72B-Instruct-GPTQ-Int4", "qwen2-72b-instruct-gptq-int4" ], "max_tokens": 32768, @@ -12868,8 +12560,8 @@ { "name": "qwen/qwen2-1.5b-instruct", "alias": [ - "Qwen/Qwen2-1.5B-Instruct", - "qwen2-1.5b-instruct" + "qwen2-1.5b-instruct", + "Qwen 2 Instruct (1.5B)" ], "max_tokens": 32768, "model_types": [ @@ -12879,7 +12571,6 @@ { "name": "qwen/qwen2-0.5b-instruct", "alias": [ - "Qwen/Qwen2-0.5B-Instruct", "qwen2-0.5b-instruct" ], "max_tokens": 32768, @@ -12890,8 +12581,8 @@ { "name": "qwen/qwen2-1.5b", "alias": [ - "Qwen/Qwen2-1.5B", - "qwen2-1.5b" + "qwen2-1.5b", + "Qwen 2 (1.5B)" ], "max_tokens": 131072, "model_types": [ @@ -12901,7 +12592,6 @@ { "name": "qwen/qwen2-0.5b", "alias": [ - "Qwen/Qwen2-0.5B", "qwen2-0.5b" ], "max_tokens": 131072, @@ -12912,9 +12602,8 @@ { "name": "qwen/qwen2-72b-instruct", "alias": [ - "Qwen/Qwen2-72B-Instruct", "qwen2-72b-instruct", - "Qwen2-72B-Instruct" + "Qwen2 72B Instruct" ], "max_tokens": 32768, "model_types": [ @@ -12924,7 +12613,6 @@ { "name": "qwen/qwen2-57b-a14b", "alias": [ - "Qwen/Qwen2-57B-A14B", "qwen2-57b-a14b" ], "max_tokens": 131072, @@ -12935,8 +12623,8 @@ { "name": "qwen/qwen2-72b", "alias": [ - "Qwen/Qwen2-72B", - "qwen2-72b" + "qwen2-72b", + "Qwen 2 (72B)" ], "max_tokens": 131072, "model_types": [ @@ -12946,7 +12634,6 @@ { "name": "qwen/qwen1.5-110b-chat-gguf", "alias": [ - "Qwen/Qwen1.5-110B-Chat-GGUF", "qwen1.5-110b-chat-gguf" ], "model_types": [ @@ -12956,7 +12643,6 @@ { "name": "qwen/qwen1.5-110b-chat-awq", "alias": [ - "Qwen/Qwen1.5-110B-Chat-AWQ", "qwen1.5-110b-chat-awq" ], "max_tokens": 32768, @@ -12967,7 +12653,6 @@ { "name": "qwen/qwen1.5-110b-chat-gptq-int4", "alias": [ - "Qwen/Qwen1.5-110B-Chat-GPTQ-Int4", "qwen1.5-110b-chat-gptq-int4" ], "max_tokens": 32768, @@ -12978,7 +12663,6 @@ { "name": "qwen/qwen1.5-110b-chat", "alias": [ - "Qwen/Qwen1.5-110B-Chat", "qwen1.5-110b-chat" ], "max_tokens": 32768, @@ -12989,7 +12673,6 @@ { "name": "qwen/qwen1.5-110b", "alias": [ - "Qwen/Qwen1.5-110B", "qwen1.5-110b" ], "max_tokens": 32768, @@ -13000,7 +12683,6 @@ { "name": "qwen/codeqwen1.5-7b-awq", "alias": [ - "Qwen/CodeQwen1.5-7B-AWQ", "codeqwen1.5-7b-awq" ], "max_tokens": 65536, @@ -13011,7 +12693,6 @@ { "name": "qwen/codeqwen1.5-7b-chat-gguf", "alias": [ - "Qwen/CodeQwen1.5-7B-Chat-GGUF", "codeqwen1.5-7b-chat-gguf" ], "model_types": [ @@ -13021,7 +12702,6 @@ { "name": "qwen/codeqwen1.5-7b-chat-awq", "alias": [ - "Qwen/CodeQwen1.5-7B-Chat-AWQ", "codeqwen1.5-7b-chat-awq" ], "max_tokens": 65536, @@ -13032,7 +12712,6 @@ { "name": "qwen/codeqwen1.5-7b-chat", "alias": [ - "Qwen/CodeQwen1.5-7B-Chat", "codeqwen1.5-7b-chat" ], "max_tokens": 65536, @@ -13043,7 +12722,6 @@ { "name": "qwen/codeqwen1.5-7b", "alias": [ - "Qwen/CodeQwen1.5-7B", "codeqwen1.5-7b" ], "max_tokens": 65536, @@ -13054,7 +12732,6 @@ { "name": "qwen/qwen1.5-32b-chat-awq", "alias": [ - "Qwen/Qwen1.5-32B-Chat-AWQ", "qwen1.5-32b-chat-awq" ], "max_tokens": 32768, @@ -13065,7 +12742,6 @@ { "name": "qwen/qwen1.5-32b-chat-gguf", "alias": [ - "Qwen/Qwen1.5-32B-Chat-GGUF", "qwen1.5-32b-chat-gguf" ], "model_types": [ @@ -13075,7 +12751,6 @@ { "name": "qwen/qwen1.5-32b-chat", "alias": [ - "Qwen/Qwen1.5-32B-Chat", "qwen1.5-32b-chat" ], "max_tokens": 32768, @@ -13086,7 +12761,6 @@ { "name": "qwen/qwen1.5-32b-chat-gptq-int4", "alias": [ - "Qwen/Qwen1.5-32B-Chat-GPTQ-Int4", "qwen1.5-32b-chat-gptq-int4" ], "max_tokens": 32768, @@ -13097,7 +12771,6 @@ { "name": "qwen/qwen1.5-32b", "alias": [ - "Qwen/Qwen1.5-32B", "qwen1.5-32b" ], "max_tokens": 32768, @@ -13108,7 +12781,6 @@ { "name": "qwen/qwen1.5-moe-a2.7b-chat-gptq-int4", "alias": [ - "Qwen/Qwen1.5-MoE-A2.7B-Chat-GPTQ-Int4", "qwen1.5-moe-a2.7b-chat-gptq-int4" ], "max_tokens": 32768, @@ -13119,7 +12791,6 @@ { "name": "qwen/qwen1.5-moe-a2.7b-chat", "alias": [ - "Qwen/Qwen1.5-MoE-A2.7B-Chat", "qwen1.5-moe-a2.7b-chat" ], "max_tokens": 32768, @@ -13130,7 +12801,6 @@ { "name": "qwen/qwen1.5-moe-a2.7b", "alias": [ - "Qwen/Qwen1.5-MoE-A2.7B", "qwen1.5-moe-a2.7b" ], "max_tokens": 8192, @@ -13141,7 +12811,6 @@ { "name": "qwen/qwen1.5-0.5b-chat-gptq-int8", "alias": [ - "Qwen/Qwen1.5-0.5B-Chat-GPTQ-Int8", "qwen1.5-0.5b-chat-gptq-int8" ], "max_tokens": 32768, @@ -13152,7 +12821,6 @@ { "name": "qwen/qwen1.5-0.5b-chat-gptq-int4", "alias": [ - "Qwen/Qwen1.5-0.5B-Chat-GPTQ-Int4", "qwen1.5-0.5b-chat-gptq-int4" ], "max_tokens": 32768, @@ -13163,7 +12831,6 @@ { "name": "qwen/qwen1.5-1.8b-chat-gptq-int4", "alias": [ - "Qwen/Qwen1.5-1.8B-Chat-GPTQ-Int4", "qwen1.5-1.8b-chat-gptq-int4" ], "max_tokens": 32768, @@ -13174,7 +12841,6 @@ { "name": "qwen/qwen1.5-1.8b-chat-gptq-int8", "alias": [ - "Qwen/Qwen1.5-1.8B-Chat-GPTQ-Int8", "qwen1.5-1.8b-chat-gptq-int8" ], "max_tokens": 32768, @@ -13185,7 +12851,6 @@ { "name": "qwen/qwen1.5-4b-chat-gptq-int4", "alias": [ - "Qwen/Qwen1.5-4B-Chat-GPTQ-Int4", "qwen1.5-4b-chat-gptq-int4" ], "max_tokens": 32768, @@ -13196,7 +12861,6 @@ { "name": "qwen/qwen1.5-4b-chat-gptq-int8", "alias": [ - "Qwen/Qwen1.5-4B-Chat-GPTQ-Int8", "qwen1.5-4b-chat-gptq-int8" ], "max_tokens": 32768, @@ -13207,7 +12871,6 @@ { "name": "qwen/qwen1.5-7b-chat-gptq-int4", "alias": [ - "Qwen/Qwen1.5-7B-Chat-GPTQ-Int4", "qwen1.5-7b-chat-gptq-int4" ], "max_tokens": 32768, @@ -13218,7 +12881,6 @@ { "name": "qwen/qwen1.5-7b-chat-gptq-int8", "alias": [ - "Qwen/Qwen1.5-7B-Chat-GPTQ-Int8", "qwen1.5-7b-chat-gptq-int8" ], "max_tokens": 32768, @@ -13229,7 +12891,6 @@ { "name": "qwen/qwen1.5-14b-chat-gptq-int4", "alias": [ - "Qwen/Qwen1.5-14B-Chat-GPTQ-Int4", "qwen1.5-14b-chat-gptq-int4" ], "max_tokens": 32768, @@ -13240,7 +12901,6 @@ { "name": "qwen/qwen1.5-14b-chat-gptq-int8", "alias": [ - "Qwen/Qwen1.5-14B-Chat-GPTQ-Int8", "qwen1.5-14b-chat-gptq-int8" ], "max_tokens": 32768, @@ -13251,7 +12911,6 @@ { "name": "qwen/qwen1.5-72b-chat-gptq-int4", "alias": [ - "Qwen/Qwen1.5-72B-Chat-GPTQ-Int4", "qwen1.5-72b-chat-gptq-int4" ], "max_tokens": 32768, @@ -13262,7 +12921,6 @@ { "name": "qwen/qwen1.5-72b-chat-gptq-int8", "alias": [ - "Qwen/Qwen1.5-72B-Chat-GPTQ-Int8", "qwen1.5-72b-chat-gptq-int8" ], "max_tokens": 32768, @@ -13273,7 +12931,6 @@ { "name": "qwen/qwen1.5-4b-chat-gguf", "alias": [ - "Qwen/Qwen1.5-4B-Chat-GGUF", "qwen1.5-4b-chat-gguf" ], "model_types": [ @@ -13283,7 +12940,6 @@ { "name": "qwen/qwen1.5-1.8b-chat-gguf", "alias": [ - "Qwen/Qwen1.5-1.8B-Chat-GGUF", "qwen1.5-1.8b-chat-gguf" ], "model_types": [ @@ -13293,7 +12949,6 @@ { "name": "qwen/qwen1.5-0.5b-chat-gguf", "alias": [ - "Qwen/Qwen1.5-0.5B-Chat-GGUF", "qwen1.5-0.5b-chat-gguf" ], "model_types": [ @@ -13303,7 +12958,6 @@ { "name": "qwen/qwen1.5-14b-chat-gguf", "alias": [ - "Qwen/Qwen1.5-14B-Chat-GGUF", "qwen1.5-14b-chat-gguf" ], "model_types": [ @@ -13313,7 +12967,6 @@ { "name": "qwen/qwen1.5-7b-chat-gguf", "alias": [ - "Qwen/Qwen1.5-7B-Chat-GGUF", "qwen1.5-7b-chat-gguf" ], "model_types": [ @@ -13323,7 +12976,6 @@ { "name": "qwen/qwen1.5-72b-chat-gguf", "alias": [ - "Qwen/Qwen1.5-72B-Chat-GGUF", "qwen1.5-72b-chat-gguf" ], "model_types": [ @@ -13333,7 +12985,6 @@ { "name": "qwen/qwen1.5-0.5b-chat-awq", "alias": [ - "Qwen/Qwen1.5-0.5B-Chat-AWQ", "qwen1.5-0.5b-chat-awq" ], "max_tokens": 32768, @@ -13344,7 +12995,6 @@ { "name": "qwen/qwen1.5-1.8b-chat-awq", "alias": [ - "Qwen/Qwen1.5-1.8B-Chat-AWQ", "qwen1.5-1.8b-chat-awq" ], "max_tokens": 32768, @@ -13355,7 +13005,6 @@ { "name": "qwen/qwen1.5-4b-chat-awq", "alias": [ - "Qwen/Qwen1.5-4B-Chat-AWQ", "qwen1.5-4b-chat-awq" ], "max_tokens": 32768, @@ -13366,7 +13015,6 @@ { "name": "qwen/qwen1.5-7b-chat-awq", "alias": [ - "Qwen/Qwen1.5-7B-Chat-AWQ", "qwen1.5-7b-chat-awq" ], "max_tokens": 32768, @@ -13377,7 +13025,6 @@ { "name": "qwen/qwen1.5-14b-chat-awq", "alias": [ - "Qwen/Qwen1.5-14B-Chat-AWQ", "qwen1.5-14b-chat-awq" ], "max_tokens": 32768, @@ -13388,7 +13035,6 @@ { "name": "qwen/qwen1.5-72b-chat-awq", "alias": [ - "Qwen/Qwen1.5-72B-Chat-AWQ", "qwen1.5-72b-chat-awq" ], "max_tokens": 32768, @@ -13399,7 +13045,6 @@ { "name": "qwen/qwen1.5-0.5b-chat", "alias": [ - "Qwen/Qwen1.5-0.5B-Chat", "qwen1.5-0.5b-chat" ], "max_tokens": 32768, @@ -13410,7 +13055,6 @@ { "name": "qwen/qwen1.5-72b-chat", "alias": [ - "Qwen/Qwen1.5-72B-Chat", "qwen1.5-72b-chat" ], "max_tokens": 32768, @@ -13421,7 +13065,6 @@ { "name": "qwen/qwen1.5-14b-chat", "alias": [ - "Qwen/Qwen1.5-14B-Chat", "qwen1.5-14b-chat" ], "max_tokens": 32768, @@ -13432,7 +13075,6 @@ { "name": "qwen/qwen1.5-7b-chat", "alias": [ - "Qwen/Qwen1.5-7B-Chat", "qwen1.5-7b-chat" ], "max_tokens": 32768, @@ -13443,7 +13085,6 @@ { "name": "qwen/qwen1.5-4b-chat", "alias": [ - "Qwen/Qwen1.5-4B-Chat", "qwen1.5-4b-chat" ], "max_tokens": 32768, @@ -13454,7 +13095,6 @@ { "name": "qwen/qwen1.5-1.8b-chat", "alias": [ - "Qwen/Qwen1.5-1.8B-Chat", "qwen1.5-1.8b-chat" ], "max_tokens": 32768, @@ -13465,7 +13105,6 @@ { "name": "qwen/qwen1.5-72b", "alias": [ - "Qwen/Qwen1.5-72B", "qwen1.5-72b" ], "max_tokens": 32768, @@ -13476,7 +13115,6 @@ { "name": "qwen/qwen1.5-14b", "alias": [ - "Qwen/Qwen1.5-14B", "qwen1.5-14b" ], "max_tokens": 32768, @@ -13487,7 +13125,6 @@ { "name": "qwen/qwen1.5-7b", "alias": [ - "Qwen/Qwen1.5-7B", "qwen1.5-7b" ], "max_tokens": 32768, @@ -13498,7 +13135,6 @@ { "name": "qwen/qwen1.5-4b", "alias": [ - "Qwen/Qwen1.5-4B", "qwen1.5-4b" ], "max_tokens": 32768, @@ -13509,7 +13145,6 @@ { "name": "qwen/qwen1.5-1.8b", "alias": [ - "Qwen/Qwen1.5-1.8B", "qwen1.5-1.8b" ], "max_tokens": 32768, @@ -13520,7 +13155,6 @@ { "name": "qwen/qwen1.5-0.5b", "alias": [ - "Qwen/Qwen1.5-0.5B", "qwen1.5-0.5b" ], "max_tokens": 32768, @@ -13531,7 +13165,6 @@ { "name": "qwen/qwen-audio-chat", "alias": [ - "Qwen/Qwen-Audio-Chat", "qwen-audio-chat" ], "max_tokens": 2048, @@ -13545,7 +13178,6 @@ { "name": "qwen/qwen-audio", "alias": [ - "Qwen/Qwen-Audio", "qwen-audio" ], "max_tokens": 2048, @@ -13558,7 +13190,6 @@ { "name": "qwen/qwen-72b-chat-int8", "alias": [ - "Qwen/Qwen-72B-Chat-Int8", "qwen-72b-chat-int8" ], "max_tokens": 32768, @@ -13569,7 +13200,6 @@ { "name": "qwen/qwen-72b-chat-int4", "alias": [ - "Qwen/Qwen-72B-Chat-Int4", "qwen-72b-chat-int4" ], "max_tokens": 32768, @@ -13580,7 +13210,6 @@ { "name": "qwen/qwen-1_8b-chat-int4", "alias": [ - "Qwen/Qwen-1_8B-Chat-Int4", "qwen-1_8b-chat-int4" ], "max_tokens": 8192, @@ -13591,7 +13220,6 @@ { "name": "qwen/qwen-1_8b-chat-int8", "alias": [ - "Qwen/Qwen-1_8B-Chat-Int8", "qwen-1_8b-chat-int8" ], "max_tokens": 8192, @@ -13602,7 +13230,6 @@ { "name": "qwen/qwen-1_8b", "alias": [ - "Qwen/Qwen-1_8B", "qwen-1_8b" ], "max_tokens": 8192, @@ -13613,7 +13240,6 @@ { "name": "qwen/qwen-72b-chat", "alias": [ - "Qwen/Qwen-72B-Chat", "qwen-72b-chat" ], "max_tokens": 32768, @@ -13624,7 +13250,6 @@ { "name": "qwen/qwen-72b", "alias": [ - "Qwen/Qwen-72B", "qwen-72b" ], "max_tokens": 32768, @@ -13635,7 +13260,6 @@ { "name": "qwen/qwen-14b-chat-int8", "alias": [ - "Qwen/Qwen-14B-Chat-Int8", "qwen-14b-chat-int8" ], "max_tokens": 8192, @@ -13646,7 +13270,6 @@ { "name": "qwen/qwen-7b-chat-int8", "alias": [ - "Qwen/Qwen-7B-Chat-Int8", "qwen-7b-chat-int8" ], "max_tokens": 32768, @@ -13657,7 +13280,6 @@ { "name": "qwen/qwen-14b", "alias": [ - "Qwen/Qwen-14B", "qwen-14b" ], "max_tokens": 8192, @@ -13668,7 +13290,6 @@ { "name": "qwen/qwen-14b-chat", "alias": [ - "Qwen/Qwen-14B-Chat", "qwen-14b-chat" ], "max_tokens": 8192, @@ -13679,7 +13300,6 @@ { "name": "qwen/qwen-14b-chat-int4", "alias": [ - "Qwen/Qwen-14B-Chat-Int4", "qwen-14b-chat-int4" ], "max_tokens": 8192, @@ -13690,7 +13310,6 @@ { "name": "qwen/qwen-vl-chat-int4", "alias": [ - "Qwen/Qwen-VL-Chat-Int4", "qwen-vl-chat-int4" ], "max_tokens": 8192, @@ -13701,7 +13320,6 @@ { "name": "qwen/qwen-7b-chat-int4", "alias": [ - "Qwen/Qwen-7B-Chat-Int4", "qwen-7b-chat-int4" ], "max_tokens": 32768, @@ -13712,7 +13330,6 @@ { "name": "qwen/qwen-vl-chat", "alias": [ - "Qwen/Qwen-VL-Chat", "qwen-vl-chat" ], "max_tokens": 8192, @@ -13723,7 +13340,6 @@ { "name": "qwen/qwen-vl", "alias": [ - "Qwen/Qwen-VL", "qwen-vl" ], "max_tokens": 8192, @@ -13734,7 +13350,6 @@ { "name": "qwen/qwen-7b-chat", "alias": [ - "Qwen/Qwen-7B-Chat", "qwen-7b-chat" ], "max_tokens": 32768, @@ -13745,7 +13360,6 @@ { "name": "qwen/qwen-7b", "alias": [ - "Qwen/Qwen-7B", "qwen-7b" ], "max_tokens": 32768, @@ -13756,7 +13370,6 @@ { "name": "qwen/qwen-tokenizer", "alias": [ - "Qwen/Qwen-tokenizer", "qwen-tokenizer" ], "model_types": [ @@ -13766,18 +13379,21 @@ { "name": "paddleocr-vl-0.9b", "alias": [ - "paddleocr-vl-1.5" + "paddleocr-vl-1.5", + "PaddlePaddle/PaddleOCR-VL-0.9B" ], "model_types": [ - "ocr" - ] + "ocr", + "chat", + "image2text", + "vision" + ], + "max_tokens": 16384 }, { "name": "baichuan-inc/baichuan-m3-235b-q4_k_m-gguf", "alias": [ - "baichuan-inc/Baichuan-M3-235B-Q4_K_M-GGUF", - "Baichuan-M3-235B-Q4_K_M-GGUF", - "baichuan-m3-235b-q4_k_m-gguf" + "Baichuan-M3-235B-Q4_K_M-GGUF" ], "max_tokens": 131072, "model_types": [ @@ -13791,9 +13407,7 @@ { "name": "baichuan-inc/baichuan-m2-32b-q4_k_m-gguf", "alias": [ - "baichuan-inc/Baichuan-M2-32B-Q4_K_M-GGUF", - "Baichuan-M2-32B-Q4_K_M-GGUF", - "baichuan-m2-32b-q4_k_m-gguf" + "Baichuan-M2-32B-Q4_K_M-GGUF" ], "max_tokens": 131072, "model_types": [ @@ -13807,9 +13421,7 @@ { "name": "baichuan-inc/baichuan-m3-235b-gptq-int4", "alias": [ - "baichuan-inc/Baichuan-M3-235B-GPTQ-INT4", - "Baichuan-M3-235B-GPTQ-INT4", - "baichuan-m3-235b-gptq-int4" + "Baichuan-M3-235B-GPTQ-INT4" ], "max_tokens": 131072, "model_types": [ @@ -13823,9 +13435,7 @@ { "name": "baichuan-inc/baichuan-m3-235b-fp8", "alias": [ - "baichuan-inc/Baichuan-M3-235B-FP8", - "Baichuan-M3-235B-FP8", - "baichuan-m3-235b-fp8" + "Baichuan-M3-235B-FP8" ], "max_tokens": 131072, "model_types": [ @@ -13839,9 +13449,7 @@ { "name": "baichuan-inc/baichuan-m3-235b", "alias": [ - "baichuan-inc/Baichuan-M3-235B", - "Baichuan-M3-235B", - "baichuan-m3-235b" + "Baichuan-M3-235B" ], "max_tokens": 131072, "model_types": [ @@ -13855,9 +13463,9 @@ { "name": "baichuan-inc/baichuan-m2-32b", "alias": [ - "baichuan-inc/Baichuan-M2-32B", "Baichuan-M2-32B", - "baichuan-m2-32b" + "baichuan/baichuan-m2-32b", + "BaiChuan M2 32B" ], "max_tokens": 131072, "model_types": [ @@ -13866,14 +13474,13 @@ "thinking": { "default_value": true, "clear_thinking": true - } + }, + "max_completion_tokens": 131072 }, { "name": "baichuan-inc/baichuan-m2-32b-gptq-int4", "alias": [ - "baichuan-inc/Baichuan-M2-32B-GPTQ-Int4", - "Baichuan-M2-32B-GPTQ-Int4", - "baichuan-m2-32b-gptq-int4" + "Baichuan-M2-32B-GPTQ-Int4" ], "max_tokens": 131072, "model_types": [ @@ -13887,9 +13494,7 @@ { "name": "baichuan-inc/baichuanmed-ocr-7b", "alias": [ - "baichuan-inc/BaichuanMed-OCR-7B", - "BaichuanMed-OCR-7B", - "baichuanmed-ocr-7b" + "BaichuanMed-OCR-7B" ], "max_tokens": 32768, "model_types": [ @@ -13901,9 +13506,7 @@ { "name": "baichuan-inc/baichuanmed-ocr-72b", "alias": [ - "baichuan-inc/BaichuanMed-OCR-72B", - "BaichuanMed-OCR-72B", - "baichuanmed-ocr-72b" + "BaichuanMed-OCR-72B" ], "max_tokens": 32768, "model_types": [ @@ -13915,9 +13518,7 @@ { "name": "baichuan-inc/baichuan-audio-base", "alias": [ - "baichuan-inc/Baichuan-Audio-Base", - "Baichuan-Audio-Base", - "baichuan-audio-base" + "Baichuan-Audio-Base" ], "max_tokens": 32768, "model_types": [ @@ -13929,9 +13530,7 @@ { "name": "baichuan-inc/baichuan-audio-instruct", "alias": [ - "baichuan-inc/Baichuan-Audio-Instruct", - "Baichuan-Audio-Instruct", - "baichuan-audio-instruct" + "Baichuan-Audio-Instruct" ], "max_tokens": 32768, "model_types": [ @@ -13944,9 +13543,7 @@ { "name": "baichuan-inc/baichuan-m1-14b-instruct", "alias": [ - "baichuan-inc/Baichuan-M1-14B-Instruct", - "Baichuan-M1-14B-Instruct", - "baichuan-m1-14b-instruct" + "Baichuan-M1-14B-Instruct" ], "max_tokens": 32768, "model_types": [ @@ -13956,9 +13553,7 @@ { "name": "baichuan-inc/baichuan-m1-14b-base", "alias": [ - "baichuan-inc/Baichuan-M1-14B-Base", - "Baichuan-M1-14B-Base", - "baichuan-m1-14b-base" + "Baichuan-M1-14B-Base" ], "max_tokens": 32768, "model_types": [ @@ -13968,9 +13563,7 @@ { "name": "baichuan-inc/baichuan-omni-1d5-base", "alias": [ - "baichuan-inc/Baichuan-Omni-1d5-Base", "Baichuan-Omni-1d5-Base", - "baichuan-omni-1d5-base", "Baichuan-Omni-1.5-Base" ], "max_tokens": 32768, @@ -13987,9 +13580,7 @@ { "name": "baichuan-inc/baichuan-omni-1d5", "alias": [ - "baichuan-inc/Baichuan-Omni-1d5", "Baichuan-Omni-1d5", - "baichuan-omni-1d5", "Baichuan-Omni-1.5" ], "max_tokens": 32768, @@ -14006,9 +13597,7 @@ { "name": "baichuan-inc/baichuan2-13b-chat", "alias": [ - "baichuan-inc/Baichuan2-13B-Chat", - "Baichuan2-13B-Chat", - "baichuan2-13b-chat" + "Baichuan2-13B-Chat" ], "max_tokens": 4096, "model_types": [ @@ -14018,9 +13607,7 @@ { "name": "baichuan-inc/baichuan2-7b-chat", "alias": [ - "baichuan-inc/Baichuan2-7B-Chat", - "Baichuan2-7B-Chat", - "baichuan2-7b-chat" + "Baichuan2-7B-Chat" ], "max_tokens": 4096, "model_types": [ @@ -14030,9 +13617,7 @@ { "name": "baichuan-inc/baichuan2-7b-base", "alias": [ - "baichuan-inc/Baichuan2-7B-Base", - "Baichuan2-7B-Base", - "baichuan2-7b-base" + "Baichuan2-7B-Base" ], "max_tokens": 4096, "model_types": [ @@ -14042,9 +13627,7 @@ { "name": "baichuan-inc/baichuan-13b-chat", "alias": [ - "baichuan-inc/Baichuan-13B-Chat", - "Baichuan-13B-Chat", - "baichuan-13b-chat" + "Baichuan-13B-Chat" ], "max_tokens": 4096, "model_types": [ @@ -14054,9 +13637,7 @@ { "name": "baichuan-inc/baichuan-7b", "alias": [ - "baichuan-inc/Baichuan-7B", - "Baichuan-7B", - "baichuan-7b" + "Baichuan-7B" ], "max_tokens": 4096, "model_types": [ @@ -14066,9 +13647,7 @@ { "name": "baichuan-inc/baichuan2-13b-chat-4bits", "alias": [ - "baichuan-inc/Baichuan2-13B-Chat-4bits", - "Baichuan2-13B-Chat-4bits", - "baichuan2-13b-chat-4bits" + "Baichuan2-13B-Chat-4bits" ], "max_tokens": 4096, "model_types": [ @@ -14078,9 +13657,7 @@ { "name": "baichuan-inc/baichuan2-7b-chat-4bits", "alias": [ - "baichuan-inc/Baichuan2-7B-Chat-4bits", - "Baichuan2-7B-Chat-4bits", - "baichuan2-7b-chat-4bits" + "Baichuan2-7B-Chat-4bits" ], "max_tokens": 4096, "model_types": [ @@ -14090,9 +13667,7 @@ { "name": "baichuan-inc/baichuan2-13b-base", "alias": [ - "baichuan-inc/Baichuan2-13B-Base", - "Baichuan2-13B-Base", - "baichuan2-13b-base" + "Baichuan2-13B-Base" ], "max_tokens": 4096, "model_types": [ @@ -14102,9 +13677,7 @@ { "name": "baichuan-inc/baichuan2-7b-intermediate-checkpoints", "alias": [ - "baichuan-inc/Baichuan2-7B-Intermediate-Checkpoints", - "Baichuan2-7B-Intermediate-Checkpoints", - "baichuan2-7b-intermediate-checkpoints" + "Baichuan2-7B-Intermediate-Checkpoints" ], "max_tokens": 4096, "model_types": [ @@ -14114,9 +13687,7 @@ { "name": "baichuan-inc/baichuan-13b-base", "alias": [ - "baichuan-inc/Baichuan-13B-Base", - "Baichuan-13B-Base", - "baichuan-13b-base" + "Baichuan-13B-Base" ], "max_tokens": 4096, "model_types": [ @@ -14126,7 +13697,6 @@ { "name": "baidu/nava", "alias": [ - "baidu/NAVA", "nava" ], "model_types": [ @@ -14136,7 +13706,6 @@ { "name": "baidu/ernie-image-aes", "alias": [ - "baidu/ERNIE-Image-Aes", "ernie-image-aes" ], "model_types": [ @@ -14146,7 +13715,6 @@ { "name": "baidu/ernie-image-turbo", "alias": [ - "baidu/ERNIE-Image-Turbo", "ernie-image-turbo" ], "model_types": [ @@ -14156,7 +13724,6 @@ { "name": "baidu/ernie-image", "alias": [ - "baidu/ERNIE-Image", "ernie-image" ], "model_types": [ @@ -14166,7 +13733,6 @@ { "name": "baidu/qianfan-ocr", "alias": [ - "baidu/Qianfan-OCR", "qianfan-ocr" ], "max_tokens": 32768, @@ -14179,7 +13745,6 @@ { "name": "baidu/qianfan-vl-70b", "alias": [ - "baidu/Qianfan-VL-70B", "qianfan-vl-70b" ], "max_tokens": 32768, @@ -14196,7 +13761,6 @@ { "name": "baidu/qianfan-vl-8b", "alias": [ - "baidu/Qianfan-VL-8B", "qianfan-vl-8b" ], "max_tokens": 32768, @@ -14213,7 +13777,6 @@ { "name": "baidu/qianfan-vl-3b", "alias": [ - "baidu/Qianfan-VL-3B", "qianfan-vl-3b" ], "max_tokens": 32768, @@ -14226,7 +13789,6 @@ { "name": "baidu/ernie-4.5-vl-28b-a3b-pt", "alias": [ - "baidu/ERNIE-4.5-VL-28B-A3B-PT", "ernie-4.5-vl-28b-a3b-pt" ], "max_tokens": 131072, @@ -14240,7 +13802,6 @@ { "name": "baidu/ernie-4.5-vl-28b-a3b-thinking", "alias": [ - "baidu/ERNIE-4.5-VL-28B-A3B-Thinking", "ernie-4.5-vl-28b-a3b-thinking" ], "max_tokens": 131072, @@ -14253,12 +13814,12 @@ "thinking": { "default_value": true, "clear_thinking": true - } + }, + "max_completion_tokens": 65536 }, { "name": "baidu/ernie-4.5-vl-28b-a3b-base-pt", "alias": [ - "baidu/ERNIE-4.5-VL-28B-A3B-Base-PT", "ernie-4.5-vl-28b-a3b-base-pt" ], "max_tokens": 131072, @@ -14270,7 +13831,6 @@ { "name": "baidu/ernie-4.5-vl-424b-a47b-pt", "alias": [ - "baidu/ERNIE-4.5-VL-424B-A47B-PT", "ernie-4.5-vl-424b-a47b-pt" ], "max_tokens": 131072, @@ -14284,7 +13844,6 @@ { "name": "baidu/ernie-4.5-vl-424b-a47b-base-pt", "alias": [ - "baidu/ERNIE-4.5-VL-424B-A47B-Base-PT", "ernie-4.5-vl-424b-a47b-base-pt" ], "max_tokens": 131072, @@ -14296,7 +13855,6 @@ { "name": "baidu/ernie-4.5-21b-a3b-base-pt", "alias": [ - "baidu/ERNIE-4.5-21B-A3B-Base-PT", "ernie-4.5-21b-a3b-base-pt" ], "max_tokens": 131072, @@ -14307,7 +13865,6 @@ { "name": "baidu/ernie-4.5-300b-a47b-base-pt", "alias": [ - "baidu/ERNIE-4.5-300B-A47B-Base-PT", "ernie-4.5-300b-a47b-base-pt" ], "max_tokens": 131072, @@ -14318,7 +13875,6 @@ { "name": "baidu/ernie-4.5-21b-a3b-thinking", "alias": [ - "baidu/ERNIE-4.5-21B-A3B-Thinking", "ernie-4.5-21b-a3b-thinking" ], "max_tokens": 131072, @@ -14328,12 +13884,12 @@ "thinking": { "default_value": true, "clear_thinking": true - } + }, + "max_completion_tokens": 65536 }, { "name": "baidu/ernie-4.5-21b-a3b-pt", "alias": [ - "baidu/ERNIE-4.5-21B-A3B-PT", "ernie-4.5-21b-a3b-pt" ], "max_tokens": 131072, @@ -14344,7 +13900,6 @@ { "name": "baidu/ernie-4.5-300b-a47b-pt", "alias": [ - "baidu/ERNIE-4.5-300B-A47B-PT", "ernie-4.5-300b-a47b-pt" ], "max_tokens": 131072, @@ -14355,7 +13910,6 @@ { "name": "baidu/ernie-4.5-300b-a47b-2bits-paddle", "alias": [ - "baidu/ERNIE-4.5-300B-A47B-2Bits-Paddle", "ernie-4.5-300b-a47b-2bits-paddle" ], "max_tokens": 131072, @@ -14366,7 +13920,6 @@ { "name": "baidu/ernie-4.5-300b-a47b-2bits-tp4-paddle", "alias": [ - "baidu/ERNIE-4.5-300B-A47B-2Bits-TP4-Paddle", "ernie-4.5-300b-a47b-2bits-tp4-paddle" ], "max_tokens": 131072, @@ -14377,7 +13930,6 @@ { "name": "baidu/ernie-4.5-300b-a47b-2bits-tp2-paddle", "alias": [ - "baidu/ERNIE-4.5-300B-A47B-2Bits-TP2-Paddle", "ernie-4.5-300b-a47b-2bits-tp2-paddle" ], "max_tokens": 131072, @@ -14388,7 +13940,6 @@ { "name": "baidu/ernie-4.5-21b-a3b-paddle", "alias": [ - "baidu/ERNIE-4.5-21B-A3B-Paddle", "ernie-4.5-21b-a3b-paddle" ], "max_tokens": 131072, @@ -14399,18 +13950,18 @@ { "name": "baidu/ernie-4.5-300b-a47b-paddle", "alias": [ - "baidu/ERNIE-4.5-300B-A47B-Paddle", - "ernie-4.5-300b-a47b-paddle" + "ernie-4.5-300b-a47b-paddle", + "ERNIE 4.5 300B A47B" ], "max_tokens": 131072, "model_types": [ "chat" - ] + ], + "max_completion_tokens": 12000 }, { "name": "baidu/ernie-4.5-300b-a47b-base-paddle", "alias": [ - "baidu/ERNIE-4.5-300B-A47B-Base-Paddle", "ernie-4.5-300b-a47b-base-paddle" ], "max_tokens": 131072, @@ -14421,7 +13972,6 @@ { "name": "baidu/ernie-4.5-300b-a47b-fp8-paddle", "alias": [ - "baidu/ERNIE-4.5-300B-A47B-FP8-Paddle", "ernie-4.5-300b-a47b-fp8-paddle" ], "max_tokens": 131072, @@ -14432,7 +13982,6 @@ { "name": "baidu/ernie-4.5-300b-a47b-w4a8c8-tp4-paddle", "alias": [ - "baidu/ERNIE-4.5-300B-A47B-W4A8C8-TP4-Paddle", "ernie-4.5-300b-a47b-w4a8c8-tp4-paddle" ], "max_tokens": 131072, @@ -14443,7 +13992,6 @@ { "name": "baidu/ernie-4.5-0.3b-base-pt", "alias": [ - "baidu/ERNIE-4.5-0.3B-Base-PT", "ernie-4.5-0.3b-base-pt" ], "max_tokens": 131072, @@ -14454,7 +14002,6 @@ { "name": "baidu/ernie-4.5-0.3b-pt", "alias": [ - "baidu/ERNIE-4.5-0.3B-PT", "ernie-4.5-0.3b-pt" ], "max_tokens": 131072, @@ -14465,7 +14012,6 @@ { "name": "baidu/ernie-4.5-vl-424b-a47b-paddle", "alias": [ - "baidu/ERNIE-4.5-VL-424B-A47B-Paddle", "ernie-4.5-vl-424b-a47b-paddle" ], "max_tokens": 131072, @@ -14479,7 +14025,6 @@ { "name": "baidu/ernie-4.5-vl-28b-a3b-base-paddle", "alias": [ - "baidu/ERNIE-4.5-VL-28B-A3B-Base-Paddle", "ernie-4.5-vl-28b-a3b-base-paddle" ], "max_tokens": 131072, @@ -14491,7 +14036,6 @@ { "name": "baidu/ernie-4.5-21b-a3b-base-paddle", "alias": [ - "baidu/ERNIE-4.5-21B-A3B-Base-Paddle", "ernie-4.5-21b-a3b-base-paddle" ], "max_tokens": 131072, @@ -14502,7 +14046,6 @@ { "name": "baidu/ernie-4.5-vl-28b-a3b-paddle", "alias": [ - "baidu/ERNIE-4.5-VL-28B-A3B-Paddle", "ernie-4.5-vl-28b-a3b-paddle" ], "max_tokens": 131072, @@ -14516,7 +14059,6 @@ { "name": "baidu/ernie-4.5-0.3b-base-paddle", "alias": [ - "baidu/ERNIE-4.5-0.3B-Base-Paddle", "ernie-4.5-0.3b-base-paddle" ], "max_tokens": 131072, @@ -14527,7 +14069,6 @@ { "name": "baidu/ernie-4.5-0.3b-paddle", "alias": [ - "baidu/ERNIE-4.5-0.3B-Paddle", "ernie-4.5-0.3b-paddle" ], "max_tokens": 131072, @@ -14538,7 +14079,6 @@ { "name": "baidu/ernie-4.5-vl-424b-a47b-base-paddle", "alias": [ - "baidu/ERNIE-4.5-VL-424B-A47B-Base-Paddle", "ernie-4.5-vl-424b-a47b-base-paddle" ], "max_tokens": 131072, @@ -14552,14 +14092,33 @@ "max_tokens": 1048576, "model_types": [ "chat" - ] + ], + "alias": [ + "XiaomiMiMo/MiMo-V2.5-Pro" + ], + "max_completion_tokens": 131072, + "thinking": { + "default_value": true, + "clear_thinking": true + } }, { "name": "mimo-v2.5", "max_tokens": 1048576, "model_types": [ - "chat" - ] + "chat", + "image2text", + "vision", + "video_generation" + ], + "alias": [ + "XiaomiMiMo/MiMo-V2.5" + ], + "max_completion_tokens": 131072, + "thinking": { + "default_value": true, + "clear_thinking": true + } }, { "name": "mimo-v2.5-asr", @@ -14572,6 +14131,9 @@ "name": "mimo-v2.5-tts", "model_types": [ "tts" + ], + "alias": [ + "XiaomiMiMo/MiMo-V2.5-tts" ] }, { @@ -14583,9 +14145,7 @@ { "name": "meituan-longcat/longcat-video-avatar-1.5", "alias": [ - "meituan-longcat/LongCat-Video-Avatar-1.5", - "LongCat-Video-Avatar-1.5", - "longcat-video-avatar-1.5" + "LongCat-Video-Avatar-1.5" ], "model_types": [ "video_generation" @@ -14594,9 +14154,7 @@ { "name": "meituan-longcat/wbench-weights", "alias": [ - "meituan-longcat/WBench-weights", - "WBench-weights", - "wbench-weights" + "WBench-weights" ], "model_types": [ "other" @@ -14605,9 +14163,7 @@ { "name": "meituan-longcat/longcat-next", "alias": [ - "meituan-longcat/LongCat-Next", - "LongCat-Next", - "longcat-next" + "LongCat-Next" ], "model_types": [ "chat", @@ -14622,9 +14178,7 @@ { "name": "meituan-longcat/longcat-audiodit-1b", "alias": [ - "meituan-longcat/LongCat-AudioDiT-1B", - "LongCat-AudioDiT-1B", - "longcat-audiodit-1b" + "LongCat-AudioDiT-1B" ], "model_types": [ "audio_generation" @@ -14633,9 +14187,7 @@ { "name": "meituan-longcat/longcat-audiodit-3.5b", "alias": [ - "meituan-longcat/LongCat-AudioDiT-3.5B", - "LongCat-AudioDiT-3.5B", - "longcat-audiodit-3.5b" + "LongCat-AudioDiT-3.5B" ], "model_types": [ "audio_generation" @@ -14644,9 +14196,7 @@ { "name": "meituan-longcat/longcat-flash-prover", "alias": [ - "meituan-longcat/LongCat-Flash-Prover", - "LongCat-Flash-Prover", - "longcat-flash-prover" + "LongCat-Flash-Prover" ], "max_tokens": 131072, "model_types": [ @@ -14660,9 +14210,7 @@ { "name": "meituan-longcat/longcat-flash-lite-fp8", "alias": [ - "meituan-longcat/LongCat-Flash-Lite-FP8", - "LongCat-Flash-Lite-FP8", - "longcat-flash-lite-fp8" + "LongCat-Flash-Lite-FP8" ], "max_tokens": 262144, "model_types": [ @@ -14672,9 +14220,7 @@ { "name": "meituan-longcat/longcat-flash-lite", "alias": [ - "meituan-longcat/LongCat-Flash-Lite", - "LongCat-Flash-Lite", - "longcat-flash-lite" + "LongCat-Flash-Lite" ], "max_tokens": 262144, "model_types": [ @@ -14684,9 +14230,7 @@ { "name": "meituan-longcat/longcat-image-edit-turbo", "alias": [ - "meituan-longcat/LongCat-Image-Edit-Turbo", - "LongCat-Image-Edit-Turbo", - "longcat-image-edit-turbo" + "LongCat-Image-Edit-Turbo" ], "model_types": [ "image_edit" @@ -14695,9 +14239,7 @@ { "name": "meituan-longcat/longcat-flash-thinking-zigzag", "alias": [ - "meituan-longcat/LongCat-Flash-Thinking-ZigZag", - "LongCat-Flash-Thinking-ZigZag", - "longcat-flash-thinking-zigzag" + "LongCat-Flash-Thinking-ZigZag" ], "max_tokens": 262144, "model_types": [ @@ -14711,9 +14253,7 @@ { "name": "meituan-longcat/longcat-flash-thinking-2601-fp8", "alias": [ - "meituan-longcat/LongCat-Flash-Thinking-2601-FP8", - "LongCat-Flash-Thinking-2601-FP8", - "longcat-flash-thinking-2601-fp8" + "LongCat-Flash-Thinking-2601-FP8" ], "max_tokens": 131072, "model_types": [ @@ -14727,9 +14267,7 @@ { "name": "meituan-longcat/longcat-flash-thinking-2601", "alias": [ - "meituan-longcat/LongCat-Flash-Thinking-2601", - "LongCat-Flash-Thinking-2601", - "longcat-flash-thinking-2601" + "LongCat-Flash-Thinking-2601" ], "max_tokens": 131072, "model_types": [ @@ -14743,9 +14281,7 @@ { "name": "meituan-longcat/longcat-heavymode-summary", "alias": [ - "meituan-longcat/LongCat-HeavyMode-Summary", - "LongCat-HeavyMode-Summary", - "longcat-heavymode-summary" + "LongCat-HeavyMode-Summary" ], "max_tokens": 131072, "model_types": [ @@ -14759,9 +14295,7 @@ { "name": "meituan-longcat/longcat-video-avatar", "alias": [ - "meituan-longcat/LongCat-Video-Avatar", - "LongCat-Video-Avatar", - "longcat-video-avatar" + "LongCat-Video-Avatar" ], "model_types": [ "video_generation" @@ -14770,9 +14304,7 @@ { "name": "meituan-longcat/longcat-image", "alias": [ - "meituan-longcat/LongCat-Image", - "LongCat-Image", - "longcat-image" + "LongCat-Image" ], "model_types": [ "image" @@ -14781,9 +14313,7 @@ { "name": "meituan-longcat/longcat-image-edit", "alias": [ - "meituan-longcat/LongCat-Image-Edit", - "LongCat-Image-Edit", - "longcat-image-edit" + "LongCat-Image-Edit" ], "model_types": [ "image_edit" @@ -14792,9 +14322,7 @@ { "name": "meituan-longcat/longcat-image-dev", "alias": [ - "meituan-longcat/LongCat-Image-Dev", - "LongCat-Image-Dev", - "longcat-image-dev" + "LongCat-Image-Dev" ], "model_types": [ "image" @@ -14803,9 +14331,7 @@ { "name": "meituan-longcat/longcat-flash-omni", "alias": [ - "meituan-longcat/LongCat-Flash-Omni", - "LongCat-Flash-Omni", - "longcat-flash-omni" + "LongCat-Flash-Omni" ], "max_tokens": 131072, "model_types": [ @@ -14821,9 +14347,7 @@ { "name": "meituan-longcat/longcat-flash-omni-fp8", "alias": [ - "meituan-longcat/LongCat-Flash-Omni-FP8", - "LongCat-Flash-Omni-FP8", - "longcat-flash-omni-fp8" + "LongCat-Flash-Omni-FP8" ], "max_tokens": 131072, "model_types": [ @@ -14839,9 +14363,7 @@ { "name": "meituan-longcat/longcat-video", "alias": [ - "meituan-longcat/LongCat-Video", - "LongCat-Video", - "longcat-video" + "LongCat-Video" ], "model_types": [ "video_generation" @@ -14850,9 +14372,7 @@ { "name": "meituan-longcat/longcat-audio-codec", "alias": [ - "meituan-longcat/LongCat-Audio-Codec", - "LongCat-Audio-Codec", - "longcat-audio-codec" + "LongCat-Audio-Codec" ], "model_types": [ "audio_codec" @@ -14861,9 +14381,7 @@ { "name": "meituan-longcat/longcat-flash-thinking-fp8", "alias": [ - "meituan-longcat/LongCat-Flash-Thinking-FP8", - "LongCat-Flash-Thinking-FP8", - "longcat-flash-thinking-fp8" + "LongCat-Flash-Thinking-FP8" ], "max_tokens": 131072, "model_types": [ @@ -14877,9 +14395,7 @@ { "name": "meituan-longcat/longcat-flash-thinking", "alias": [ - "meituan-longcat/LongCat-Flash-Thinking", - "LongCat-Flash-Thinking", - "longcat-flash-thinking" + "LongCat-Flash-Thinking" ], "max_tokens": 131072, "model_types": [ @@ -14893,9 +14409,7 @@ { "name": "meituan-longcat/longcat-flash-chat-fp8", "alias": [ - "meituan-longcat/LongCat-Flash-Chat-FP8", - "LongCat-Flash-Chat-FP8", - "longcat-flash-chat-fp8" + "LongCat-Flash-Chat-FP8" ], "max_tokens": 131072, "model_types": [ @@ -14905,9 +14419,7 @@ { "name": "meituan-longcat/longcat-flash-chat", "alias": [ - "meituan-longcat/LongCat-Flash-Chat", - "LongCat-Flash-Chat", - "longcat-flash-chat" + "LongCat-Flash-Chat" ], "max_tokens": 131072, "model_types": [ @@ -15181,9 +14693,7 @@ { "name": "jinaai/jina-embeddings-v5-omni-small-text-matching-gguf", "alias": [ - "jinaai/jina-embeddings-v5-omni-small-text-matching-GGUF", - "jina-embeddings-v5-omni-small-text-matching-GGUF", - "jina-embeddings-v5-omni-small-text-matching-gguf" + "jina-embeddings-v5-omni-small-text-matching-GGUF" ], "max_dimension": 1024, "dimensions": [ @@ -15205,9 +14715,7 @@ { "name": "jinaai/jina-embeddings-v5-omni-small-clustering-gguf", "alias": [ - "jinaai/jina-embeddings-v5-omni-small-clustering-GGUF", - "jina-embeddings-v5-omni-small-clustering-GGUF", - "jina-embeddings-v5-omni-small-clustering-gguf" + "jina-embeddings-v5-omni-small-clustering-GGUF" ], "max_dimension": 1024, "dimensions": [ @@ -15229,9 +14737,7 @@ { "name": "jinaai/jina-embeddings-v5-omni-small-classification-gguf", "alias": [ - "jinaai/jina-embeddings-v5-omni-small-classification-GGUF", - "jina-embeddings-v5-omni-small-classification-GGUF", - "jina-embeddings-v5-omni-small-classification-gguf" + "jina-embeddings-v5-omni-small-classification-GGUF" ], "max_dimension": 1024, "dimensions": [ @@ -15253,9 +14759,7 @@ { "name": "jinaai/jina-embeddings-v5-omni-small-retrieval-gguf", "alias": [ - "jinaai/jina-embeddings-v5-omni-small-retrieval-GGUF", - "jina-embeddings-v5-omni-small-retrieval-GGUF", - "jina-embeddings-v5-omni-small-retrieval-gguf" + "jina-embeddings-v5-omni-small-retrieval-GGUF" ], "max_dimension": 1024, "dimensions": [ @@ -15277,9 +14781,7 @@ { "name": "jinaai/jina-embeddings-v5-omni-nano-text-matching-gguf", "alias": [ - "jinaai/jina-embeddings-v5-omni-nano-text-matching-GGUF", - "jina-embeddings-v5-omni-nano-text-matching-GGUF", - "jina-embeddings-v5-omni-nano-text-matching-gguf" + "jina-embeddings-v5-omni-nano-text-matching-GGUF" ], "max_dimension": 1024, "dimensions": [ @@ -15301,9 +14803,7 @@ { "name": "jinaai/jina-embeddings-v5-omni-nano-clustering-gguf", "alias": [ - "jinaai/jina-embeddings-v5-omni-nano-clustering-GGUF", - "jina-embeddings-v5-omni-nano-clustering-GGUF", - "jina-embeddings-v5-omni-nano-clustering-gguf" + "jina-embeddings-v5-omni-nano-clustering-GGUF" ], "max_dimension": 1024, "dimensions": [ @@ -15325,9 +14825,7 @@ { "name": "jinaai/jina-embeddings-v5-omni-nano-classification-gguf", "alias": [ - "jinaai/jina-embeddings-v5-omni-nano-classification-GGUF", - "jina-embeddings-v5-omni-nano-classification-GGUF", - "jina-embeddings-v5-omni-nano-classification-gguf" + "jina-embeddings-v5-omni-nano-classification-GGUF" ], "max_dimension": 1024, "dimensions": [ @@ -15349,9 +14847,7 @@ { "name": "jinaai/jina-embeddings-v5-omni-nano-retrieval-gguf", "alias": [ - "jinaai/jina-embeddings-v5-omni-nano-retrieval-GGUF", - "jina-embeddings-v5-omni-nano-retrieval-GGUF", - "jina-embeddings-v5-omni-nano-retrieval-gguf" + "jina-embeddings-v5-omni-nano-retrieval-GGUF" ], "max_dimension": 1024, "dimensions": [ @@ -15907,9 +15403,7 @@ { "name": "jinaai/jina-embeddings-v5-text-nano-classification-gguf", "alias": [ - "jinaai/jina-embeddings-v5-text-nano-classification-GGUF", - "jina-embeddings-v5-text-nano-classification-GGUF", - "jina-embeddings-v5-text-nano-classification-gguf" + "jina-embeddings-v5-text-nano-classification-GGUF" ], "max_dimension": 1024, "dimensions": [ @@ -15929,9 +15423,7 @@ { "name": "jinaai/jina-embeddings-v5-text-nano-clustering-gguf", "alias": [ - "jinaai/jina-embeddings-v5-text-nano-clustering-GGUF", - "jina-embeddings-v5-text-nano-clustering-GGUF", - "jina-embeddings-v5-text-nano-clustering-gguf" + "jina-embeddings-v5-text-nano-clustering-GGUF" ], "max_dimension": 1024, "dimensions": [ @@ -15951,9 +15443,7 @@ { "name": "jinaai/jina-embeddings-v5-text-nano-retrieval-gguf", "alias": [ - "jinaai/jina-embeddings-v5-text-nano-retrieval-GGUF", - "jina-embeddings-v5-text-nano-retrieval-GGUF", - "jina-embeddings-v5-text-nano-retrieval-gguf" + "jina-embeddings-v5-text-nano-retrieval-GGUF" ], "max_dimension": 1024, "dimensions": [ @@ -15973,9 +15463,7 @@ { "name": "jinaai/jina-embeddings-v5-text-nano-text-matching-gguf", "alias": [ - "jinaai/jina-embeddings-v5-text-nano-text-matching-GGUF", - "jina-embeddings-v5-text-nano-text-matching-GGUF", - "jina-embeddings-v5-text-nano-text-matching-gguf" + "jina-embeddings-v5-text-nano-text-matching-GGUF" ], "max_dimension": 1024, "dimensions": [ @@ -16229,9 +15717,7 @@ { "name": "jinaai/jina-embeddings-v5-text-small-retrieval-gguf", "alias": [ - "jinaai/jina-embeddings-v5-text-small-retrieval-GGUF", - "jina-embeddings-v5-text-small-retrieval-GGUF", - "jina-embeddings-v5-text-small-retrieval-gguf" + "jina-embeddings-v5-text-small-retrieval-GGUF" ], "max_dimension": 1024, "dimensions": [ @@ -16251,9 +15737,7 @@ { "name": "jinaai/jina-embeddings-v5-text-small-classification-gguf", "alias": [ - "jinaai/jina-embeddings-v5-text-small-classification-GGUF", - "jina-embeddings-v5-text-small-classification-GGUF", - "jina-embeddings-v5-text-small-classification-gguf" + "jina-embeddings-v5-text-small-classification-GGUF" ], "max_dimension": 1024, "dimensions": [ @@ -16273,9 +15757,7 @@ { "name": "jinaai/jina-embeddings-v5-text-small-clustering-gguf", "alias": [ - "jinaai/jina-embeddings-v5-text-small-clustering-GGUF", - "jina-embeddings-v5-text-small-clustering-GGUF", - "jina-embeddings-v5-text-small-clustering-gguf" + "jina-embeddings-v5-text-small-clustering-GGUF" ], "max_dimension": 1024, "dimensions": [ @@ -16295,9 +15777,7 @@ { "name": "jinaai/jina-embeddings-v5-text-small-text-matching-gguf", "alias": [ - "jinaai/jina-embeddings-v5-text-small-text-matching-GGUF", - "jina-embeddings-v5-text-small-text-matching-GGUF", - "jina-embeddings-v5-text-small-text-matching-gguf" + "jina-embeddings-v5-text-small-text-matching-GGUF" ], "max_dimension": 1024, "dimensions": [ @@ -16339,9 +15819,7 @@ { "name": "jinaai/jina-reranker-v3-gguf", "alias": [ - "jinaai/jina-reranker-v3-GGUF", - "jina-reranker-v3-GGUF", - "jina-reranker-v3-gguf" + "jina-reranker-v3-GGUF" ], "model_types": [ "rerank" @@ -16395,9 +15873,7 @@ { "name": "jinaai/jina-embeddings-v4-text-matching-gguf", "alias": [ - "jinaai/jina-embeddings-v4-text-matching-GGUF", - "jina-embeddings-v4-text-matching-GGUF", - "jina-embeddings-v4-text-matching-gguf" + "jina-embeddings-v4-text-matching-GGUF" ], "max_dimension": 2048, "dimensions": [ @@ -16415,9 +15891,7 @@ { "name": "jinaai/jina-embeddings-v4-text-code-gguf", "alias": [ - "jinaai/jina-embeddings-v4-text-code-GGUF", - "jina-embeddings-v4-text-code-GGUF", - "jina-embeddings-v4-text-code-gguf" + "jina-embeddings-v4-text-code-GGUF" ], "max_dimension": 2048, "dimensions": [ @@ -16435,9 +15909,7 @@ { "name": "jinaai/jina-embeddings-v4-text-retrieval-gguf", "alias": [ - "jinaai/jina-embeddings-v4-text-retrieval-GGUF", - "jina-embeddings-v4-text-retrieval-GGUF", - "jina-embeddings-v4-text-retrieval-gguf" + "jina-embeddings-v4-text-retrieval-GGUF" ], "max_dimension": 2048, "dimensions": [ @@ -16494,9 +15966,7 @@ { "name": "jinaai/jina-code-embeddings-1.5b-gguf", "alias": [ - "jinaai/jina-code-embeddings-1.5b-GGUF", - "jina-code-embeddings-1.5b-GGUF", - "jina-code-embeddings-1.5b-gguf" + "jina-code-embeddings-1.5b-GGUF" ], "max_dimension": 1024, "dimensions": [ @@ -16513,9 +15983,7 @@ { "name": "jinaai/jina-code-embeddings-0.5b-gguf", "alias": [ - "jinaai/jina-code-embeddings-0.5b-GGUF", - "jina-code-embeddings-0.5b-GGUF", - "jina-code-embeddings-0.5b-gguf" + "jina-code-embeddings-0.5b-GGUF" ], "max_dimension": 1024, "dimensions": [ @@ -16570,9 +16038,7 @@ { "name": "jinaai/jina-reranker-m0-gguf", "alias": [ - "jinaai/jina-reranker-m0-GGUF", - "jina-reranker-m0-GGUF", - "jina-reranker-m0-gguf" + "jina-reranker-m0-GGUF" ], "model_types": [ "rerank" @@ -16601,9 +16067,7 @@ { "name": "jinaai/readerlm-v2", "alias": [ - "jinaai/ReaderLM-v2", - "ReaderLM-v2", - "readerlm-v2" + "ReaderLM-v2" ], "max_tokens": 256000, "model_types": [ @@ -16869,9 +16333,7 @@ { "name": "jinaai/phi-3-tiny-untrained", "alias": [ - "jinaai/Phi-3-tiny-untrained", - "Phi-3-tiny-untrained", - "phi-3-tiny-untrained" + "Phi-3-tiny-untrained" ], "model_types": [ "chat" @@ -16998,12 +16460,14 @@ ], "max_tokens": 131072, "model_types": [ - "chat" + "chat", + "moderation" ], "thinking": { "default_value": true, "clear_thinking": true - } + }, + "max_completion_tokens": 65536 }, { "name": "openai/circuit-sparsity", @@ -17031,30 +16495,40 @@ { "name": "openai/gpt-oss-20b", "alias": [ - "gpt-oss-20b" + "gpt-oss-20b", + "OpenAI: GPT OSS 20B", + "OpenAI GPT-OSS 20B" ], "max_tokens": 131072, "model_types": [ - "chat" + "chat", + "vision", + "image2text" ], "thinking": { "default_value": true, "clear_thinking": true - } + }, + "max_completion_tokens": 65536 }, { "name": "openai/gpt-oss-120b", "alias": [ - "gpt-oss-120b" + "gpt-oss-120b", + "OpenAI GPT OSS 120B", + "OpenAI GPT-OSS 120B" ], "max_tokens": 131072, "model_types": [ - "chat" + "chat", + "vision", + "image2text" ], "thinking": { "default_value": true, "clear_thinking": true - } + }, + "max_completion_tokens": 65536 }, { "name": "openai/whisper-large-v3-turbo", @@ -17062,17 +16536,24 @@ "whisper-large-v3-turbo" ], "model_types": [ - "asr" - ] + "asr", + "speech2text" + ], + "max_tokens": 448, + "max_completion_tokens": 448 }, { "name": "openai/whisper-large-v3", "alias": [ - "whisper-large-v3" + "whisper-large-v3", + "Whisper large-v3" ], "model_types": [ - "asr" - ] + "asr", + "speech2text" + ], + "max_tokens": 448, + "max_completion_tokens": 448 }, { "name": "openai/whisper-large-v2", @@ -17125,7 +16606,8 @@ "whisper-base" ], "model_types": [ - "asr" + "asr", + "speech2text" ] }, { @@ -17139,7 +16621,8 @@ ], "model_types": [ "embedding", - "vision" + "vision", + "image_understanding" ] }, { @@ -17148,7 +16631,8 @@ "whisper-medium.en" ], "model_types": [ - "asr" + "asr", + "speech2text" ] }, { @@ -17157,7 +16641,8 @@ "whisper-small.en" ], "model_types": [ - "asr" + "asr", + "speech2text" ] }, { @@ -17166,7 +16651,8 @@ "whisper-tiny.en" ], "model_types": [ - "asr" + "asr", + "speech2text" ] }, { @@ -17175,7 +16661,8 @@ "whisper-base.en" ], "model_types": [ - "asr" + "asr", + "speech2text" ] }, { @@ -17371,12 +16858,16 @@ ], "model_types": [ "embedding", - "vision" + "vision", + "image_understanding" ] }, { "name": "gpt-5.4", "alias": [ + "gpt-5.4-2026-03-05", + "openai/gpt-5.4", + "openai/gpt-5.4-2026-03-05" ], "max_tokens": 1050000, "model_types": [ @@ -17389,17 +16880,21 @@ }, { "name": "gpt-image-2", - "alias": [ - ], "model_types": [ "image", - "image_edit" + "image_edit", + "chat", + "text-to-image", + "image_generation" + ], + "alias": [ + "openai/gpt-image-2", + "gpt-image-2-all", + "GPT Image 2" ] }, { "name": "gpt-5.1", - "alias": [ - ], "max_tokens": 400000, "model_types": [ "chat" @@ -17407,12 +16902,15 @@ "thinking": { "default_value": true, "clear_thinking": true - } + }, + "alias": [ + "gpt-5.1-thinking-all", + "gpt-5.1-all", + "openai/gpt-5.1" + ] }, { "name": "gpt-5.2", - "alias": [ - ], "max_tokens": 400000, "model_types": [ "chat" @@ -17420,12 +16918,14 @@ "thinking": { "default_value": true, "clear_thinking": true - } + }, + "alias": [ + "gpt-5.2-all", + "openai/gpt-5.2" + ] }, { "name": "gpt-5.4-mini", - "alias": [ - ], "max_tokens": 400000, "model_types": [ "chat" @@ -17433,12 +16933,13 @@ "thinking": { "default_value": true, "clear_thinking": true - } + }, + "alias": [ + "openai/gpt-5.4-mini" + ] }, { "name": "gpt-5", - "alias": [ - ], "max_tokens": 400000, "model_types": [ "chat" @@ -17446,12 +16947,14 @@ "thinking": { "default_value": true, "clear_thinking": true - } + }, + "alias": [ + "gpt-5-all", + "openai/gpt-5" + ] }, { "name": "gpt-5-codex", - "alias": [ - ], "max_tokens": 400000, "model_types": [ "chat" @@ -17459,12 +16962,13 @@ "thinking": { "default_value": true, "clear_thinking": true - } + }, + "alias": [ + "openai/gpt-5-codex" + ] }, { "name": "gpt-5.3-codex", - "alias": [ - ], "max_tokens": 400000, "model_types": [ "chat" @@ -17472,12 +16976,13 @@ "thinking": { "default_value": true, "clear_thinking": true - } + }, + "alias": [ + "openai/gpt-5.3-codex" + ] }, { "name": "gpt-5.1-codex", - "alias": [ - ], "max_tokens": 400000, "model_types": [ "chat" @@ -17485,12 +16990,13 @@ "thinking": { "default_value": true, "clear_thinking": true - } + }, + "alias": [ + "openai/gpt-5.1-codex" + ] }, { "name": "gpt-5.3-codex-spark", - "alias": [ - ], "model_types": [ "chat" ], @@ -17501,8 +17007,6 @@ }, { "name": "gpt-5-codex-mini", - "alias": [ - ], "model_types": [ "chat" ], @@ -17513,8 +17017,6 @@ }, { "name": "gpt-5.1-codex-max", - "alias": [ - ], "max_tokens": 400000, "model_types": [ "chat" @@ -17526,8 +17028,6 @@ }, { "name": "gpt-5.5", - "alias": [ - ], "max_tokens": 1050000, "model_types": [ "chat" @@ -17535,12 +17035,13 @@ "thinking": { "default_value": true, "clear_thinking": true - } + }, + "alias": [ + "openai/gpt-5.5" + ] }, { "name": "gpt-5.1-codex-mini", - "alias": [ - ], "max_tokens": 400000, "model_types": [ "chat" @@ -17548,12 +17049,13 @@ "thinking": { "default_value": true, "clear_thinking": true - } + }, + "alias": [ + "openai/gpt-5.1-codex-mini" + ] }, { "name": "gpt-5.2-codex", - "alias": [ - ], "max_tokens": 400000, "model_types": [ "chat" @@ -17561,12 +17063,16 @@ "thinking": { "default_value": true, "clear_thinking": true - } + }, + "alias": [ + "openai/gpt-5.2-codex" + ] }, { "name": "claude-fable-5", "alias": [ - "anthropic.claude-fable-5" + "anthropic.claude-fable-5", + "anthropic/claude-fable-5" ], "max_tokens": 1000000, "model_types": [ @@ -17580,8 +17086,6 @@ }, { "name": "claude-mythos-5", - "alias": [ - ], "max_tokens": 1000000, "model_types": [ "chat", @@ -17595,12 +17099,17 @@ { "name": "claude-opus-4-8", "alias": [ - "anthropic.claude-opus-4-8" + "anthropic.claude-opus-4-8", + "anthropic/claude-opus-4-8", + "anthropic/claude-opus-4.8", + "claude-opus-4.8" ], "max_tokens": 1000000, "model_types": [ "chat", - "vision" + "vision", + "image2text", + "ocr" ], "thinking": { "default_value": true, @@ -17625,12 +17134,17 @@ { "name": "claude-sonnet-4-6", "alias": [ - "anthropic.claude-sonnet-4-6" + "anthropic.claude-sonnet-4-6", + "anthropic/claude-sonnet-4-6", + "anthropic/claude-sonnet-4.6", + "claude-sonnet-4.6" ], "max_tokens": 1000000, "model_types": [ "chat", - "vision" + "vision", + "image2text", + "ocr" ], "thinking": { "default_value": true, @@ -17640,7 +17154,10 @@ { "name": "claude-sonnet-4-5", "alias": [ - "anthropic.claude-sonnet-4-5" + "anthropic.claude-sonnet-4-5", + "anthropic/claude-sonnet-4-5", + "anthropic/claude-sonnet-4.5", + "claude-sonnet-4.5" ], "max_tokens": 1000000, "model_types": [ @@ -17656,12 +17173,18 @@ "name": "claude-haiku-4-5-20251001", "alias": [ "claude-haiku-4-5", - "anthropic.claude-haiku-4-5-20251001-v1:0" + "anthropic.claude-haiku-4-5-20251001-v1:0", + "anthropic/claude-haiku-4-5", + "anthropic/claude-haiku-4-5-20251001", + "anthropic/claude-haiku-4.5", + "claude-haiku-4.5" ], "max_tokens": 200000, "model_types": [ "chat", - "vision" + "vision", + "image2text", + "ocr" ], "thinking": { "default_value": true, @@ -17671,25 +17194,30 @@ { "name": "moonshotai/kimi-k2.6", "alias": [ - "moonshotai/Kimi-K2.6", - "kimi-k2.6" + "kimi-k2.6", + "Kimi K2.6", + "kimi/kimi-k2.6", + "Kimi K2.6 Fp4" ], "model_types": [ "chat", "vision", - "image2text" + "image2text", + "video_generation" ], "max_tokens": 262144, "thinking": { "default_value": true, "clear_thinking": true - } + }, + "max_completion_tokens": 262144 }, { "name": "moonshotai/kimi-k2.5", "alias": [ - "moonshotai/Kimi-K2.5", - "kimi-k2.5" + "kimi-k2.5", + "Kimi K2.5", + "kimi/kimi-k2.5" ], "model_types": [ "chat", @@ -17700,13 +17228,14 @@ "thinking": { "default_value": true, "clear_thinking": true - } + }, + "max_completion_tokens": 262144 }, { "name": "moonshotai/kimi-k2-instruct", "alias": [ - "moonshotai/Kimi-K2-Instruct", - "kimi-k2-instruct" + "kimi-k2-instruct", + "Kimi K2 Instruct" ], "model_types": [ "chat" @@ -17715,12 +17244,12 @@ "thinking": { "default_value": true, "clear_thinking": true - } + }, + "max_completion_tokens": 32768 }, { "name": "moonshotai/kimi-vl-a3b-thinking-2506", "alias": [ - "moonshotai/Kimi-VL-A3B-Thinking-2506", "kimi-vl-a3b-thinking-2506" ], "model_types": [ @@ -17737,7 +17266,6 @@ { "name": "moonshotai/kimi-vl-a3b-thinking", "alias": [ - "moonshotai/Kimi-VL-A3B-Thinking", "kimi-vl-a3b-thinking" ], "model_types": [ @@ -17754,7 +17282,6 @@ { "name": "moonshotai/moonlight-16b-a3b-instruct", "alias": [ - "moonshotai/Moonlight-16B-A3B-Instruct", "moonlight-16b-a3b-instruct" ], "model_types": [ @@ -17769,7 +17296,6 @@ { "name": "moonshotai/kimi-k2-base", "alias": [ - "moonshotai/Kimi-K2-Base", "kimi-k2-base" ], "model_types": [ @@ -17780,7 +17306,6 @@ { "name": "moonshotai/moonlight-16b-a3b", "alias": [ - "moonshotai/Moonlight-16B-A3B", "moonlight-16b-a3b" ], "model_types": [ @@ -17791,7 +17316,6 @@ { "name": "moonshotai/kimi-vl-a3b-instruct", "alias": [ - "moonshotai/Kimi-VL-A3B-Instruct", "kimi-vl-a3b-instruct" ], "model_types": [ @@ -17804,7 +17328,6 @@ { "name": "moonshotai/kimi-linear-48b-a3b-base", "alias": [ - "moonshotai/Kimi-Linear-48B-A3B-Base", "kimi-linear-48b-a3b-base" ], "model_types": [ @@ -17815,7 +17338,6 @@ { "name": "moonshotai/kimi-k2-instruct-0905", "alias": [ - "moonshotai/Kimi-K2-Instruct-0905", "kimi-k2-instruct-0905" ], "model_types": [ @@ -17830,7 +17352,6 @@ { "name": "moonshotai/kimi-linear-48b-a3b-instruct", "alias": [ - "moonshotai/Kimi-Linear-48B-A3B-Instruct", "kimi-linear-48b-a3b-instruct" ], "model_types": [ @@ -17845,7 +17366,6 @@ { "name": "moonshotai/kimi-dev-72b", "alias": [ - "moonshotai/Kimi-Dev-72B", "kimi-dev-72b" ], "model_types": [ @@ -17860,7 +17380,6 @@ { "name": "moonshotai/kimi-audio-7b-instruct", "alias": [ - "moonshotai/Kimi-Audio-7B-Instruct", "kimi-audio-7b-instruct" ], "model_types": [ @@ -17872,7 +17391,6 @@ { "name": "moonshotai/kimi-audio-7b", "alias": [ - "moonshotai/Kimi-Audio-7B", "kimi-audio-7b" ], "model_types": [ @@ -17884,7 +17402,6 @@ { "name": "moonshotai/moonvit-so-400m", "alias": [ - "moonshotai/MoonViT-SO-400M", "moonvit-so-400m" ], "model_types": [ @@ -17895,9 +17412,10 @@ { "name": "minimaxai/minimax-m2.7", "alias": [ - "minimaxai/MiniMax-M2.7", "minimax-m2.7", - "minimax/minimax-m2.7" + "minimax/minimax-m2.7", + "MiniMax M2.7", + "MiniMax M2.7 FP4" ], "model_types": [ "chat" @@ -17906,14 +17424,15 @@ "thinking": { "default_value": true, "clear_thinking": true - } + }, + "max_completion_tokens": 131072 }, { "name": "minimaxai/minimax-m2.5", "alias": [ - "minimaxai/MiniMax-M2.5", "minimax-m2.5", - "minimax/minimax-m2.5" + "minimax/minimax-m2.5", + "MiniMax M2.5" ], "model_types": [ "chat" @@ -17922,14 +17441,15 @@ "thinking": { "default_value": true, "clear_thinking": true - } + }, + "max_completion_tokens": 131100 }, { "name": "minimaxai/minimax-m2.1", "alias": [ - "minimaxai/MiniMax-M2.1", "minimax-m2.1", - "minimax/minimax-m2.1" + "minimax/minimax-m2.1", + "Minimax M2.1" ], "model_types": [ "chat" @@ -17938,14 +17458,15 @@ "thinking": { "default_value": true, "clear_thinking": true - } + }, + "max_completion_tokens": 131072 }, { "name": "minimaxai/minimax-m2", "alias": [ - "minimaxai/MiniMax-M2", "minimax-m2", - "minimax/minimax-m2" + "minimax/minimax-m2", + "MiniMax M2" ], "model_types": [ "chat" @@ -17954,12 +17475,12 @@ "thinking": { "default_value": true, "clear_thinking": true - } + }, + "max_completion_tokens": 131072 }, { "name": "minimaxai/vtp-large-f16d64", "alias": [ - "minimaxai/VTP-Large-f16d64", "vtp-large-f16d64" ], "model_types": [ @@ -17975,7 +17496,6 @@ { "name": "minimaxai/vtp-base-f16d64", "alias": [ - "minimaxai/VTP-Base-f16d64", "vtp-base-f16d64" ], "model_types": [ @@ -17991,7 +17511,6 @@ { "name": "minimaxai/vtp-small-f16d64", "alias": [ - "minimaxai/VTP-Small-f16d64", "vtp-small-f16d64" ], "model_types": [ @@ -18007,7 +17526,6 @@ { "name": "minimaxai/minimax-m1-40k-hf", "alias": [ - "minimaxai/MiniMax-M1-40k-hf", "minimax-m1-40k-hf" ], "model_types": [ @@ -18022,7 +17540,6 @@ { "name": "minimaxai/minimax-text-01-hf", "alias": [ - "minimaxai/MiniMax-Text-01-hf", "minimax-text-01-hf" ], "model_types": [ @@ -18037,7 +17554,6 @@ { "name": "minimaxai/minimax-m1-80k-hf", "alias": [ - "minimaxai/MiniMax-M1-80k-hf", "minimax-m1-80k-hf" ], "model_types": [ @@ -18052,8 +17568,9 @@ { "name": "minimaxai/minimax-m1-80k", "alias": [ - "minimaxai/MiniMax-M1-80k", - "minimax-m1-80k" + "minimax-m1-80k", + "MiniMax M1", + "Minimax M1 80K" ], "model_types": [ "chat" @@ -18062,13 +17579,14 @@ "thinking": { "default_value": true, "clear_thinking": true - } + }, + "max_completion_tokens": 40000 }, { "name": "minimaxai/minimax-m1-40k", "alias": [ - "minimaxai/MiniMax-M1-40k", - "minimax-m1-40k" + "minimax-m1-40k", + "Minimax M1 40K" ], "model_types": [ "chat" @@ -18082,7 +17600,6 @@ { "name": "minimaxai/minimax-text-01", "alias": [ - "minimaxai/MiniMax-Text-01", "minimax-text-01" ], "model_types": [ @@ -18097,7 +17614,6 @@ { "name": "minimaxai/minimax-vl-01", "alias": [ - "minimaxai/MiniMax-VL-01", "minimax-vl-01" ], "model_types": [ @@ -18114,7 +17630,6 @@ { "name": "minimaxai/synlogic-32b", "alias": [ - "minimaxai/SynLogic-32B", "synlogic-32b" ], "model_types": [ @@ -18129,7 +17644,6 @@ { "name": "minimaxai/synlogic-7b", "alias": [ - "minimaxai/SynLogic-7B", "synlogic-7b" ], "model_types": [ @@ -18144,7 +17658,6 @@ { "name": "minimaxai/synlogic-mix-3-32b", "alias": [ - "minimaxai/SynLogic-Mix-3-32B", "synlogic-mix-3-32b" ], "model_types": [ @@ -18175,7 +17688,8 @@ { "name": "stepfun-ai/Step-3.7-Flash", "alias": [ - "Step-3.7-Flash" + "Step-3.7-Flash", + "stepfun/step-3.7-flash" ], "model_types": [ "chat", @@ -18186,7 +17700,8 @@ "thinking": { "default_value": true, "clear_thinking": true - } + }, + "max_completion_tokens": 256000 }, { "name": "stepfun-ai/Step-3.7-Flash-NVFP4", @@ -18223,7 +17738,8 @@ { "name": "stepfun-ai/Step-3.5-Flash", "alias": [ - "Step-3.5-Flash" + "Step-3.5-Flash", + "step-3.5-flash-2603" ], "model_types": [ "chat" @@ -18566,9 +18082,7 @@ { "name": "tencent/hy-mt2-1.8b-1.25bit-gguf", "alias": [ - "tencent/Hy-MT2-1.8B-1.25Bit-GGUF", - "Hy-MT2-1.8B-1.25Bit-GGUF", - "hy-mt2-1.8b-1.25bit-gguf" + "Hy-MT2-1.8B-1.25Bit-GGUF" ], "max_tokens": 262144, "model_types": [ @@ -18579,9 +18093,7 @@ { "name": "tencent/hy-mt1.5-1.8b-1.25bit-gguf", "alias": [ - "tencent/Hy-MT1.5-1.8B-1.25bit-GGUF", - "Hy-MT1.5-1.8B-1.25bit-GGUF", - "hy-mt1.5-1.8b-1.25bit-gguf" + "Hy-MT1.5-1.8B-1.25bit-GGUF" ], "max_tokens": 262144, "model_types": [ @@ -18592,9 +18104,7 @@ { "name": "tencent/universal_audio_tokenizer", "alias": [ - "tencent/Universal_Audio_Tokenizer", - "Universal_Audio_Tokenizer", - "universal_audio_tokenizer" + "Universal_Audio_Tokenizer" ], "model_types": [ "audio_codec" @@ -18603,9 +18113,7 @@ { "name": "tencent/hy-mt1.5-7b", "alias": [ - "tencent/HY-MT1.5-7B", - "HY-MT1.5-7B", - "hy-mt1.5-7b" + "HY-MT1.5-7B" ], "max_tokens": 262144, "model_types": [ @@ -18616,9 +18124,7 @@ { "name": "tencent/hy-mt1.5-1.8b-1.25bit", "alias": [ - "tencent/Hy-MT1.5-1.8B-1.25bit", - "Hy-MT1.5-1.8B-1.25bit", - "hy-mt1.5-1.8b-1.25bit" + "Hy-MT1.5-1.8B-1.25bit" ], "max_tokens": 262144, "model_types": [ @@ -18629,9 +18135,7 @@ { "name": "tencent/hy-mt2-1.8b-2bit-gguf", "alias": [ - "tencent/Hy-MT2-1.8B-2Bit-GGUF", - "Hy-MT2-1.8B-2Bit-GGUF", - "hy-mt2-1.8b-2bit-gguf" + "Hy-MT2-1.8B-2Bit-GGUF" ], "max_tokens": 262144, "model_types": [ @@ -18642,9 +18146,7 @@ { "name": "tencent/hy-mt2-7b-gguf", "alias": [ - "tencent/Hy-MT2-7B-GGUF", - "Hy-MT2-7B-GGUF", - "hy-mt2-7b-gguf" + "Hy-MT2-7B-GGUF" ], "max_tokens": 262144, "model_types": [ @@ -18655,9 +18157,7 @@ { "name": "tencent/hy-mt2-1.8b-gguf", "alias": [ - "tencent/Hy-MT2-1.8B-GGUF", - "Hy-MT2-1.8B-GGUF", - "hy-mt2-1.8b-gguf" + "Hy-MT2-1.8B-GGUF" ], "max_tokens": 262144, "model_types": [ @@ -18668,9 +18168,7 @@ { "name": "tencent/hy-mt2-30b-a3b-fp8", "alias": [ - "tencent/Hy-MT2-30B-A3B-FP8", - "Hy-MT2-30B-A3B-FP8", - "hy-mt2-30b-a3b-fp8" + "Hy-MT2-30B-A3B-FP8" ], "max_tokens": 262144, "model_types": [ @@ -18681,9 +18179,7 @@ { "name": "tencent/hy-mt2-7b-fp8", "alias": [ - "tencent/Hy-MT2-7B-FP8", - "Hy-MT2-7B-FP8", - "hy-mt2-7b-fp8" + "Hy-MT2-7B-FP8" ], "max_tokens": 262144, "model_types": [ @@ -18694,9 +18190,7 @@ { "name": "tencent/hy-mt2-1.8b-fp8", "alias": [ - "tencent/Hy-MT2-1.8B-FP8", - "Hy-MT2-1.8B-FP8", - "hy-mt2-1.8b-fp8" + "Hy-MT2-1.8B-FP8" ], "max_tokens": 262144, "model_types": [ @@ -18707,9 +18201,7 @@ { "name": "tencent/hy-mt2-1.8b", "alias": [ - "tencent/Hy-MT2-1.8B", - "Hy-MT2-1.8B", - "hy-mt2-1.8b" + "Hy-MT2-1.8B" ], "max_tokens": 262144, "model_types": [ @@ -18720,9 +18212,7 @@ { "name": "tencent/hy-mt2-7b", "alias": [ - "tencent/Hy-MT2-7B", - "Hy-MT2-7B", - "hy-mt2-7b" + "Hy-MT2-7B" ], "max_tokens": 262144, "model_types": [ @@ -18733,9 +18223,7 @@ { "name": "tencent/hy-mt2-30b-a3b", "alias": [ - "tencent/Hy-MT2-30B-A3B", - "Hy-MT2-30B-A3B", - "hy-mt2-30b-a3b" + "Hy-MT2-30B-A3B" ], "max_tokens": 262144, "model_types": [ @@ -18746,9 +18234,7 @@ { "name": "tencent/hy-world-2.0", "alias": [ - "tencent/HY-World-2.0", - "HY-World-2.0", - "hy-world-2.0" + "HY-World-2.0" ], "model_types": [ "3d_generation" @@ -18757,9 +18243,7 @@ { "name": "tencent/hy-omniweaving", "alias": [ - "tencent/HY-OmniWeaving", - "HY-OmniWeaving", - "hy-omniweaving" + "HY-OmniWeaving" ], "model_types": [ "video_generation" @@ -18768,9 +18252,7 @@ { "name": "tencent/hy-mt1.5-1.8b-2bit", "alias": [ - "tencent/Hy-MT1.5-1.8B-2bit", - "Hy-MT1.5-1.8B-2bit", - "hy-mt1.5-1.8b-2bit" + "Hy-MT1.5-1.8B-2bit" ], "max_tokens": 262144, "model_types": [ @@ -18781,9 +18263,7 @@ { "name": "tencent/hy-mt1.5-1.8b-2bit-gguf", "alias": [ - "tencent/Hy-MT1.5-1.8B-2bit-GGUF", - "Hy-MT1.5-1.8B-2bit-GGUF", - "hy-mt1.5-1.8b-2bit-gguf" + "Hy-MT1.5-1.8B-2bit-GGUF" ], "max_tokens": 262144, "model_types": [ @@ -18794,9 +18274,7 @@ { "name": "tencent/points-seeker", "alias": [ - "tencent/POINTS-Seeker", - "POINTS-Seeker", - "points-seeker" + "POINTS-Seeker" ], "max_tokens": 262144, "model_types": [ @@ -18812,9 +18290,7 @@ { "name": "tencent/hy-embodied-0.5-x", "alias": [ - "tencent/HY-Embodied-0.5-X", - "HY-Embodied-0.5-X", - "hy-embodied-0.5-x" + "HY-Embodied-0.5-X" ], "max_tokens": 262144, "model_types": [ @@ -18826,9 +18302,7 @@ { "name": "tencent/hy3-preview-base", "alias": [ - "tencent/Hy3-preview-Base", - "Hy3-preview-Base", - "hy3-preview-base" + "Hy3-preview-Base" ], "max_tokens": 262144, "model_types": [ @@ -18838,9 +18312,7 @@ { "name": "tencent/hy3-preview", "alias": [ - "tencent/Hy3-preview", - "Hy3-preview", - "hy3-preview" + "Hy3-preview" ], "max_tokens": 262144, "model_types": [ @@ -18854,9 +18326,7 @@ { "name": "tencent/unified_audio_schema", "alias": [ - "tencent/Unified_Audio_Schema", - "Unified_Audio_Schema", - "unified_audio_schema" + "Unified_Audio_Schema" ], "max_tokens": 262144, "model_types": [ @@ -18868,9 +18338,7 @@ { "name": "tencent/disca", "alias": [ - "tencent/DisCa", - "DisCa", - "disca" + "DisCa" ], "model_types": [ "other" @@ -18879,9 +18347,7 @@ { "name": "tencent/hy-embodied-0.5", "alias": [ - "tencent/HY-Embodied-0.5", - "HY-Embodied-0.5", - "hy-embodied-0.5" + "HY-Embodied-0.5" ], "max_tokens": 262144, "model_types": [ @@ -18893,9 +18359,7 @@ { "name": "tencent/unicom-unified-multimodal-modeling-via-compressed-continuous-semantic-representations", "alias": [ - "tencent/Unicom-Unified-Multimodal-Modeling-via-Compressed-Continuous-Semantic-Representations", - "Unicom-Unified-Multimodal-Modeling-via-Compressed-Continuous-Semantic-Representations", - "unicom-unified-multimodal-modeling-via-compressed-continuous-semantic-representations" + "Unicom-Unified-Multimodal-Modeling-via-Compressed-Continuous-Semantic-Representations" ], "model_types": [ "image" @@ -18904,9 +18368,7 @@ { "name": "tencent/sequential-hidden-decoding-8b-n8-instruct", "alias": [ - "tencent/Sequential-Hidden-Decoding-8B-n8-Instruct", - "Sequential-Hidden-Decoding-8B-n8-Instruct", - "sequential-hidden-decoding-8b-n8-instruct" + "Sequential-Hidden-Decoding-8B-n8-Instruct" ], "max_tokens": 262144, "model_types": [ @@ -18916,9 +18378,7 @@ { "name": "tencent/versavit", "alias": [ - "tencent/VersaViT", - "VersaViT", - "versavit" + "VersaViT" ], "model_types": [ "vision" @@ -18927,9 +18387,7 @@ { "name": "tencent/covo-audio-chat", "alias": [ - "tencent/Covo-Audio-Chat", - "Covo-Audio-Chat", - "covo-audio-chat" + "Covo-Audio-Chat" ], "max_tokens": 262144, "model_types": [ @@ -18942,9 +18400,7 @@ { "name": "tencent/sequential-hidden-decoding-8b-n8", "alias": [ - "tencent/Sequential-Hidden-Decoding-8B-n8", - "Sequential-Hidden-Decoding-8B-n8", - "sequential-hidden-decoding-8b-n8" + "Sequential-Hidden-Decoding-8B-n8" ], "max_tokens": 262144, "model_types": [ @@ -18954,9 +18410,7 @@ { "name": "tencent/penguin-vl-2b", "alias": [ - "tencent/Penguin-VL-2B", - "Penguin-VL-2B", - "penguin-vl-2b" + "Penguin-VL-2B" ], "max_tokens": 262144, "model_types": [ @@ -18968,9 +18422,7 @@ { "name": "tencent/penguin-vl-8b", "alias": [ - "tencent/Penguin-VL-8B", - "Penguin-VL-8B", - "penguin-vl-8b" + "Penguin-VL-8B" ], "max_tokens": 262144, "model_types": [ @@ -18982,9 +18434,7 @@ { "name": "tencent/points-gui-g", "alias": [ - "tencent/POINTS-GUI-G", - "POINTS-GUI-G", - "points-gui-g" + "POINTS-GUI-G" ], "max_tokens": 262144, "model_types": [ @@ -18996,9 +18446,7 @@ { "name": "tencent/sequential-hidden-decoding-8b-n2", "alias": [ - "tencent/Sequential-Hidden-Decoding-8B-n2", - "Sequential-Hidden-Decoding-8B-n2", - "sequential-hidden-decoding-8b-n2" + "Sequential-Hidden-Decoding-8B-n2" ], "max_tokens": 262144, "model_types": [ @@ -19008,9 +18456,7 @@ { "name": "tencent/sequential-hidden-decoding-8b-n4", "alias": [ - "tencent/Sequential-Hidden-Decoding-8B-n4", - "Sequential-Hidden-Decoding-8B-n4", - "sequential-hidden-decoding-8b-n4" + "Sequential-Hidden-Decoding-8B-n4" ], "max_tokens": 262144, "model_types": [ @@ -19020,9 +18466,7 @@ { "name": "tencent/penguin-encoder", "alias": [ - "tencent/Penguin-Encoder", - "Penguin-Encoder", - "penguin-encoder" + "Penguin-Encoder" ], "model_types": [ "embedding", @@ -19032,9 +18476,7 @@ { "name": "tencent/hy-worldplay", "alias": [ - "tencent/HY-WorldPlay", - "HY-WorldPlay", - "hy-worldplay" + "HY-WorldPlay" ], "model_types": [ "video_generation" @@ -19043,9 +18485,7 @@ { "name": "tencent/hy-wu", "alias": [ - "tencent/HY-WU", - "HY-WU", - "hy-wu" + "HY-WU" ], "model_types": [ "image" @@ -19054,9 +18494,7 @@ { "name": "tencent/songgeneration", "alias": [ - "tencent/SongGeneration", - "SongGeneration", - "songgeneration" + "SongGeneration" ], "model_types": [ "audio_generation" @@ -19065,9 +18503,7 @@ { "name": "tencent/stabletoken", "alias": [ - "tencent/StableToken", - "StableToken", - "stabletoken" + "StableToken" ], "model_types": [ "audio_codec" @@ -19076,9 +18512,7 @@ { "name": "tencent/youtu-llm-2b", "alias": [ - "tencent/Youtu-LLM-2B", - "Youtu-LLM-2B", - "youtu-llm-2b" + "Youtu-LLM-2B" ], "max_tokens": 262144, "model_types": [ @@ -19088,9 +18522,7 @@ { "name": "tencent/youtu-llm-2b-base", "alias": [ - "tencent/Youtu-LLM-2B-Base", - "Youtu-LLM-2B-Base", - "youtu-llm-2b-base" + "Youtu-LLM-2B-Base" ], "max_tokens": 262144, "model_types": [ @@ -19100,9 +18532,7 @@ { "name": "tencent/youtu-vl-4b-instruct-gguf", "alias": [ - "tencent/Youtu-VL-4B-Instruct-GGUF", - "Youtu-VL-4B-Instruct-GGUF", - "youtu-vl-4b-instruct-gguf" + "Youtu-VL-4B-Instruct-GGUF" ], "max_tokens": 262144, "model_types": [ @@ -19114,9 +18544,7 @@ { "name": "tencent/youtu-vl-4b-instruct", "alias": [ - "tencent/Youtu-VL-4B-Instruct", - "Youtu-VL-4B-Instruct", - "youtu-vl-4b-instruct" + "Youtu-VL-4B-Instruct" ], "max_tokens": 262144, "model_types": [ @@ -19128,9 +18556,7 @@ { "name": "tencent/kalm-embedding-gemma3-12b-2511", "alias": [ - "tencent/KaLM-Embedding-Gemma3-12B-2511", - "KaLM-Embedding-Gemma3-12B-2511", - "kalm-embedding-gemma3-12b-2511" + "KaLM-Embedding-Gemma3-12B-2511" ], "model_types": [ "embedding" @@ -19139,9 +18565,7 @@ { "name": "tencent/hy3d-bench", "alias": [ - "tencent/HY3D-Bench", - "HY3D-Bench", - "hy3d-bench" + "HY3D-Bench" ], "model_types": [ "3d_generation" @@ -19150,9 +18574,7 @@ { "name": "tencent/youtu-hichunk", "alias": [ - "tencent/Youtu-HiChunk", - "Youtu-HiChunk", - "youtu-hichunk" + "Youtu-HiChunk" ], "model_types": [ "embedding", @@ -19162,9 +18584,7 @@ { "name": "tencent/hunyuanimage-3.0-instruct-distil", "alias": [ - "tencent/HunyuanImage-3.0-Instruct-Distil", - "HunyuanImage-3.0-Instruct-Distil", - "hunyuanimage-3.0-instruct-distil" + "HunyuanImage-3.0-Instruct-Distil" ], "model_types": [ "image_edit" @@ -19173,9 +18593,7 @@ { "name": "tencent/hunyuanimage-3.0-instruct", "alias": [ - "tencent/HunyuanImage-3.0-Instruct", - "HunyuanImage-3.0-Instruct", - "hunyuanimage-3.0-instruct" + "HunyuanImage-3.0-Instruct" ], "model_types": [ "image_edit" @@ -19184,9 +18602,7 @@ { "name": "tencent/youtu-parsing", "alias": [ - "tencent/Youtu-Parsing", - "Youtu-Parsing", - "youtu-parsing" + "Youtu-Parsing" ], "max_tokens": 262144, "model_types": [ @@ -19197,9 +18613,7 @@ { "name": "tencent/hunyuanimage-3.0", "alias": [ - "tencent/HunyuanImage-3.0", - "HunyuanImage-3.0", - "hunyuanimage-3.0" + "HunyuanImage-3.0" ], "model_types": [ "image" @@ -19208,9 +18622,7 @@ { "name": "tencent/hy-video-prfl", "alias": [ - "tencent/HY-Video-PRFL", - "HY-Video-PRFL", - "hy-video-prfl" + "HY-Video-PRFL" ], "model_types": [ "video_generation" @@ -19219,9 +18631,7 @@ { "name": "tencent/hunyuanocr", "alias": [ - "tencent/HunyuanOCR", - "HunyuanOCR", - "hunyuanocr" + "HunyuanOCR" ], "model_types": [ "ocr", @@ -19232,9 +18642,7 @@ { "name": "tencent/tcandon-router", "alias": [ - "tencent/TCAndon-Router", - "TCAndon-Router", - "tcandon-router" + "TCAndon-Router" ], "max_tokens": 262144, "model_types": [ @@ -19244,9 +18652,7 @@ { "name": "tencent/hy-mt1.5-7b-gguf", "alias": [ - "tencent/HY-MT1.5-7B-GGUF", - "HY-MT1.5-7B-GGUF", - "hy-mt1.5-7b-gguf" + "HY-MT1.5-7B-GGUF" ], "max_tokens": 262144, "model_types": [ @@ -19257,9 +18663,7 @@ { "name": "tencent/hy-mt1.5-1.8b-gguf", "alias": [ - "tencent/HY-MT1.5-1.8B-GGUF", - "HY-MT1.5-1.8B-GGUF", - "hy-mt1.5-1.8b-gguf" + "HY-MT1.5-1.8B-GGUF" ], "max_tokens": 262144, "model_types": [ @@ -19270,9 +18674,7 @@ { "name": "tencent/youtu-llm-2b-gguf", "alias": [ - "tencent/Youtu-LLM-2B-GGUF", - "Youtu-LLM-2B-GGUF", - "youtu-llm-2b-gguf" + "Youtu-LLM-2B-GGUF" ], "max_tokens": 262144, "model_types": [ @@ -19282,9 +18684,7 @@ { "name": "tencent/hy-mt1.5-7b-gptq-int4", "alias": [ - "tencent/HY-MT1.5-7B-GPTQ-Int4", - "HY-MT1.5-7B-GPTQ-Int4", - "hy-mt1.5-7b-gptq-int4" + "HY-MT1.5-7B-GPTQ-Int4" ], "max_tokens": 262144, "model_types": [ @@ -19295,9 +18695,7 @@ { "name": "tencent/hy-mt1.5-7b-fp8", "alias": [ - "tencent/HY-MT1.5-7B-FP8", - "HY-MT1.5-7B-FP8", - "hy-mt1.5-7b-fp8" + "HY-MT1.5-7B-FP8" ], "max_tokens": 262144, "model_types": [ @@ -19308,9 +18706,7 @@ { "name": "tencent/hy-mt1.5-1.8b-gptq-int4", "alias": [ - "tencent/HY-MT1.5-1.8B-GPTQ-Int4", - "HY-MT1.5-1.8B-GPTQ-Int4", - "hy-mt1.5-1.8b-gptq-int4" + "HY-MT1.5-1.8B-GPTQ-Int4" ], "max_tokens": 262144, "model_types": [ @@ -19321,9 +18717,7 @@ { "name": "tencent/hy-mt1.5-1.8b-fp8", "alias": [ - "tencent/HY-MT1.5-1.8B-FP8", - "HY-MT1.5-1.8B-FP8", - "hy-mt1.5-1.8b-fp8" + "HY-MT1.5-1.8B-FP8" ], "max_tokens": 262144, "model_types": [ @@ -19334,9 +18728,7 @@ { "name": "tencent/hy-mt1.5-1.8b", "alias": [ - "tencent/HY-MT1.5-1.8B", - "HY-MT1.5-1.8B", - "hy-mt1.5-1.8b" + "HY-MT1.5-1.8B" ], "max_tokens": 262144, "model_types": [ @@ -19347,9 +18739,7 @@ { "name": "tencent/wedlm-8b-instruct", "alias": [ - "tencent/WeDLM-8B-Instruct", - "WeDLM-8B-Instruct", - "wedlm-8b-instruct" + "WeDLM-8B-Instruct" ], "max_tokens": 262144, "model_types": [ @@ -19359,9 +18749,7 @@ { "name": "tencent/hy-motion-1.0", "alias": [ - "tencent/HY-Motion-1.0", - "HY-Motion-1.0", - "hy-motion-1.0" + "HY-Motion-1.0" ], "model_types": [ "3d_generation" @@ -19370,9 +18758,7 @@ { "name": "tencent/hunyuan-mt-7b", "alias": [ - "tencent/Hunyuan-MT-7B", - "Hunyuan-MT-7B", - "hunyuan-mt-7b" + "Hunyuan-MT-7B" ], "max_tokens": 262144, "model_types": [ @@ -19383,9 +18769,7 @@ { "name": "tencent/wedlm-7b-instruct", "alias": [ - "tencent/WeDLM-7B-Instruct", - "WeDLM-7B-Instruct", - "wedlm-7b-instruct" + "WeDLM-7B-Instruct" ], "max_tokens": 262144, "model_types": [ @@ -19395,9 +18779,7 @@ { "name": "tencent/wedlm-7b-base", "alias": [ - "tencent/WeDLM-7B-Base", - "WeDLM-7B-Base", - "wedlm-7b-base" + "WeDLM-7B-Base" ], "max_tokens": 262144, "model_types": [ @@ -19407,9 +18789,7 @@ { "name": "tencent/wedlm-8b-base", "alias": [ - "tencent/WeDLM-8B-Base", - "WeDLM-8B-Base", - "wedlm-8b-base" + "WeDLM-8B-Base" ], "max_tokens": 262144, "model_types": [ @@ -19419,9 +18799,7 @@ { "name": "tencent/hunyuanvideo-1.5", "alias": [ - "tencent/HunyuanVideo-1.5", - "HunyuanVideo-1.5", - "hunyuanvideo-1.5" + "HunyuanVideo-1.5" ], "model_types": [ "video_generation" @@ -19430,9 +18808,7 @@ { "name": "tencent/youtu-embedding", "alias": [ - "tencent/Youtu-Embedding", - "Youtu-Embedding", - "youtu-embedding" + "Youtu-Embedding" ], "model_types": [ "embedding" @@ -19441,9 +18817,7 @@ { "name": "tencent/drive-rl", "alias": [ - "tencent/DRIVE-RL", - "DRIVE-RL", - "drive-rl" + "DRIVE-RL" ], "max_tokens": 262144, "model_types": [ @@ -19457,9 +18831,7 @@ { "name": "tencent/drive-sft", "alias": [ - "tencent/DRIVE-SFT", - "DRIVE-SFT", - "drive-sft" + "DRIVE-SFT" ], "max_tokens": 262144, "model_types": [ @@ -19469,9 +18841,7 @@ { "name": "tencent/deepseek-v3.1-terminus-w4afp8", "alias": [ - "tencent/DeepSeek-V3.1-Terminus-W4AFP8", - "DeepSeek-V3.1-Terminus-W4AFP8", - "deepseek-v3.1-terminus-w4afp8" + "DeepSeek-V3.1-Terminus-W4AFP8" ], "max_tokens": 262144, "model_types": [ @@ -19485,9 +18855,7 @@ { "name": "tencent/hunyuan-4b-instruct", "alias": [ - "tencent/Hunyuan-4B-Instruct", - "Hunyuan-4B-Instruct", - "hunyuan-4b-instruct" + "Hunyuan-4B-Instruct" ], "max_tokens": 262144, "model_types": [ @@ -19497,9 +18865,7 @@ { "name": "tencent/hunyuanworld-mirror", "alias": [ - "tencent/HunyuanWorld-Mirror", - "HunyuanWorld-Mirror", - "hunyuanworld-mirror" + "HunyuanWorld-Mirror" ], "model_types": [ "3d_generation" @@ -19508,9 +18874,7 @@ { "name": "tencent/songprep-7b", "alias": [ - "tencent/SongPrep-7B", - "SongPrep-7B", - "songprep-7b" + "SongPrep-7B" ], "model_types": [ "asr" @@ -19519,9 +18883,7 @@ { "name": "tencent/hunyuanworld-1", "alias": [ - "tencent/HunyuanWorld-1", - "HunyuanWorld-1", - "hunyuanworld-1" + "HunyuanWorld-1" ], "model_types": [ "3d_generation" @@ -19530,9 +18892,7 @@ { "name": "tencent/hunyuan3d-part", "alias": [ - "tencent/Hunyuan3D-Part", - "Hunyuan3D-Part", - "hunyuan3d-part" + "Hunyuan3D-Part" ], "model_types": [ "3d_generation" @@ -19541,9 +18901,7 @@ { "name": "tencent/hunyuanworld-voyager", "alias": [ - "tencent/HunyuanWorld-Voyager", - "HunyuanWorld-Voyager", - "hunyuanworld-voyager" + "HunyuanWorld-Voyager" ], "model_types": [ "video_generation" @@ -19552,9 +18910,7 @@ { "name": "tencent/hunyuan3d-2mv", "alias": [ - "tencent/Hunyuan3D-2mv", - "Hunyuan3D-2mv", - "hunyuan3d-2mv" + "Hunyuan3D-2mv" ], "model_types": [ "3d_generation" @@ -19563,9 +18919,7 @@ { "name": "tencent/hunyuan3d-omni", "alias": [ - "tencent/Hunyuan3D-Omni", - "Hunyuan3D-Omni", - "hunyuan3d-omni" + "Hunyuan3D-Omni" ], "model_types": [ "3d_generation" @@ -19574,9 +18928,7 @@ { "name": "tencent/hunyuan3d-2mini", "alias": [ - "tencent/Hunyuan3D-2mini", - "Hunyuan3D-2mini", - "hunyuan3d-2mini" + "Hunyuan3D-2mini" ], "model_types": [ "3d_generation" @@ -19585,9 +18937,7 @@ { "name": "tencent/hunyuan3d-2.1", "alias": [ - "tencent/Hunyuan3D-2.1", - "Hunyuan3D-2.1", - "hunyuan3d-2.1" + "Hunyuan3D-2.1" ], "model_types": [ "3d_generation" @@ -19596,9 +18946,7 @@ { "name": "tencent/hunyuan3d-2", "alias": [ - "tencent/Hunyuan3D-2", - "Hunyuan3D-2", - "hunyuan3d-2" + "Hunyuan3D-2" ], "model_types": [ "3d_generation" @@ -19607,9 +18955,7 @@ { "name": "tencent/hunyuan3d-1", "alias": [ - "tencent/Hunyuan3D-1", - "Hunyuan3D-1", - "hunyuan3d-1" + "Hunyuan3D-1" ], "model_types": [ "3d_generation" @@ -19618,9 +18964,7 @@ { "name": "tencent/hunyuanimage-2.1", "alias": [ - "tencent/HunyuanImage-2.1", - "HunyuanImage-2.1", - "hunyuanimage-2.1" + "HunyuanImage-2.1" ], "model_types": [ "image" @@ -19629,9 +18973,7 @@ { "name": "tencent/hunyuanvideo-foley", "alias": [ - "tencent/HunyuanVideo-Foley", - "HunyuanVideo-Foley", - "hunyuanvideo-foley" + "HunyuanVideo-Foley" ], "model_types": [ "audio_generation" @@ -19640,9 +18982,7 @@ { "name": "tencent/srpo", "alias": [ - "tencent/SRPO", - "SRPO", - "srpo" + "SRPO" ], "model_types": [ "image" @@ -19651,9 +18991,7 @@ { "name": "tencent/points-reader", "alias": [ - "tencent/POINTS-Reader", - "POINTS-Reader", - "points-reader" + "POINTS-Reader" ], "max_tokens": 262144, "model_types": [ @@ -19664,9 +19002,7 @@ { "name": "tencent/hunyuan-mt-chimera-7b", "alias": [ - "tencent/Hunyuan-MT-Chimera-7B", - "Hunyuan-MT-Chimera-7B", - "hunyuan-mt-chimera-7b" + "Hunyuan-MT-Chimera-7B" ], "max_tokens": 262144, "model_types": [ @@ -19677,9 +19013,7 @@ { "name": "tencent/hunyuan-mt-chimera-7b-fp8", "alias": [ - "tencent/Hunyuan-MT-Chimera-7B-fp8", - "Hunyuan-MT-Chimera-7B-fp8", - "hunyuan-mt-chimera-7b-fp8" + "Hunyuan-MT-Chimera-7B-fp8" ], "max_tokens": 262144, "model_types": [ @@ -19690,9 +19024,7 @@ { "name": "tencent/hunyuan-mt-7b-fp8", "alias": [ - "tencent/Hunyuan-MT-7B-fp8", - "Hunyuan-MT-7B-fp8", - "hunyuan-mt-7b-fp8" + "Hunyuan-MT-7B-fp8" ], "max_tokens": 262144, "model_types": [ @@ -19703,9 +19035,7 @@ { "name": "tencent/hunyuan-0.5b-instruct-gptq-int4", "alias": [ - "tencent/Hunyuan-0.5B-Instruct-GPTQ-Int4", - "Hunyuan-0.5B-Instruct-GPTQ-Int4", - "hunyuan-0.5b-instruct-gptq-int4" + "Hunyuan-0.5B-Instruct-GPTQ-Int4" ], "max_tokens": 262144, "model_types": [ @@ -19715,9 +19045,7 @@ { "name": "tencent/hunyuan-7b-instruct-fp8", "alias": [ - "tencent/Hunyuan-7B-Instruct-FP8", - "Hunyuan-7B-Instruct-FP8", - "hunyuan-7b-instruct-fp8" + "Hunyuan-7B-Instruct-FP8" ], "max_tokens": 262144, "model_types": [ @@ -19727,9 +19055,7 @@ { "name": "tencent/hunyuan-7b-instruct-gptq-int4", "alias": [ - "tencent/Hunyuan-7B-Instruct-GPTQ-Int4", - "Hunyuan-7B-Instruct-GPTQ-Int4", - "hunyuan-7b-instruct-gptq-int4" + "Hunyuan-7B-Instruct-GPTQ-Int4" ], "max_tokens": 262144, "model_types": [ @@ -19739,9 +19065,7 @@ { "name": "tencent/hunyuan-7b-instruct", "alias": [ - "tencent/Hunyuan-7B-Instruct", - "Hunyuan-7B-Instruct", - "hunyuan-7b-instruct" + "Hunyuan-7B-Instruct" ], "max_tokens": 262144, "model_types": [ @@ -19751,9 +19075,7 @@ { "name": "tencent/hunyuan-7b-instruct-awq-int4", "alias": [ - "tencent/Hunyuan-7B-Instruct-AWQ-Int4", - "Hunyuan-7B-Instruct-AWQ-Int4", - "hunyuan-7b-instruct-awq-int4" + "Hunyuan-7B-Instruct-AWQ-Int4" ], "max_tokens": 262144, "model_types": [ @@ -19763,9 +19085,7 @@ { "name": "tencent/hunyuan-7b-pretrain", "alias": [ - "tencent/Hunyuan-7B-Pretrain", - "Hunyuan-7B-Pretrain", - "hunyuan-7b-pretrain" + "Hunyuan-7B-Pretrain" ], "max_tokens": 262144, "model_types": [ @@ -19775,9 +19095,7 @@ { "name": "tencent/hunyuan-4b-instruct-gptq-int4", "alias": [ - "tencent/Hunyuan-4B-Instruct-GPTQ-Int4", - "Hunyuan-4B-Instruct-GPTQ-Int4", - "hunyuan-4b-instruct-gptq-int4" + "Hunyuan-4B-Instruct-GPTQ-Int4" ], "max_tokens": 262144, "model_types": [ @@ -19787,9 +19105,7 @@ { "name": "tencent/hunyuan-4b-instruct-awq-int4", "alias": [ - "tencent/Hunyuan-4B-Instruct-AWQ-Int4", - "Hunyuan-4B-Instruct-AWQ-Int4", - "hunyuan-4b-instruct-awq-int4" + "Hunyuan-4B-Instruct-AWQ-Int4" ], "max_tokens": 262144, "model_types": [ @@ -19799,9 +19115,7 @@ { "name": "tencent/hunyuan-1.8b-instruct-gptq-int4", "alias": [ - "tencent/Hunyuan-1.8B-Instruct-GPTQ-Int4", - "Hunyuan-1.8B-Instruct-GPTQ-Int4", - "hunyuan-1.8b-instruct-gptq-int4" + "Hunyuan-1.8B-Instruct-GPTQ-Int4" ], "max_tokens": 262144, "model_types": [ @@ -19811,9 +19125,7 @@ { "name": "tencent/hunyuan-1.8b-instruct-awq-int4", "alias": [ - "tencent/Hunyuan-1.8B-Instruct-AWQ-Int4", - "Hunyuan-1.8B-Instruct-AWQ-Int4", - "hunyuan-1.8b-instruct-awq-int4" + "Hunyuan-1.8B-Instruct-AWQ-Int4" ], "max_tokens": 262144, "model_types": [ @@ -19823,9 +19135,7 @@ { "name": "tencent/hunyuan-0.5b-instruct-fp8", "alias": [ - "tencent/Hunyuan-0.5B-Instruct-FP8", - "Hunyuan-0.5B-Instruct-FP8", - "hunyuan-0.5b-instruct-fp8" + "Hunyuan-0.5B-Instruct-FP8" ], "max_tokens": 262144, "model_types": [ @@ -19835,9 +19145,7 @@ { "name": "tencent/hunyuan-1.8b-instruct-fp8", "alias": [ - "tencent/Hunyuan-1.8B-Instruct-FP8", - "Hunyuan-1.8B-Instruct-FP8", - "hunyuan-1.8b-instruct-fp8" + "Hunyuan-1.8B-Instruct-FP8" ], "max_tokens": 262144, "model_types": [ @@ -19847,9 +19155,7 @@ { "name": "tencent/hunyuan-0.5b-instruct-awq-int4", "alias": [ - "tencent/Hunyuan-0.5B-Instruct-AWQ-Int4", - "Hunyuan-0.5B-Instruct-AWQ-Int4", - "hunyuan-0.5b-instruct-awq-int4" + "Hunyuan-0.5B-Instruct-AWQ-Int4" ], "max_tokens": 262144, "model_types": [ @@ -19859,9 +19165,7 @@ { "name": "tencent/hunyuan-4b-instruct-fp8", "alias": [ - "tencent/Hunyuan-4B-Instruct-FP8", - "Hunyuan-4B-Instruct-FP8", - "hunyuan-4b-instruct-fp8" + "Hunyuan-4B-Instruct-FP8" ], "max_tokens": 262144, "model_types": [ @@ -19871,9 +19175,7 @@ { "name": "tencent/hunyuan-a13b-instruct", "alias": [ - "tencent/Hunyuan-A13B-Instruct", - "Hunyuan-A13B-Instruct", - "hunyuan-a13b-instruct" + "Hunyuan-A13B-Instruct" ], "max_tokens": 262144, "model_types": [ @@ -19883,9 +19185,7 @@ { "name": "tencent/hunyuan-gamecraft-1.0", "alias": [ - "tencent/Hunyuan-GameCraft-1.0", - "Hunyuan-GameCraft-1.0", - "hunyuan-gamecraft-1.0" + "Hunyuan-GameCraft-1.0" ], "model_types": [ "video_generation" @@ -19894,9 +19194,7 @@ { "name": "tencent/dogr", "alias": [ - "tencent/DOGR", - "DOGR", - "dogr" + "DOGR" ], "max_tokens": 262144, "model_types": [ @@ -19906,9 +19204,7 @@ { "name": "tencent/hunyuan-4b-pretrain", "alias": [ - "tencent/Hunyuan-4B-Pretrain", - "Hunyuan-4B-Pretrain", - "hunyuan-4b-pretrain" + "Hunyuan-4B-Pretrain" ], "max_tokens": 262144, "model_types": [ @@ -19918,9 +19214,7 @@ { "name": "tencent/hunyuan-1.8b-pretrain", "alias": [ - "tencent/Hunyuan-1.8B-Pretrain", - "Hunyuan-1.8B-Pretrain", - "hunyuan-1.8b-pretrain" + "Hunyuan-1.8B-Pretrain" ], "max_tokens": 262144, "model_types": [ @@ -19930,9 +19224,7 @@ { "name": "tencent/hunyuan-1.8b-instruct", "alias": [ - "tencent/Hunyuan-1.8B-Instruct", - "Hunyuan-1.8B-Instruct", - "hunyuan-1.8b-instruct" + "Hunyuan-1.8B-Instruct" ], "max_tokens": 262144, "model_types": [ @@ -19942,9 +19234,7 @@ { "name": "tencent/hunyuan-0.5b-pretrain", "alias": [ - "tencent/Hunyuan-0.5B-Pretrain", - "Hunyuan-0.5B-Pretrain", - "hunyuan-0.5b-pretrain" + "Hunyuan-0.5B-Pretrain" ], "max_tokens": 262144, "model_types": [ @@ -19954,9 +19244,7 @@ { "name": "tencent/hunyuan-0.5b-instruct", "alias": [ - "tencent/Hunyuan-0.5B-Instruct", - "Hunyuan-0.5B-Instruct", - "hunyuan-0.5b-instruct" + "Hunyuan-0.5B-Instruct" ], "max_tokens": 262144, "model_types": [ @@ -19966,9 +19254,7 @@ { "name": "tencent/depthcrafter", "alias": [ - "tencent/DepthCrafter", - "DepthCrafter", - "depthcrafter" + "DepthCrafter" ], "model_types": [ "depth_estimation" @@ -19977,9 +19263,7 @@ { "name": "tencent/hunyuan-7b-instruct-0124", "alias": [ - "tencent/Hunyuan-7B-Instruct-0124", - "Hunyuan-7B-Instruct-0124", - "hunyuan-7b-instruct-0124" + "Hunyuan-7B-Instruct-0124" ], "max_tokens": 262144, "model_types": [ @@ -19989,9 +19273,7 @@ { "name": "tencent/mimicmotion", "alias": [ - "tencent/MimicMotion", - "MimicMotion", - "mimicmotion" + "MimicMotion" ], "model_types": [ "video_generation" @@ -20000,9 +19282,7 @@ { "name": "tencent/hunyuan-a13b-instruct-gguf", "alias": [ - "tencent/Hunyuan-A13B-Instruct-GGUF", - "Hunyuan-A13B-Instruct-GGUF", - "hunyuan-a13b-instruct-gguf" + "Hunyuan-A13B-Instruct-GGUF" ], "max_tokens": 262144, "model_types": [ @@ -20012,9 +19292,7 @@ { "name": "tencent/hunyuan-a13b-instruct-gptq-int4", "alias": [ - "tencent/Hunyuan-A13B-Instruct-GPTQ-Int4", - "Hunyuan-A13B-Instruct-GPTQ-Int4", - "hunyuan-a13b-instruct-gptq-int4" + "Hunyuan-A13B-Instruct-GPTQ-Int4" ], "max_tokens": 262144, "model_types": [ @@ -20024,9 +19302,7 @@ { "name": "tencent/hunyuan-a13b-pretrain", "alias": [ - "tencent/Hunyuan-A13B-Pretrain", - "Hunyuan-A13B-Pretrain", - "hunyuan-a13b-pretrain" + "Hunyuan-A13B-Pretrain" ], "max_tokens": 262144, "model_types": [ @@ -20036,9 +19312,7 @@ { "name": "tencent/hunyuan-a13b-instruct-fp8", "alias": [ - "tencent/Hunyuan-A13B-Instruct-FP8", - "Hunyuan-A13B-Instruct-FP8", - "hunyuan-a13b-instruct-fp8" + "Hunyuan-A13B-Instruct-FP8" ], "max_tokens": 262144, "model_types": [ @@ -20048,9 +19322,7 @@ { "name": "tencent/hunyuan-7b-pretrain-0124", "alias": [ - "tencent/Hunyuan-7B-Pretrain-0124", - "Hunyuan-7B-Pretrain-0124", - "hunyuan-7b-pretrain-0124" + "Hunyuan-7B-Pretrain-0124" ], "max_tokens": 262144, "model_types": [ @@ -20060,9 +19332,7 @@ { "name": "tencent/hunyuancustom", "alias": [ - "tencent/HunyuanCustom", - "HunyuanCustom", - "hunyuancustom" + "HunyuanCustom" ], "model_types": [ "video_generation" @@ -20071,9 +19341,7 @@ { "name": "tencent/hunyuanvideo-avatar", "alias": [ - "tencent/HunyuanVideo-Avatar", - "HunyuanVideo-Avatar", - "hunyuanvideo-avatar" + "HunyuanVideo-Avatar" ], "model_types": [ "video_generation" @@ -20082,9 +19350,7 @@ { "name": "tencent/hunyuanportrait", "alias": [ - "tencent/HunyuanPortrait", - "HunyuanPortrait", - "hunyuanportrait" + "HunyuanPortrait" ], "model_types": [ "video_generation" @@ -20093,9 +19359,7 @@ { "name": "tencent/instantcharacter", "alias": [ - "tencent/InstantCharacter", - "InstantCharacter", - "instantcharacter" + "InstantCharacter" ], "model_types": [ "image" @@ -20104,9 +19368,7 @@ { "name": "tencent/hunyuanvideo-i2v", "alias": [ - "tencent/HunyuanVideo-I2V", - "HunyuanVideo-I2V", - "hunyuanvideo-i2v" + "HunyuanVideo-I2V" ], "model_types": [ "video_generation" @@ -20115,9 +19377,7 @@ { "name": "tencent/hunyuanvideo", "alias": [ - "tencent/HunyuanVideo", - "HunyuanVideo", - "hunyuanvideo" + "HunyuanVideo" ], "model_types": [ "video_generation" @@ -20126,9 +19386,7 @@ { "name": "tencent/tencent-hunyuan-large", "alias": [ - "tencent/Tencent-Hunyuan-Large", - "Tencent-Hunyuan-Large", - "tencent-hunyuan-large" + "Tencent-Hunyuan-Large" ], "max_tokens": 262144, "model_types": [ @@ -20138,9 +19396,7 @@ { "name": "tencent/hunyuanvideo-promptrewrite", "alias": [ - "tencent/HunyuanVideo-PromptRewrite", - "HunyuanVideo-PromptRewrite", - "hunyuanvideo-promptrewrite" + "HunyuanVideo-PromptRewrite" ], "max_tokens": 262144, "model_types": [ @@ -20201,8 +19457,6 @@ }, { "name": "amazon.titan-embed-text-v1", - "alias": [ - ], "max_tokens": 8192, "model_types": [ "embedding" @@ -20281,11 +19535,14 @@ { "name": "xai/grok-2-vision-1212", "alias": [ - "grok-2-vision" + "grok-2-vision", + "grok-2-vision-1212" ], "max_tokens": 131072, "model_types": [ - "chat" + "chat", + "image2text", + "vision" ] }, { @@ -20301,9 +19558,7 @@ { "name": "meta-llama/prompt-guard-86m", "alias": [ - "meta-llama/Prompt-Guard-86M", - "Prompt-Guard-86M", - "prompt-guard-86m" + "Prompt-Guard-86M" ], "model_types": [ "moderation" @@ -20312,9 +19567,8 @@ { "name": "meta-llama/meta-llama-3-8b-instruct", "alias": [ - "meta-llama/Meta-Llama-3-8B-Instruct", "Meta-Llama-3-8B-Instruct", - "meta-llama-3-8b-instruct" + "Meta Llama 3 8B Instruct" ], "max_tokens": 8192, "model_types": [ @@ -20324,9 +19578,7 @@ { "name": "meta-llama/meta-llama-3-70b-instruct", "alias": [ - "meta-llama/Meta-Llama-3-70B-Instruct", - "Meta-Llama-3-70B-Instruct", - "meta-llama-3-70b-instruct" + "Meta-Llama-3-70B-Instruct" ], "max_tokens": 8192, "model_types": [ @@ -20336,9 +19588,7 @@ { "name": "meta-llama/llama-4-maverick-17b-128e-instruct", "alias": [ - "meta-llama/Llama-4-Maverick-17B-128E-Instruct", - "Llama-4-Maverick-17B-128E-Instruct", - "llama-4-maverick-17b-128e-instruct" + "Llama-4-Maverick-17B-128E-Instruct" ], "max_tokens": 1048576, "model_types": [ @@ -20350,37 +19600,38 @@ { "name": "meta-llama/llama-4-maverick-17b-128e-instruct-fp8", "alias": [ - "meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8", "Llama-4-Maverick-17B-128E-Instruct-FP8", - "llama-4-maverick-17b-128e-instruct-fp8" + "Llama 4 Maverick Instruct" ], "max_tokens": 1048576, "model_types": [ "chat", "vision", - "image2text" - ] + "image2text", + "ocr" + ], + "max_completion_tokens": 8192 }, { "name": "meta-llama/llama-4-scout-17b-16e-instruct", "alias": [ - "meta-llama/Llama-4-Scout-17B-16E-Instruct", "Llama-4-Scout-17B-16E-Instruct", - "llama-4-scout-17b-16e-instruct" + "Llama 4 Scout Instruct", + "Llama 4 Scout Instruct (17Bx16E)" ], "max_tokens": 10485760, "model_types": [ "chat", "vision", - "image2text" - ] + "image2text", + "ocr" + ], + "max_completion_tokens": 8192 }, { "name": "meta-llama/llama-4-maverick-17b-128e-instruct-original", "alias": [ - "meta-llama/Llama-4-Maverick-17B-128E-Instruct-Original", - "Llama-4-Maverick-17B-128E-Instruct-Original", - "llama-4-maverick-17b-128e-instruct-original" + "Llama-4-Maverick-17B-128E-Instruct-Original" ], "max_tokens": 1048576, "model_types": [ @@ -20392,45 +19643,44 @@ { "name": "meta-llama/llama-guard-4-12b", "alias": [ - "meta-llama/Llama-Guard-4-12B", "Llama-Guard-4-12B", - "llama-guard-4-12b" + "Llama Guard 4 12B" ], "max_tokens": 131072, "model_types": [ "moderation", "vision", - "image2text" + "image2text", + "chat", + "ocr" ] }, { "name": "meta-llama/llama-prompt-guard-2-86m", "alias": [ - "meta-llama/Llama-Prompt-Guard-2-86M", - "Llama-Prompt-Guard-2-86M", - "llama-prompt-guard-2-86m" + "Llama-Prompt-Guard-2-86M" ], "model_types": [ "moderation" - ] + ], + "max_tokens": 512, + "max_completion_tokens": 512 }, { "name": "meta-llama/llama-prompt-guard-2-22m", "alias": [ - "meta-llama/Llama-Prompt-Guard-2-22M", - "Llama-Prompt-Guard-2-22M", - "llama-prompt-guard-2-22m" + "Llama-Prompt-Guard-2-22M" ], "model_types": [ "moderation" - ] + ], + "max_tokens": 512, + "max_completion_tokens": 512 }, { "name": "meta-llama/llama-4-maverick-17b-128e", "alias": [ - "meta-llama/Llama-4-Maverick-17B-128E", - "Llama-4-Maverick-17B-128E", - "llama-4-maverick-17b-128e" + "Llama-4-Maverick-17B-128E" ], "max_tokens": 1048576, "model_types": [ @@ -20442,9 +19692,8 @@ { "name": "meta-llama/llama-4-scout-17b-16e", "alias": [ - "meta-llama/Llama-4-Scout-17B-16E", "Llama-4-Scout-17B-16E", - "llama-4-scout-17b-16e" + "Llama 4 Scout (17Bx16E)" ], "max_tokens": 10485760, "model_types": [ @@ -20456,9 +19705,7 @@ { "name": "meta-llama/llama-4-maverick-17b-128e-original", "alias": [ - "meta-llama/Llama-4-Maverick-17B-128E-Original", - "Llama-4-Maverick-17B-128E-Original", - "llama-4-maverick-17b-128e-original" + "Llama-4-Maverick-17B-128E-Original" ], "max_tokens": 1048576, "model_types": [ @@ -20470,9 +19717,7 @@ { "name": "meta-llama/llama-4-scout-17b-16e-original", "alias": [ - "meta-llama/Llama-4-Scout-17B-16E-Original", - "Llama-4-Scout-17B-16E-Original", - "llama-4-scout-17b-16e-original" + "Llama-4-Scout-17B-16E-Original" ], "max_tokens": 10485760, "model_types": [ @@ -20484,9 +19729,7 @@ { "name": "meta-llama/llama-4-maverick-17b-128e-instruct-fp8-original", "alias": [ - "meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8-Original", - "Llama-4-Maverick-17B-128E-Instruct-FP8-Original", - "llama-4-maverick-17b-128e-instruct-fp8-original" + "Llama-4-Maverick-17B-128E-Instruct-FP8-Original" ], "max_tokens": 1048576, "model_types": [ @@ -20498,9 +19741,7 @@ { "name": "meta-llama/llama-4-scout-17b-16e-instruct-original", "alias": [ - "meta-llama/Llama-4-Scout-17B-16E-Instruct-Original", - "Llama-4-Scout-17B-16E-Instruct-Original", - "llama-4-scout-17b-16e-instruct-original" + "Llama-4-Scout-17B-16E-Instruct-Original" ], "max_tokens": 10485760, "model_types": [ @@ -20512,9 +19753,8 @@ { "name": "meta-llama/llama-3.2-90b-vision-instruct", "alias": [ - "meta-llama/Llama-3.2-90B-Vision-Instruct", "Llama-3.2-90B-Vision-Instruct", - "llama-3.2-90b-vision-instruct" + "nim/meta/llama-3.2-90b-vision-instruct" ], "max_tokens": 131072, "model_types": [ @@ -20526,21 +19766,22 @@ { "name": "meta-llama/llama-3.3-70b-instruct", "alias": [ - "meta-llama/Llama-3.3-70B-Instruct", "Llama-3.3-70B-Instruct", - "llama-3.3-70b-instruct" + "Llama 3.3 70B Instruct", + "Meta Llama 3.3 70B Instruct", + "nim/meta/llama-3.3-70b-instruct" ], "max_tokens": 131072, "model_types": [ "chat" - ] + ], + "max_completion_tokens": 120000 }, { "name": "meta-llama/llama-3.1-70b-instruct", "alias": [ - "meta-llama/Llama-3.1-70B-Instruct", "Llama-3.1-70B-Instruct", - "llama-3.1-70b-instruct" + "nim/meta/llama-3.1-70b-instruct" ], "max_tokens": 131072, "model_types": [ @@ -20550,9 +19791,7 @@ { "name": "meta-llama/llama-3.1-405b-fp8", "alias": [ - "meta-llama/Llama-3.1-405B-FP8", - "Llama-3.1-405B-FP8", - "llama-3.1-405b-fp8" + "Llama-3.1-405B-FP8" ], "max_tokens": 131072, "model_types": [ @@ -20562,23 +19801,21 @@ { "name": "meta-llama/llama-3.2-11b-vision-instruct", "alias": [ - "meta-llama/Llama-3.2-11B-Vision-Instruct", "Llama-3.2-11B-Vision-Instruct", - "llama-3.2-11b-vision-instruct" + "nim/meta/llama-3.2-11b-vision-instruct" ], "max_tokens": 131072, "model_types": [ "chat", "vision", - "image2text" + "image2text", + "ocr" ] }, { "name": "meta-llama/llama-3.2-3b-instruct-qlora_int4_eo8", "alias": [ - "meta-llama/Llama-3.2-3B-Instruct-QLORA_INT4_EO8", - "Llama-3.2-3B-Instruct-QLORA_INT4_EO8", - "llama-3.2-3b-instruct-qlora_int4_eo8" + "Llama-3.2-3B-Instruct-QLORA_INT4_EO8" ], "max_tokens": 131072, "model_types": [ @@ -20588,9 +19825,7 @@ { "name": "meta-llama/llama-3.2-3b-instruct-spinquant_int4_eo8", "alias": [ - "meta-llama/Llama-3.2-3B-Instruct-SpinQuant_INT4_EO8", - "Llama-3.2-3B-Instruct-SpinQuant_INT4_EO8", - "llama-3.2-3b-instruct-spinquant_int4_eo8" + "Llama-3.2-3B-Instruct-SpinQuant_INT4_EO8" ], "max_tokens": 131072, "model_types": [ @@ -20600,9 +19835,7 @@ { "name": "meta-llama/llama-3.2-1b-instruct-spinquant_int4_eo8", "alias": [ - "meta-llama/Llama-3.2-1B-Instruct-SpinQuant_INT4_EO8", - "Llama-3.2-1B-Instruct-SpinQuant_INT4_EO8", - "llama-3.2-1b-instruct-spinquant_int4_eo8" + "Llama-3.2-1B-Instruct-SpinQuant_INT4_EO8" ], "max_tokens": 131072, "model_types": [ @@ -20612,9 +19845,7 @@ { "name": "meta-llama/llama-3.2-1b-instruct-qlora_int4_eo8", "alias": [ - "meta-llama/Llama-3.2-1B-Instruct-QLORA_INT4_EO8", - "Llama-3.2-1B-Instruct-QLORA_INT4_EO8", - "llama-3.2-1b-instruct-qlora_int4_eo8" + "Llama-3.2-1B-Instruct-QLORA_INT4_EO8" ], "max_tokens": 131072, "model_types": [ @@ -20624,9 +19855,7 @@ { "name": "meta-llama/llama-guard-3-11b-vision", "alias": [ - "meta-llama/Llama-Guard-3-11B-Vision", - "Llama-Guard-3-11B-Vision", - "llama-guard-3-11b-vision" + "Llama-Guard-3-11B-Vision" ], "max_tokens": 131072, "model_types": [ @@ -20638,9 +19867,8 @@ { "name": "meta-llama/llama-3.2-1b", "alias": [ - "meta-llama/Llama-3.2-1B", "Llama-3.2-1B", - "llama-3.2-1b" + "Llama 3.2 1B" ], "max_tokens": 131072, "model_types": [ @@ -20650,21 +19878,21 @@ { "name": "meta-llama/llama-3.2-1b-instruct", "alias": [ - "meta-llama/Llama-3.2-1B-Instruct", "Llama-3.2-1B-Instruct", - "llama-3.2-1b-instruct" + "Llama 3.2 1B Instruct", + "Meta Llama 3.2 1B Instruct" ], "max_tokens": 131072, "model_types": [ "chat" - ] + ], + "max_completion_tokens": 32000 }, { "name": "meta-llama/llama-3.2-3b", "alias": [ - "meta-llama/Llama-3.2-3B", "Llama-3.2-3B", - "llama-3.2-3b" + "Meta Llama 3.2 3B" ], "max_tokens": 131072, "model_types": [ @@ -20674,21 +19902,20 @@ { "name": "meta-llama/llama-3.2-3b-instruct", "alias": [ - "meta-llama/Llama-3.2-3B-Instruct", "Llama-3.2-3B-Instruct", - "llama-3.2-3b-instruct" + "Llama 3.2 3B Instruct", + "Meta Llama 3.2 3B Instruct" ], "max_tokens": 131072, "model_types": [ "chat" - ] + ], + "max_completion_tokens": 32000 }, { "name": "meta-llama/llama-3.1-8b", "alias": [ - "meta-llama/Llama-3.1-8B", - "Llama-3.1-8B", - "llama-3.1-8b" + "Llama-3.1-8B" ], "max_tokens": 131072, "model_types": [ @@ -20698,21 +19925,18 @@ { "name": "meta-llama/llama-guard-3-8b", "alias": [ - "meta-llama/Llama-Guard-3-8B", - "Llama-Guard-3-8B", - "llama-guard-3-8b" + "Llama-Guard-3-8B" ], "max_tokens": 131072, "model_types": [ - "moderation" + "moderation", + "chat" ] }, { "name": "meta-llama/meta-llama-3-70b", "alias": [ - "meta-llama/Meta-Llama-3-70B", - "Meta-Llama-3-70B", - "meta-llama-3-70b" + "Meta-Llama-3-70B" ], "max_tokens": 8192, "model_types": [ @@ -20722,9 +19946,7 @@ { "name": "meta-llama/meta-llama-3-8b", "alias": [ - "meta-llama/Meta-Llama-3-8B", - "Meta-Llama-3-8B", - "meta-llama-3-8b" + "Meta-Llama-3-8B" ], "max_tokens": 8192, "model_types": [ @@ -20734,9 +19956,7 @@ { "name": "meta-llama/llama-3.2-90b-vision", "alias": [ - "meta-llama/Llama-3.2-90B-Vision", - "Llama-3.2-90B-Vision", - "llama-3.2-90b-vision" + "Llama-3.2-90B-Vision" ], "max_tokens": 131072, "model_types": [ @@ -20748,9 +19968,7 @@ { "name": "meta-llama/llama-3.2-11b-vision", "alias": [ - "meta-llama/Llama-3.2-11B-Vision", - "Llama-3.2-11B-Vision", - "llama-3.2-11b-vision" + "Llama-3.2-11B-Vision" ], "max_tokens": 131072, "model_types": [ @@ -20762,9 +19980,7 @@ { "name": "meta-llama/llama-guard-3-1b", "alias": [ - "meta-llama/Llama-Guard-3-1B", - "Llama-Guard-3-1B", - "llama-guard-3-1b" + "Llama-Guard-3-1B" ], "max_tokens": 131072, "model_types": [ @@ -20774,9 +19990,7 @@ { "name": "meta-llama/llama-guard-3-1b-int4", "alias": [ - "meta-llama/Llama-Guard-3-1B-INT4", - "Llama-Guard-3-1B-INT4", - "llama-guard-3-1b-int4" + "Llama-Guard-3-1B-INT4" ], "max_tokens": 131072, "model_types": [ @@ -20786,9 +20000,7 @@ { "name": "meta-llama/llama-3.1-405b-instruct-fp8", "alias": [ - "meta-llama/Llama-3.1-405B-Instruct-FP8", - "Llama-3.1-405B-Instruct-FP8", - "llama-3.1-405b-instruct-fp8" + "Llama-3.1-405B-Instruct-FP8" ], "max_tokens": 131072, "model_types": [ @@ -20798,9 +20010,8 @@ { "name": "meta-llama/llama-3.1-405b-instruct", "alias": [ - "meta-llama/Llama-3.1-405B-Instruct", "Llama-3.1-405B-Instruct", - "llama-3.1-405b-instruct" + "Meta Llama 3.1 405B Instruct" ], "max_tokens": 131072, "model_types": [ @@ -20810,9 +20021,8 @@ { "name": "meta-llama/llama-3.1-405b", "alias": [ - "meta-llama/Llama-3.1-405B", "Llama-3.1-405B", - "llama-3.1-405b" + "Llama 3.1 405B" ], "max_tokens": 131072, "model_types": [ @@ -20822,9 +20032,7 @@ { "name": "meta-llama/llama-3.1-70b", "alias": [ - "meta-llama/Llama-3.1-70B", - "Llama-3.1-70B", - "llama-3.1-70b" + "Llama-3.1-70B" ], "max_tokens": 131072, "model_types": [ @@ -20834,21 +20042,20 @@ { "name": "meta-llama/llama-3.1-8b-instruct", "alias": [ - "meta-llama/Llama-3.1-8B-Instruct", "Llama-3.1-8B-Instruct", - "llama-3.1-8b-instruct" + "Llama 3.1 8B Instruct", + "nim/meta/llama-3.1-8b-instruct" ], "max_tokens": 131072, "model_types": [ "chat" - ] + ], + "max_completion_tokens": 16384 }, { "name": "meta-llama/llama-guard-3-8b-int8", "alias": [ - "meta-llama/Llama-Guard-3-8B-INT8", - "Llama-Guard-3-8B-INT8", - "llama-guard-3-8b-int8" + "Llama-Guard-3-8B-INT8" ], "max_tokens": 131072, "model_types": [ @@ -20858,9 +20065,7 @@ { "name": "meta-llama/meta-llama-guard-2-8b", "alias": [ - "meta-llama/Meta-Llama-Guard-2-8B", - "Meta-Llama-Guard-2-8B", - "meta-llama-guard-2-8b" + "Meta-Llama-Guard-2-8B" ], "max_tokens": 4096, "model_types": [ @@ -20870,9 +20075,7 @@ { "name": "meta-llama/llamaguard-7b", "alias": [ - "meta-llama/LlamaGuard-7b", - "LlamaGuard-7b", - "llamaguard-7b" + "LlamaGuard-7b" ], "max_tokens": 4096, "model_types": [ @@ -20882,9 +20085,7 @@ { "name": "meta-llama/llama-2-70b-chat-hf", "alias": [ - "meta-llama/Llama-2-70b-chat-hf", - "Llama-2-70b-chat-hf", - "llama-2-70b-chat-hf" + "Llama-2-70b-chat-hf" ], "max_tokens": 4096, "model_types": [ @@ -20894,9 +20095,7 @@ { "name": "meta-llama/llama-2-13b-chat-hf", "alias": [ - "meta-llama/Llama-2-13b-chat-hf", - "Llama-2-13b-chat-hf", - "llama-2-13b-chat-hf" + "Llama-2-13b-chat-hf" ], "max_tokens": 4096, "model_types": [ @@ -20906,9 +20105,7 @@ { "name": "meta-llama/llama-2-7b-chat-hf", "alias": [ - "meta-llama/Llama-2-7b-chat-hf", - "Llama-2-7b-chat-hf", - "llama-2-7b-chat-hf" + "Llama-2-7b-chat-hf" ], "max_tokens": 4096, "model_types": [ @@ -20918,9 +20115,7 @@ { "name": "meta-llama/llama-2-70b-hf", "alias": [ - "meta-llama/Llama-2-70b-hf", - "Llama-2-70b-hf", - "llama-2-70b-hf" + "Llama-2-70b-hf" ], "max_tokens": 4096, "model_types": [ @@ -20930,9 +20125,7 @@ { "name": "meta-llama/llama-2-13b-hf", "alias": [ - "meta-llama/Llama-2-13b-hf", - "Llama-2-13b-hf", - "llama-2-13b-hf" + "Llama-2-13b-hf" ], "max_tokens": 4096, "model_types": [ @@ -20942,9 +20135,7 @@ { "name": "meta-llama/llama-2-7b-hf", "alias": [ - "meta-llama/Llama-2-7b-hf", - "Llama-2-7b-hf", - "llama-2-7b-hf" + "Llama-2-7b-hf" ], "max_tokens": 4096, "model_types": [ @@ -20954,9 +20145,7 @@ { "name": "meta-llama/llama-2-70b-chat", "alias": [ - "meta-llama/Llama-2-70b-chat", - "Llama-2-70b-chat", - "llama-2-70b-chat" + "Llama-2-70b-chat" ], "max_tokens": 4096, "model_types": [ @@ -20966,9 +20155,7 @@ { "name": "meta-llama/llama-2-13b-chat", "alias": [ - "meta-llama/Llama-2-13b-chat", - "Llama-2-13b-chat", - "llama-2-13b-chat" + "Llama-2-13b-chat" ], "max_tokens": 4096, "model_types": [ @@ -20978,9 +20165,7 @@ { "name": "meta-llama/llama-2-7b-chat", "alias": [ - "meta-llama/Llama-2-7b-chat", - "Llama-2-7b-chat", - "llama-2-7b-chat" + "Llama-2-7b-chat" ], "max_tokens": 4096, "model_types": [ @@ -20990,9 +20175,7 @@ { "name": "meta-llama/llama-2-70b", "alias": [ - "meta-llama/Llama-2-70b", - "Llama-2-70b", - "llama-2-70b" + "Llama-2-70b" ], "max_tokens": 4096, "model_types": [ @@ -21002,9 +20185,7 @@ { "name": "meta-llama/llama-2-13b", "alias": [ - "meta-llama/Llama-2-13b", - "Llama-2-13b", - "llama-2-13b" + "Llama-2-13b" ], "max_tokens": 4096, "model_types": [ @@ -21014,9 +20195,7 @@ { "name": "meta-llama/llama-2-7b", "alias": [ - "meta-llama/Llama-2-7b", - "Llama-2-7b", - "llama-2-7b" + "Llama-2-7b" ], "max_tokens": 4096, "model_types": [ @@ -21026,9 +20205,7 @@ { "name": "meta-llama/codellama-70b-instruct-hf", "alias": [ - "meta-llama/CodeLlama-70b-Instruct-hf", - "CodeLlama-70b-Instruct-hf", - "codellama-70b-instruct-hf" + "CodeLlama-70b-Instruct-hf" ], "max_tokens": 16384, "model_types": [ @@ -21038,9 +20215,7 @@ { "name": "meta-llama/codellama-70b-python-hf", "alias": [ - "meta-llama/CodeLlama-70b-Python-hf", - "CodeLlama-70b-Python-hf", - "codellama-70b-python-hf" + "CodeLlama-70b-Python-hf" ], "max_tokens": 16384, "model_types": [ @@ -21050,9 +20225,7 @@ { "name": "meta-llama/codellama-70b-hf", "alias": [ - "meta-llama/CodeLlama-70b-hf", - "CodeLlama-70b-hf", - "codellama-70b-hf" + "CodeLlama-70b-hf" ], "max_tokens": 16384, "model_types": [ @@ -21062,9 +20235,7 @@ { "name": "meta-llama/codellama-34b-instruct-hf", "alias": [ - "meta-llama/CodeLlama-34b-Instruct-hf", - "CodeLlama-34b-Instruct-hf", - "codellama-34b-instruct-hf" + "CodeLlama-34b-Instruct-hf" ], "max_tokens": 16384, "model_types": [ @@ -21074,9 +20245,7 @@ { "name": "meta-llama/codellama-34b-python-hf", "alias": [ - "meta-llama/CodeLlama-34b-Python-hf", - "CodeLlama-34b-Python-hf", - "codellama-34b-python-hf" + "CodeLlama-34b-Python-hf" ], "max_tokens": 16384, "model_types": [ @@ -21086,9 +20255,7 @@ { "name": "meta-llama/codellama-34b-hf", "alias": [ - "meta-llama/CodeLlama-34b-hf", - "CodeLlama-34b-hf", - "codellama-34b-hf" + "CodeLlama-34b-hf" ], "max_tokens": 16384, "model_types": [ @@ -21098,9 +20265,7 @@ { "name": "meta-llama/codellama-13b-instruct-hf", "alias": [ - "meta-llama/CodeLlama-13b-Instruct-hf", - "CodeLlama-13b-Instruct-hf", - "codellama-13b-instruct-hf" + "CodeLlama-13b-Instruct-hf" ], "max_tokens": 16384, "model_types": [ @@ -21110,9 +20275,7 @@ { "name": "meta-llama/codellama-13b-python-hf", "alias": [ - "meta-llama/CodeLlama-13b-Python-hf", - "CodeLlama-13b-Python-hf", - "codellama-13b-python-hf" + "CodeLlama-13b-Python-hf" ], "max_tokens": 16384, "model_types": [ @@ -21122,9 +20285,7 @@ { "name": "meta-llama/codellama-13b-hf", "alias": [ - "meta-llama/CodeLlama-13b-hf", - "CodeLlama-13b-hf", - "codellama-13b-hf" + "CodeLlama-13b-hf" ], "max_tokens": 16384, "model_types": [ @@ -21134,9 +20295,7 @@ { "name": "meta-llama/codellama-7b-instruct-hf", "alias": [ - "meta-llama/CodeLlama-7b-Instruct-hf", - "CodeLlama-7b-Instruct-hf", - "codellama-7b-instruct-hf" + "CodeLlama-7b-Instruct-hf" ], "max_tokens": 16384, "model_types": [ @@ -21146,9 +20305,7 @@ { "name": "meta-llama/codellama-7b-python-hf", "alias": [ - "meta-llama/CodeLlama-7b-Python-hf", - "CodeLlama-7b-Python-hf", - "codellama-7b-python-hf" + "CodeLlama-7b-Python-hf" ], "max_tokens": 16384, "model_types": [ @@ -21158,9 +20315,7 @@ { "name": "meta-llama/codellama-7b-hf", "alias": [ - "meta-llama/CodeLlama-7b-hf", - "CodeLlama-7b-hf", - "codellama-7b-hf" + "CodeLlama-7b-hf" ], "max_tokens": 16384, "model_types": [ @@ -21170,9 +20325,7 @@ { "name": "nvidia/nemotron-3-content-safety", "alias": [ - "nvidia/Nemotron-3-Content-Safety", - "Nemotron-3-Content-Safety", - "nemotron-3-content-safety" + "Nemotron-3-Content-Safety" ], "model_types": [ "moderation", @@ -21192,9 +20345,7 @@ { "name": "nvidia/kimi-k2.6-eagle3", "alias": [ - "nvidia/Kimi-K2.6-Eagle3", - "Kimi-K2.6-Eagle3", - "kimi-k2.6-eagle3" + "Kimi-K2.6-Eagle3" ], "max_tokens": 262144, "model_types": [ @@ -21204,9 +20355,7 @@ { "name": "nvidia/kimi-k2.5-thinking-eagle3", "alias": [ - "nvidia/Kimi-K2.5-Thinking-Eagle3", - "Kimi-K2.5-Thinking-Eagle3", - "kimi-k2.5-thinking-eagle3" + "Kimi-K2.5-Thinking-Eagle3" ], "max_tokens": 262144, "model_types": [ @@ -21220,9 +20369,7 @@ { "name": "nvidia/diffusiongemma-26b-a4b-it-nvfp4", "alias": [ - "nvidia/diffusiongemma-26B-A4B-it-NVFP4", - "diffusiongemma-26B-A4B-it-NVFP4", - "diffusiongemma-26b-a4b-it-nvfp4" + "diffusiongemma-26B-A4B-it-NVFP4" ], "max_tokens": 131072, "model_types": [ @@ -21232,9 +20379,7 @@ { "name": "nvidia/deepseek-v4-flash-nvfp4", "alias": [ - "nvidia/DeepSeek-V4-Flash-NVFP4", - "DeepSeek-V4-Flash-NVFP4", - "deepseek-v4-flash-nvfp4" + "DeepSeek-V4-Flash-NVFP4" ], "max_tokens": 1048576, "model_types": [ @@ -21248,9 +20393,7 @@ { "name": "nvidia/nv-kermt-70m-v2", "alias": [ - "nvidia/NV-KERMT-70M-v2", - "NV-KERMT-70M-v2", - "nv-kermt-70m-v2" + "NV-KERMT-70M-v2" ], "model_types": [ "other" @@ -21259,9 +20402,7 @@ { "name": "nvidia/nvidia-nemotron-3-ultra-550b-a55b-nvfp4", "alias": [ - "nvidia/NVIDIA-Nemotron-3-Ultra-550B-A55B-NVFP4", - "NVIDIA-Nemotron-3-Ultra-550B-A55B-NVFP4", - "nvidia-nemotron-3-ultra-550b-a55b-nvfp4" + "NVIDIA-Nemotron-3-Ultra-550B-A55B-NVFP4" ], "max_tokens": 262144, "model_types": [ @@ -21271,13 +20412,13 @@ { "name": "nvidia/nvidia-nemotron-3-ultra-550b-a55b-bf16", "alias": [ - "nvidia/NVIDIA-Nemotron-3-Ultra-550B-A55B-BF16", - "NVIDIA-Nemotron-3-Ultra-550B-A55B-BF16", - "nvidia-nemotron-3-ultra-550b-a55b-bf16" + "NVIDIA-Nemotron-3-Ultra-550B-A55B-BF16" ], "max_tokens": 262144, "model_types": [ - "chat" + "chat", + "image2text", + "vision" ] }, { @@ -21311,9 +20452,7 @@ { "name": "nvidia/locateanything-3b", "alias": [ - "nvidia/LocateAnything-3B", - "LocateAnything-3B", - "locateanything-3b" + "LocateAnything-3B" ], "model_types": [ "chat", @@ -21324,22 +20463,24 @@ { "name": "nvidia/cosmos3-super", "alias": [ - "nvidia/Cosmos3-Super", - "Cosmos3-Super", - "cosmos3-super" + "Cosmos3-Super" ], "model_types": [ - "other" + "other", + "video_generation" ] }, { "name": "nvidia/nemotron-3.5-asr-streaming-0.6b", "alias": [ - "nemotron-3.5-asr-streaming-0.6b" + "nemotron-3.5-asr-streaming-0.6b", + "Nvidia Nemotron 3.5 ASR Streaming 0.6B" ], "model_types": [ - "asr" - ] + "asr", + "speech2text" + ], + "max_tokens": 448 }, { "name": "nvidia/omni-dreams-models", @@ -21353,9 +20494,7 @@ { "name": "nvidia/deepseek-v4-pro-nvfp4", "alias": [ - "nvidia/DeepSeek-V4-Pro-NVFP4", - "DeepSeek-V4-Pro-NVFP4", - "deepseek-v4-pro-nvfp4" + "DeepSeek-V4-Pro-NVFP4" ], "max_tokens": 1048576, "model_types": [ @@ -21369,9 +20508,7 @@ { "name": "nvidia/nvidia-nemotron-3-ultra-550b-a55b-genrm", "alias": [ - "nvidia/NVIDIA-Nemotron-3-Ultra-550B-A55B-GenRM", - "NVIDIA-Nemotron-3-Ultra-550B-A55B-GenRM", - "nvidia-nemotron-3-ultra-550b-a55b-genrm" + "NVIDIA-Nemotron-3-Ultra-550B-A55B-GenRM" ], "max_tokens": 262144, "model_types": [ @@ -21385,9 +20522,7 @@ { "name": "nvidia/nvidia-nemotron-3-ultra-550b-a55b-base-bf16", "alias": [ - "nvidia/NVIDIA-Nemotron-3-Ultra-550B-A55B-Base-BF16", - "NVIDIA-Nemotron-3-Ultra-550B-A55B-Base-BF16", - "nvidia-nemotron-3-ultra-550b-a55b-base-bf16" + "NVIDIA-Nemotron-3-Ultra-550B-A55B-Base-BF16" ], "max_tokens": 262144, "model_types": [ @@ -21397,9 +20532,7 @@ { "name": "nvidia/artifixer", "alias": [ - "nvidia/ArtiFixer", - "ArtiFixer", - "artifixer" + "ArtiFixer" ], "model_types": [ "other" @@ -21408,9 +20541,7 @@ { "name": "nvidia/nemotron-3.5-content-safety", "alias": [ - "nvidia/Nemotron-3.5-Content-Safety", - "Nemotron-3.5-Content-Safety", - "nemotron-3.5-content-safety" + "Nemotron-3.5-Content-Safety" ], "model_types": [ "moderation", @@ -21420,9 +20551,7 @@ { "name": "nvidia/nemotron-labs-diffusion-vlm-8b", "alias": [ - "nvidia/Nemotron-Labs-Diffusion-VLM-8B", - "Nemotron-Labs-Diffusion-VLM-8B", - "nemotron-labs-diffusion-vlm-8b" + "Nemotron-Labs-Diffusion-VLM-8B" ], "max_tokens": 262144, "model_types": [ @@ -21434,9 +20563,7 @@ { "name": "nvidia/nemotron-labs-diffusion-3b-base", "alias": [ - "nvidia/Nemotron-Labs-Diffusion-3B-Base", - "Nemotron-Labs-Diffusion-3B-Base", - "nemotron-labs-diffusion-3b-base" + "Nemotron-Labs-Diffusion-3B-Base" ], "max_tokens": 262144, "model_types": [ @@ -21446,9 +20573,7 @@ { "name": "nvidia/nemotron-labs-diffusion-8b-base", "alias": [ - "nvidia/Nemotron-Labs-Diffusion-8B-Base", - "Nemotron-Labs-Diffusion-8B-Base", - "nemotron-labs-diffusion-8b-base" + "Nemotron-Labs-Diffusion-8B-Base" ], "max_tokens": 262144, "model_types": [ @@ -21458,9 +20583,7 @@ { "name": "nvidia/nemotron-labs-diffusion-14b-base", "alias": [ - "nvidia/Nemotron-Labs-Diffusion-14B-Base", - "Nemotron-Labs-Diffusion-14B-Base", - "nemotron-labs-diffusion-14b-base" + "Nemotron-Labs-Diffusion-14B-Base" ], "max_tokens": 262144, "model_types": [ @@ -21470,9 +20593,7 @@ { "name": "nvidia/nemotron-labs-diffusion-14b", "alias": [ - "nvidia/Nemotron-Labs-Diffusion-14B", - "Nemotron-Labs-Diffusion-14B", - "nemotron-labs-diffusion-14b" + "Nemotron-Labs-Diffusion-14B" ], "max_tokens": 262144, "model_types": [ @@ -21482,9 +20603,7 @@ { "name": "nvidia/nemotron-labs-diffusion-3b", "alias": [ - "nvidia/Nemotron-Labs-Diffusion-3B", - "Nemotron-Labs-Diffusion-3B", - "nemotron-labs-diffusion-3b" + "Nemotron-Labs-Diffusion-3B" ], "max_tokens": 262144, "model_types": [ @@ -21494,9 +20613,7 @@ { "name": "nvidia/nemotron-labs-diffusion-8b", "alias": [ - "nvidia/Nemotron-Labs-Diffusion-8B", - "Nemotron-Labs-Diffusion-8B", - "nemotron-labs-diffusion-8b" + "Nemotron-Labs-Diffusion-8B" ], "max_tokens": 262144, "model_types": [ @@ -21511,14 +20628,14 @@ "model_types": [ "embedding", "vision" - ] + ], + "max_tokens": 10240, + "max_dimension": 2048 }, { "name": "nvidia/qwen3.5-122b-a10b-nvfp4", "alias": [ - "nvidia/Qwen3.5-122B-A10B-NVFP4", - "Qwen3.5-122B-A10B-NVFP4", - "qwen3.5-122b-a10b-nvfp4" + "Qwen3.5-122B-A10B-NVFP4" ], "max_tokens": 262144, "model_types": [ @@ -21538,9 +20655,7 @@ { "name": "nvidia/gr00t-h", "alias": [ - "nvidia/GR00T-H", - "GR00T-H", - "gr00t-h" + "GR00T-H" ], "model_types": [ "other" @@ -21549,11 +20664,14 @@ { "name": "nvidia/parakeet-tdt-0.6b-v3", "alias": [ - "parakeet-tdt-0.6b-v3" + "parakeet-tdt-0.6b-v3", + "Nvidia Parakeet TDT 0.6B V3" ], "model_types": [ - "asr" - ] + "asr", + "speech2text" + ], + "max_tokens": 448 }, { "name": "nvidia/llama-nemotron-embed-1b-v2", @@ -21580,7 +20698,8 @@ ], "model_types": [ "rerank" - ] + ], + "max_tokens": 10240 }, { "name": "nvidia/llama-nv-embed-reasoning-3b", @@ -21604,9 +20723,7 @@ { "name": "nvidia/wan2.2-t2v-a14b-diffusers-fp8", "alias": [ - "nvidia/Wan2.2-T2V-A14B-Diffusers-FP8", - "Wan2.2-T2V-A14B-Diffusers-FP8", - "wan2.2-t2v-a14b-diffusers-fp8" + "Wan2.2-T2V-A14B-Diffusers-FP8" ], "model_types": [ "other" @@ -21615,9 +20732,7 @@ { "name": "nvidia/wan2.2-t2v-a14b-diffusers-nvfp4", "alias": [ - "nvidia/Wan2.2-T2V-A14B-Diffusers-NVFP4", - "Wan2.2-T2V-A14B-Diffusers-NVFP4", - "wan2.2-t2v-a14b-diffusers-nvfp4" + "Wan2.2-T2V-A14B-Diffusers-NVFP4" ], "model_types": [ "other" @@ -21626,9 +20741,7 @@ { "name": "nvidia/cosmos-embed1-448p-anomaly-detection", "alias": [ - "nvidia/Cosmos-Embed1-448p-anomaly-detection", - "Cosmos-Embed1-448p-anomaly-detection", - "cosmos-embed1-448p-anomaly-detection" + "Cosmos-Embed1-448p-anomaly-detection" ], "model_types": [ "embedding", @@ -21638,9 +20751,7 @@ { "name": "nvidia/kimi-k2.6-nvfp4", "alias": [ - "nvidia/Kimi-K2.6-NVFP4", - "Kimi-K2.6-NVFP4", - "kimi-k2.6-nvfp4" + "Kimi-K2.6-NVFP4" ], "max_tokens": 262144, "model_types": [ @@ -21650,9 +20761,7 @@ { "name": "nvidia/re-use", "alias": [ - "nvidia/RE-USE", - "RE-USE", - "re-use" + "RE-USE" ], "model_types": [ "audio", @@ -21663,9 +20772,7 @@ { "name": "nvidia/kimi-k2.5-nvfp4", "alias": [ - "nvidia/Kimi-K2.5-NVFP4", - "Kimi-K2.5-NVFP4", - "kimi-k2.5-nvfp4" + "Kimi-K2.5-NVFP4" ], "max_tokens": 262144, "model_types": [ @@ -21718,9 +20825,7 @@ { "name": "nvidia/lyra-2.0", "alias": [ - "nvidia/Lyra-2.0", - "Lyra-2.0", - "lyra-2.0" + "Lyra-2.0" ], "model_types": [ "3d_generation" @@ -21729,9 +20834,7 @@ { "name": "nvidia/gemma-4-26b-a4b-nvfp4", "alias": [ - "nvidia/Gemma-4-26B-A4B-NVFP4", - "Gemma-4-26B-A4B-NVFP4", - "gemma-4-26b-a4b-nvfp4" + "Gemma-4-26B-A4B-NVFP4" ], "max_tokens": 131072, "model_types": [ @@ -21741,9 +20844,7 @@ { "name": "nvidia/pointworld_models", "alias": [ - "nvidia/PointWorld_models", - "PointWorld_models", - "pointworld_models" + "PointWorld_models" ], "model_types": [ "other" @@ -21752,9 +20853,7 @@ { "name": "nvidia/nemotron-elastic-12b", "alias": [ - "nvidia/Nemotron-Elastic-12B", - "Nemotron-Elastic-12B", - "nemotron-elastic-12b" + "Nemotron-Elastic-12B" ], "max_tokens": 262144, "model_types": [ @@ -21764,9 +20863,7 @@ { "name": "nvidia/nemotron-3-nano-omni-30b-a3b-reasoning-bf16", "alias": [ - "nvidia/Nemotron-3-Nano-Omni-30B-A3B-Reasoning-BF16", - "Nemotron-3-Nano-Omni-30B-A3B-Reasoning-BF16", - "nemotron-3-nano-omni-30b-a3b-reasoning-bf16" + "Nemotron-3-Nano-Omni-30B-A3B-Reasoning-BF16" ], "max_tokens": 262144, "model_types": [ @@ -21780,9 +20877,7 @@ { "name": "nvidia/gpt-oss-120b-eagle3-v3", "alias": [ - "nvidia/gpt-oss-120b-Eagle3-v3", - "gpt-oss-120b-Eagle3-v3", - "gpt-oss-120b-eagle3-v3" + "gpt-oss-120b-Eagle3-v3" ], "max_tokens": 131072, "model_types": [ @@ -21792,9 +20887,7 @@ { "name": "nvidia/nvidia-nemotron-labs-3-elastic-30b-a3b-nvfp4", "alias": [ - "nvidia/NVIDIA-Nemotron-Labs-3-Elastic-30B-A3B-NVFP4", - "NVIDIA-Nemotron-Labs-3-Elastic-30B-A3B-NVFP4", - "nvidia-nemotron-labs-3-elastic-30b-a3b-nvfp4" + "NVIDIA-Nemotron-Labs-3-Elastic-30B-A3B-NVFP4" ], "max_tokens": 262144, "model_types": [ @@ -21804,9 +20897,7 @@ { "name": "nvidia/nvidia-nemotron-labs-3-elastic-30b-a3b-fp8", "alias": [ - "nvidia/NVIDIA-Nemotron-Labs-3-Elastic-30B-A3B-FP8", - "NVIDIA-Nemotron-Labs-3-Elastic-30B-A3B-FP8", - "nvidia-nemotron-labs-3-elastic-30b-a3b-fp8" + "NVIDIA-Nemotron-Labs-3-Elastic-30B-A3B-FP8" ], "max_tokens": 262144, "model_types": [ @@ -21816,9 +20907,7 @@ { "name": "nvidia/nvidia-nemotron-labs-3-elastic-30b-a3b-bf16", "alias": [ - "nvidia/NVIDIA-Nemotron-Labs-3-Elastic-30B-A3B-BF16", - "NVIDIA-Nemotron-Labs-3-Elastic-30B-A3B-BF16", - "nvidia-nemotron-labs-3-elastic-30b-a3b-bf16" + "NVIDIA-Nemotron-Labs-3-Elastic-30B-A3B-BF16" ], "max_tokens": 262144, "model_types": [ @@ -21828,9 +20917,7 @@ { "name": "nvidia/gemma-4-31b-it-nvfp4", "alias": [ - "nvidia/Gemma-4-31B-IT-NVFP4", - "Gemma-4-31B-IT-NVFP4", - "gemma-4-31b-it-nvfp4" + "Gemma-4-31B-IT-NVFP4" ], "max_tokens": 131072, "model_types": [ @@ -21867,9 +20954,7 @@ { "name": "nvidia/nv-raw2insights-mri", "alias": [ - "nvidia/NV-Raw2insights-MRI", - "NV-Raw2insights-MRI", - "nv-raw2insights-mri" + "NV-Raw2insights-MRI" ], "model_types": [ "other" @@ -21887,9 +20972,7 @@ { "name": "nvidia/nvidia-nemotron-nano-9b-v2-japanese", "alias": [ - "nvidia/NVIDIA-Nemotron-Nano-9B-v2-Japanese", - "NVIDIA-Nemotron-Nano-9B-v2-Japanese", - "nvidia-nemotron-nano-9b-v2-japanese" + "NVIDIA-Nemotron-Nano-9B-v2-Japanese" ], "max_tokens": 262144, "model_types": [ @@ -21899,9 +20982,7 @@ { "name": "nvidia/gr00t-n1.7-libero", "alias": [ - "nvidia/GR00T-N1.7-LIBERO", - "GR00T-N1.7-LIBERO", - "gr00t-n1.7-libero" + "GR00T-N1.7-LIBERO" ], "model_types": [ "other" @@ -21910,9 +20991,7 @@ { "name": "nvidia/gr00t-n1.7-droid", "alias": [ - "nvidia/GR00T-N1.7-DROID", - "GR00T-N1.7-DROID", - "gr00t-n1.7-droid" + "GR00T-N1.7-DROID" ], "model_types": [ "other" @@ -21921,9 +21000,7 @@ { "name": "nvidia/gr00t-n1.7-simplerenv-fractal", "alias": [ - "nvidia/GR00T-N1.7-SimplerEnv-Fractal", - "GR00T-N1.7-SimplerEnv-Fractal", - "gr00t-n1.7-simplerenv-fractal" + "GR00T-N1.7-SimplerEnv-Fractal" ], "model_types": [ "other" @@ -21932,9 +21009,7 @@ { "name": "nvidia/gr00t-n1.7-simplerenv-bridge", "alias": [ - "nvidia/GR00T-N1.7-SimplerEnv-Bridge", - "GR00T-N1.7-SimplerEnv-Bridge", - "gr00t-n1.7-simplerenv-bridge" + "GR00T-N1.7-SimplerEnv-Bridge" ], "model_types": [ "other" @@ -21943,9 +21018,7 @@ { "name": "nvidia/gn1x-tuned-arena-g1-loco-manipulation", "alias": [ - "nvidia/GN1x-Tuned-Arena-G1-Loco-Manipulation", - "GN1x-Tuned-Arena-G1-Loco-Manipulation", - "gn1x-tuned-arena-g1-loco-manipulation" + "GN1x-Tuned-Arena-G1-Loco-Manipulation" ], "model_types": [ "robotics" @@ -21954,9 +21027,7 @@ { "name": "nvidia/minimax-m2.5-nvfp4", "alias": [ - "nvidia/MiniMax-M2.5-NVFP4", - "MiniMax-M2.5-NVFP4", - "minimax-m2.5-nvfp4" + "MiniMax-M2.5-NVFP4" ], "max_tokens": 1000000, "model_types": [ @@ -21966,9 +21037,7 @@ { "name": "nvidia/cosmos-h-surgical-simulator", "alias": [ - "nvidia/Cosmos-H-Surgical-Simulator", - "Cosmos-H-Surgical-Simulator", - "cosmos-h-surgical-simulator" + "Cosmos-H-Surgical-Simulator" ], "model_types": [ "other" @@ -21977,9 +21046,7 @@ { "name": "nvidia/pixeldit-imagenet", "alias": [ - "nvidia/PixelDiT-ImageNet", - "PixelDiT-ImageNet", - "pixeldit-imagenet" + "PixelDiT-ImageNet" ], "model_types": [ "image" @@ -21988,9 +21055,7 @@ { "name": "nvidia/pixeldit-1300m-1024px", "alias": [ - "nvidia/PixelDiT-1300M-1024px", - "PixelDiT-1300M-1024px", - "pixeldit-1300m-1024px" + "PixelDiT-1300M-1024px" ], "model_types": [ "image" @@ -21999,9 +21064,7 @@ { "name": "nvidia/ising-calibration-1-35b-a3b", "alias": [ - "nvidia/Ising-Calibration-1-35B-A3B", - "Ising-Calibration-1-35B-A3B", - "ising-calibration-1-35b-a3b" + "Ising-Calibration-1-35B-A3B" ], "model_types": [ "other" @@ -22010,9 +21073,7 @@ { "name": "nvidia/cosmos-h-surgical", "alias": [ - "nvidia/Cosmos-H-Surgical", - "Cosmos-H-Surgical", - "cosmos-h-surgical" + "Cosmos-H-Surgical" ], "model_types": [ "other" @@ -22021,9 +21082,7 @@ { "name": "nvidia/nvidia-nemotron-parse-v1.1-tc", "alias": [ - "nvidia/NVIDIA-Nemotron-Parse-v1.1-TC", - "NVIDIA-Nemotron-Parse-v1.1-TC", - "nvidia-nemotron-parse-v1.1-tc" + "NVIDIA-Nemotron-Parse-v1.1-TC" ], "max_tokens": 262144, "model_types": [ @@ -22035,9 +21094,7 @@ { "name": "nvidia/gn1x-tuned-arena-gr1-manipulation", "alias": [ - "nvidia/GN1x-Tuned-Arena-GR1-Manipulation", - "GN1x-Tuned-Arena-GR1-Manipulation", - "gn1x-tuned-arena-gr1-manipulation" + "GN1x-Tuned-Arena-GR1-Manipulation" ], "model_types": [ "robotics" @@ -22046,9 +21103,7 @@ { "name": "nvidia/gn1.6-tuned-arena-gr1-placeitemclosedoor-task", "alias": [ - "nvidia/GN1.6-Tuned-Arena-GR1-PlaceItemCloseDoor-Task", - "GN1.6-Tuned-Arena-GR1-PlaceItemCloseDoor-Task", - "gn1.6-tuned-arena-gr1-placeitemclosedoor-task" + "GN1.6-Tuned-Arena-GR1-PlaceItemCloseDoor-Task" ], "model_types": [ "robotics" @@ -22077,9 +21132,7 @@ { "name": "nvidia/gear-sonic", "alias": [ - "nvidia/GEAR-SONIC", - "GEAR-SONIC", - "gear-sonic" + "GEAR-SONIC" ], "model_types": [ "robotics" @@ -22088,9 +21141,7 @@ { "name": "nvidia/glm-5-nvfp4", "alias": [ - "nvidia/GLM-5-NVFP4", - "GLM-5-NVFP4", - "glm-5-nvfp4" + "GLM-5-NVFP4" ], "max_tokens": 131072, "model_types": [ @@ -22100,9 +21151,7 @@ { "name": "nvidia/kimodo-soma-seed-v1.1", "alias": [ - "nvidia/Kimodo-SOMA-SEED-v1.1", - "Kimodo-SOMA-SEED-v1.1", - "kimodo-soma-seed-v1.1" + "Kimodo-SOMA-SEED-v1.1" ], "model_types": [ "robotics" @@ -22111,9 +21160,7 @@ { "name": "nvidia/kimodo-soma-rp-v1.1", "alias": [ - "nvidia/Kimodo-SOMA-RP-v1.1", - "Kimodo-SOMA-RP-v1.1", - "kimodo-soma-rp-v1.1" + "Kimodo-SOMA-RP-v1.1" ], "model_types": [ "robotics" @@ -22122,9 +21169,7 @@ { "name": "nvidia/tmr-soma-rp-v1", "alias": [ - "nvidia/TMR-SOMA-RP-v1", - "TMR-SOMA-RP-v1", - "tmr-soma-rp-v1" + "TMR-SOMA-RP-v1" ], "model_types": [ "robotics" @@ -22133,9 +21178,7 @@ { "name": "nvidia/egm-8b-sft", "alias": [ - "nvidia/EGM-8B-SFT", - "EGM-8B-SFT", - "egm-8b-sft" + "EGM-8B-SFT" ], "model_types": [ "chat", @@ -22146,9 +21189,7 @@ { "name": "nvidia/egm-4b-sft", "alias": [ - "nvidia/EGM-4B-SFT", - "EGM-4B-SFT", - "egm-4b-sft" + "EGM-4B-SFT" ], "model_types": [ "chat", @@ -22159,9 +21200,7 @@ { "name": "nvidia/egm-8b", "alias": [ - "nvidia/EGM-8B", - "EGM-8B", - "egm-8b" + "EGM-8B" ], "model_types": [ "chat", @@ -22172,9 +21211,7 @@ { "name": "nvidia/egm-4b", "alias": [ - "nvidia/EGM-4B", - "EGM-4B", - "egm-4b" + "EGM-4B" ], "model_types": [ "chat", @@ -22196,9 +21233,7 @@ { "name": "nvidia/esm2_t48_15b_ur50d", "alias": [ - "nvidia/esm2_t48_15B_UR50D", - "esm2_t48_15B_UR50D", - "esm2_t48_15b_ur50d" + "esm2_t48_15B_UR50D" ], "model_types": [ "other" @@ -22207,9 +21242,7 @@ { "name": "nvidia/esm2_t36_3b_ur50d", "alias": [ - "nvidia/esm2_t36_3B_UR50D", - "esm2_t36_3B_UR50D", - "esm2_t36_3b_ur50d" + "esm2_t36_3B_UR50D" ], "model_types": [ "other" @@ -22218,9 +21251,7 @@ { "name": "nvidia/esm2_t33_650m_ur50d", "alias": [ - "nvidia/esm2_t33_650M_UR50D", - "esm2_t33_650M_UR50D", - "esm2_t33_650m_ur50d" + "esm2_t33_650M_UR50D" ], "model_types": [ "other" @@ -22238,9 +21269,7 @@ { "name": "nvidia/nvidia-nemotron-3-nano-4b-fp8", "alias": [ - "nvidia/NVIDIA-Nemotron-3-Nano-4B-FP8", - "NVIDIA-Nemotron-3-Nano-4B-FP8", - "nvidia-nemotron-3-nano-4b-fp8" + "NVIDIA-Nemotron-3-Nano-4B-FP8" ], "max_tokens": 262144, "model_types": [ @@ -22250,9 +21279,7 @@ { "name": "nvidia/nvidia-nemotron-3-nano-4b-bf16", "alias": [ - "nvidia/NVIDIA-Nemotron-3-Nano-4B-BF16", - "NVIDIA-Nemotron-3-Nano-4B-BF16", - "nvidia-nemotron-3-nano-4b-bf16" + "NVIDIA-Nemotron-3-Nano-4B-BF16" ], "max_tokens": 262144, "model_types": [ @@ -22262,9 +21289,7 @@ { "name": "nvidia/nvila-8b-hd-video", "alias": [ - "nvidia/NVILA-8B-HD-Video", - "NVILA-8B-HD-Video", - "nvila-8b-hd-video" + "NVILA-8B-HD-Video" ], "model_types": [ "video_generation" @@ -22273,9 +21298,7 @@ { "name": "nvidia/autogaze", "alias": [ - "nvidia/AutoGaze", - "AutoGaze", - "autogaze" + "AutoGaze" ], "model_types": [ "vision" @@ -22284,9 +21307,7 @@ { "name": "nvidia/cosmos-tokenizer-surg", "alias": [ - "nvidia/Cosmos-Tokenizer-Surg", - "Cosmos-Tokenizer-Surg", - "cosmos-tokenizer-surg" + "Cosmos-Tokenizer-Surg" ], "model_types": [ "other" @@ -22295,9 +21316,7 @@ { "name": "nvidia/nvidia-nemotron-3-nano-4b-gguf", "alias": [ - "nvidia/NVIDIA-Nemotron-3-Nano-4B-GGUF", - "NVIDIA-Nemotron-3-Nano-4B-GGUF", - "nvidia-nemotron-3-nano-4b-gguf" + "NVIDIA-Nemotron-3-Nano-4B-GGUF" ], "max_tokens": 262144, "model_types": [ @@ -22307,9 +21326,7 @@ { "name": "nvidia/soma-x", "alias": [ - "nvidia/SOMA-X", - "SOMA-X", - "soma-x" + "SOMA-X" ], "model_types": [ "robotics" @@ -22318,9 +21335,7 @@ { "name": "nvidia/kimodo-smplx-rp-v1", "alias": [ - "nvidia/Kimodo-SMPLX-RP-v1", - "Kimodo-SMPLX-RP-v1", - "kimodo-smplx-rp-v1" + "Kimodo-SMPLX-RP-v1" ], "model_types": [ "robotics" @@ -22329,9 +21344,7 @@ { "name": "nvidia/kimodo-soma-rp-v1", "alias": [ - "nvidia/Kimodo-SOMA-RP-v1", - "Kimodo-SOMA-RP-v1", - "kimodo-soma-rp-v1" + "Kimodo-SOMA-RP-v1" ], "model_types": [ "robotics" @@ -22340,9 +21353,7 @@ { "name": "nvidia/kimodo-soma-seed-v1", "alias": [ - "nvidia/Kimodo-SOMA-SEED-v1", - "Kimodo-SOMA-SEED-v1", - "kimodo-soma-seed-v1" + "Kimodo-SOMA-SEED-v1" ], "model_types": [ "robotics" @@ -22351,9 +21362,7 @@ { "name": "nvidia/kimodo-g1-seed-v1", "alias": [ - "nvidia/Kimodo-G1-SEED-v1", - "Kimodo-G1-SEED-v1", - "kimodo-g1-seed-v1" + "Kimodo-G1-SEED-v1" ], "model_types": [ "robotics" @@ -22362,9 +21371,7 @@ { "name": "nvidia/kimodo-g1-rp-v1", "alias": [ - "nvidia/Kimodo-G1-RP-v1", - "Kimodo-G1-RP-v1", - "kimodo-g1-rp-v1" + "Kimodo-G1-RP-v1" ], "model_types": [ "robotics" @@ -22382,9 +21389,7 @@ { "name": "nvidia/nv-proteina-complexa-ame-160m-v1", "alias": [ - "nvidia/NV-Proteina-Complexa-AME-160M-v1", - "NV-Proteina-Complexa-AME-160M-v1", - "nv-proteina-complexa-ame-160m-v1" + "NV-Proteina-Complexa-AME-160M-v1" ], "model_types": [ "other" @@ -22393,9 +21398,7 @@ { "name": "nvidia/nv-proteina-complexa-protein-target-160m-v1", "alias": [ - "nvidia/NV-Proteina-Complexa-Protein-Target-160M-v1", - "NV-Proteina-Complexa-Protein-Target-160M-v1", - "nv-proteina-complexa-protein-target-160m-v1" + "NV-Proteina-Complexa-Protein-Target-160M-v1" ], "model_types": [ "other" @@ -22404,9 +21407,7 @@ { "name": "nvidia/nv-proteina-complexa-ligand-target-160m-v1", "alias": [ - "nvidia/NV-Proteina-Complexa-Ligand-Target-160M-v1", - "NV-Proteina-Complexa-Ligand-Target-160M-v1", - "nv-proteina-complexa-ligand-target-160m-v1" + "NV-Proteina-Complexa-Ligand-Target-160M-v1" ], "model_types": [ "other" @@ -22415,9 +21416,7 @@ { "name": "nvidia/nvidia-nemotron-3-nano-30b-a3b-base-bf16", "alias": [ - "nvidia/NVIDIA-Nemotron-3-Nano-30B-A3B-Base-BF16", - "NVIDIA-Nemotron-3-Nano-30B-A3B-Base-BF16", - "nvidia-nemotron-3-nano-30b-a3b-base-bf16" + "NVIDIA-Nemotron-3-Nano-30B-A3B-Base-BF16" ], "max_tokens": 262144, "model_types": [ @@ -22427,9 +21426,7 @@ { "name": "nvidia/nvidia-nemotron-3-nano-30b-a3b-nvfp4", "alias": [ - "nvidia/NVIDIA-Nemotron-3-Nano-30B-A3B-NVFP4", - "NVIDIA-Nemotron-3-Nano-30B-A3B-NVFP4", - "nvidia-nemotron-3-nano-30b-a3b-nvfp4" + "NVIDIA-Nemotron-3-Nano-30B-A3B-NVFP4" ], "max_tokens": 262144, "model_types": [ @@ -22439,9 +21436,8 @@ { "name": "nvidia/nvidia-nemotron-3-nano-30b-a3b-bf16", "alias": [ - "nvidia/NVIDIA-Nemotron-3-Nano-30B-A3B-BF16", "NVIDIA-Nemotron-3-Nano-30B-A3B-BF16", - "nvidia-nemotron-3-nano-30b-a3b-bf16" + "Nvidia Nemotron 3 Nano 30B A3b Bf16" ], "max_tokens": 262144, "model_types": [ @@ -22451,9 +21447,7 @@ { "name": "nvidia/nvidia-nemotron-3-nano-30b-a3b-fp8", "alias": [ - "nvidia/NVIDIA-Nemotron-3-Nano-30B-A3B-FP8", - "NVIDIA-Nemotron-3-Nano-30B-A3B-FP8", - "nvidia-nemotron-3-nano-30b-a3b-fp8" + "NVIDIA-Nemotron-3-Nano-30B-A3B-FP8" ], "max_tokens": 262144, "model_types": [ @@ -22463,9 +21457,7 @@ { "name": "nvidia/nvidia-nemotron-3-super-120b-a12b-base-bf16", "alias": [ - "nvidia/NVIDIA-Nemotron-3-Super-120B-A12B-Base-BF16", - "NVIDIA-Nemotron-3-Super-120B-A12B-Base-BF16", - "nvidia-nemotron-3-super-120b-a12b-base-bf16" + "NVIDIA-Nemotron-3-Super-120B-A12B-Base-BF16" ], "max_tokens": 262144, "model_types": [ @@ -22475,9 +21467,7 @@ { "name": "nvidia/cosmos-embed1-448p", "alias": [ - "nvidia/Cosmos-Embed1-448p", - "Cosmos-Embed1-448p", - "cosmos-embed1-448p" + "Cosmos-Embed1-448p" ], "model_types": [ "embedding", @@ -22487,9 +21477,7 @@ { "name": "nvidia/cosmos-embed1-336p", "alias": [ - "nvidia/Cosmos-Embed1-336p", - "Cosmos-Embed1-336p", - "cosmos-embed1-336p" + "Cosmos-Embed1-336p" ], "model_types": [ "embedding", @@ -22499,9 +21487,7 @@ { "name": "nvidia/gr00t-n1.5-rl-rheo-assembletrocar", "alias": [ - "nvidia/GR00T-N1.5-RL-Rheo-AssembleTrocar", - "GR00T-N1.5-RL-Rheo-AssembleTrocar", - "gr00t-n1.5-rl-rheo-assembletrocar" + "GR00T-N1.5-RL-Rheo-AssembleTrocar" ], "model_types": [ "other" @@ -22510,9 +21496,7 @@ { "name": "nvidia/gr00t-n1.6-rheo-sim-pushcart", "alias": [ - "nvidia/GR00T-N1.6-Rheo-Sim-PushCart", - "GR00T-N1.6-Rheo-Sim-PushCart", - "gr00t-n1.6-rheo-sim-pushcart" + "GR00T-N1.6-Rheo-Sim-PushCart" ], "model_types": [ "other" @@ -22521,9 +21505,7 @@ { "name": "nvidia/gr00t-n1.6-rheo-picknplacetray", "alias": [ - "nvidia/GR00T-N1.6-Rheo-PickNPlaceTray", - "GR00T-N1.6-Rheo-PickNPlaceTray", - "gr00t-n1.6-rheo-picknplacetray" + "GR00T-N1.6-Rheo-PickNPlaceTray" ], "model_types": [ "other" @@ -22532,9 +21514,7 @@ { "name": "nvidia/cosmos-embed1-224p", "alias": [ - "nvidia/Cosmos-Embed1-224p", - "Cosmos-Embed1-224p", - "cosmos-embed1-224p" + "Cosmos-Embed1-224p" ], "model_types": [ "embedding", @@ -22544,9 +21524,7 @@ { "name": "nvidia/kimi-k2-thinking-eagle3", "alias": [ - "nvidia/Kimi-K2-Thinking-Eagle3", - "Kimi-K2-Thinking-Eagle3", - "kimi-k2-thinking-eagle3" + "Kimi-K2-Thinking-Eagle3" ], "max_tokens": 262144, "model_types": [ @@ -22587,9 +21565,7 @@ { "name": "nvidia/qwen3-30b-a3b-thinking-2507-eagle3", "alias": [ - "nvidia/Qwen3-30B-A3B-Thinking-2507-Eagle3", - "Qwen3-30B-A3B-Thinking-2507-Eagle3", - "qwen3-30b-a3b-thinking-2507-eagle3" + "Qwen3-30B-A3B-Thinking-2507-Eagle3" ], "max_tokens": 262144, "model_types": [ @@ -22603,9 +21579,7 @@ { "name": "nvidia/qwen3-235b-a22b-thinking-2507-fp4-eagle3", "alias": [ - "nvidia/Qwen3-235B-A22B-Thinking-2507-FP4-Eagle3", - "Qwen3-235B-A22B-Thinking-2507-FP4-Eagle3", - "qwen3-235b-a22b-thinking-2507-fp4-eagle3" + "Qwen3-235B-A22B-Thinking-2507-FP4-Eagle3" ], "max_tokens": 262144, "model_types": [ @@ -22619,9 +21593,7 @@ { "name": "nvidia/qwen3-235b-a22b-thinking-2507-eagle3", "alias": [ - "nvidia/Qwen3-235B-A22B-Thinking-2507-Eagle3", - "Qwen3-235B-A22B-Thinking-2507-Eagle3", - "qwen3-235b-a22b-thinking-2507-eagle3" + "Qwen3-235B-A22B-Thinking-2507-Eagle3" ], "max_tokens": 262144, "model_types": [ @@ -22635,9 +21607,7 @@ { "name": "nvidia/qwen3-nemotron-235b-a22b-genrm-2603", "alias": [ - "nvidia/Qwen3-Nemotron-235B-A22B-GenRM-2603", - "Qwen3-Nemotron-235B-A22B-GenRM-2603", - "qwen3-nemotron-235b-a22b-genrm-2603" + "Qwen3-Nemotron-235B-A22B-GenRM-2603" ], "max_tokens": 262144, "model_types": [ @@ -22651,9 +21621,7 @@ { "name": "nvidia/audio2emotion-v2.2", "alias": [ - "nvidia/Audio2Emotion-v2.2", - "Audio2Emotion-v2.2", - "audio2emotion-v2.2" + "Audio2Emotion-v2.2" ], "model_types": [ "audio" @@ -22662,9 +21630,7 @@ { "name": "nvidia/audio2emotion-v3.0", "alias": [ - "nvidia/Audio2Emotion-v3.0", - "Audio2Emotion-v3.0", - "audio2emotion-v3.0" + "Audio2Emotion-v3.0" ], "model_types": [ "audio" @@ -22673,9 +21639,7 @@ { "name": "nvidia/diffit", "alias": [ - "nvidia/DiffiT", - "DiffiT", - "diffit" + "DiffiT" ], "model_types": [ "image" @@ -22729,9 +21693,8 @@ { "name": "nvidia/nvidia-nemotron-nano-9b-v2", "alias": [ - "nvidia/NVIDIA-Nemotron-Nano-9B-v2", "NVIDIA-Nemotron-Nano-9B-v2", - "nvidia-nemotron-nano-9b-v2" + "Nvidia Nemotron Nano 9B V2" ], "max_tokens": 262144, "model_types": [ @@ -22759,9 +21722,7 @@ { "name": "nvidia/qwen3-vl-235b-a22b-instruct-nvfp4", "alias": [ - "nvidia/Qwen3-VL-235B-A22B-Instruct-NVFP4", - "Qwen3-VL-235B-A22B-Instruct-NVFP4", - "qwen3-vl-235b-a22b-instruct-nvfp4" + "Qwen3-VL-235B-A22B-Instruct-NVFP4" ], "max_tokens": 262144, "model_types": [ @@ -22773,9 +21734,7 @@ { "name": "nvidia/cosmos-predict2.5-2b", "alias": [ - "nvidia/Cosmos-Predict2.5-2B", - "Cosmos-Predict2.5-2B", - "cosmos-predict2.5-2b" + "Cosmos-Predict2.5-2B" ], "model_types": [ "video_generation" @@ -22795,9 +21754,7 @@ { "name": "nvidia/nemotron-research-goosereason-4b-instruct", "alias": [ - "nvidia/Nemotron-Research-GooseReason-4B-Instruct", - "Nemotron-Research-GooseReason-4B-Instruct", - "nemotron-research-goosereason-4b-instruct" + "Nemotron-Research-GooseReason-4B-Instruct" ], "max_tokens": 262144, "model_types": [ @@ -22811,9 +21768,7 @@ { "name": "nvidia/nemotron-terminal-32b", "alias": [ - "nvidia/Nemotron-Terminal-32B", - "Nemotron-Terminal-32B", - "nemotron-terminal-32b" + "Nemotron-Terminal-32B" ], "max_tokens": 262144, "model_types": [ @@ -22827,9 +21782,7 @@ { "name": "nvidia/nemotron-terminal-14b", "alias": [ - "nvidia/Nemotron-Terminal-14B", - "Nemotron-Terminal-14B", - "nemotron-terminal-14b" + "Nemotron-Terminal-14B" ], "max_tokens": 262144, "model_types": [ @@ -22843,9 +21796,7 @@ { "name": "nvidia/nemotron-terminal-8b", "alias": [ - "nvidia/Nemotron-Terminal-8B", - "Nemotron-Terminal-8B", - "nemotron-terminal-8b" + "Nemotron-Terminal-8B" ], "max_tokens": 262144, "model_types": [ @@ -22859,9 +21810,7 @@ { "name": "nvidia/dreamdojo", "alias": [ - "nvidia/DreamDojo", - "DreamDojo", - "dreamdojo" + "DreamDojo" ], "model_types": [ "video_generation" @@ -22899,9 +21848,7 @@ { "name": "nvidia/physicalai-simulation-vomp-model", "alias": [ - "nvidia/PhysicalAI-Simulation-VoMP-Model", - "PhysicalAI-Simulation-VoMP-Model", - "physicalai-simulation-vomp-model" + "PhysicalAI-Simulation-VoMP-Model" ], "model_types": [ "other" @@ -22910,9 +21857,7 @@ { "name": "nvidia/cosmos-transfer2.5-2b", "alias": [ - "nvidia/Cosmos-Transfer2.5-2B", - "Cosmos-Transfer2.5-2B", - "cosmos-transfer2.5-2b" + "Cosmos-Transfer2.5-2B" ], "model_types": [ "video_generation" @@ -22921,9 +21866,7 @@ { "name": "nvidia/llama-3.3-70b-instruct-eagle3", "alias": [ - "nvidia/Llama-3.3-70B-Instruct-Eagle3", - "Llama-3.3-70B-Instruct-Eagle3", - "llama-3.3-70b-instruct-eagle3" + "Llama-3.3-70B-Instruct-Eagle3" ], "model_types": [ "other" @@ -22932,9 +21875,7 @@ { "name": "nvidia/kimi-k2-thinking-nvfp4", "alias": [ - "nvidia/Kimi-K2-Thinking-NVFP4", - "Kimi-K2-Thinking-NVFP4", - "kimi-k2-thinking-nvfp4" + "Kimi-K2-Thinking-NVFP4" ], "max_tokens": 262144, "model_types": [ @@ -22948,9 +21889,7 @@ { "name": "nvidia/qwen3-next-80b-a3b-thinking-nvfp4", "alias": [ - "nvidia/Qwen3-Next-80B-A3B-Thinking-NVFP4", - "Qwen3-Next-80B-A3B-Thinking-NVFP4", - "qwen3-next-80b-a3b-thinking-nvfp4" + "Qwen3-Next-80B-A3B-Thinking-NVFP4" ], "max_tokens": 262144, "model_types": [ @@ -22964,9 +21903,7 @@ { "name": "nvidia/qwen3-next-80b-a3b-instruct-nvfp4", "alias": [ - "nvidia/Qwen3-Next-80B-A3B-Instruct-NVFP4", - "Qwen3-Next-80B-A3B-Instruct-NVFP4", - "qwen3-next-80b-a3b-instruct-nvfp4" + "Qwen3-Next-80B-A3B-Instruct-NVFP4" ], "max_tokens": 262144, "model_types": [ @@ -22976,9 +21913,7 @@ { "name": "nvidia/parakeet-ctc-0.6b-vietnamese", "alias": [ - "nvidia/parakeet-ctc-0.6b-Vietnamese", - "parakeet-ctc-0.6b-Vietnamese", - "parakeet-ctc-0.6b-vietnamese" + "parakeet-ctc-0.6b-Vietnamese" ], "model_types": [ "asr" @@ -22987,9 +21922,7 @@ { "name": "nvidia/nitrogen", "alias": [ - "nvidia/NitroGen", - "NitroGen", - "nitrogen" + "NitroGen" ], "model_types": [ "robotics" @@ -22998,9 +21931,7 @@ { "name": "nvidia/qwen3-coder-480b-a35b-instruct-nvfp4", "alias": [ - "nvidia/Qwen3-Coder-480B-A35B-Instruct-NVFP4", - "Qwen3-Coder-480B-A35B-Instruct-NVFP4", - "qwen3-coder-480b-a35b-instruct-nvfp4" + "Qwen3-Coder-480B-A35B-Instruct-NVFP4" ], "max_tokens": 262144, "model_types": [ @@ -23028,9 +21959,7 @@ { "name": "nvidia/qwen3-vl-235b-a22b-instruct-nvfp4-mlperf-inference-closed-v6.0", "alias": [ - "nvidia/Qwen3-VL-235B-A22B-Instruct-NVFP4-MLPerf-Inference-Closed-V6.0", - "Qwen3-VL-235B-A22B-Instruct-NVFP4-MLPerf-Inference-Closed-V6.0", - "qwen3-vl-235b-a22b-instruct-nvfp4-mlperf-inference-closed-v6.0" + "Qwen3-VL-235B-A22B-Instruct-NVFP4-MLPerf-Inference-Closed-V6.0" ], "max_tokens": 262144, "model_types": [ @@ -23042,9 +21971,7 @@ { "name": "nvidia/cosmos-policy-aloha-planning-model-predict2-2b", "alias": [ - "nvidia/Cosmos-Policy-ALOHA-Planning-Model-Predict2-2B", - "Cosmos-Policy-ALOHA-Planning-Model-Predict2-2B", - "cosmos-policy-aloha-planning-model-predict2-2b" + "Cosmos-Policy-ALOHA-Planning-Model-Predict2-2B" ], "model_types": [ "robotics" @@ -23053,9 +21980,7 @@ { "name": "nvidia/cosmos-policy-aloha-predict2-2b", "alias": [ - "nvidia/Cosmos-Policy-ALOHA-Predict2-2B", - "Cosmos-Policy-ALOHA-Predict2-2B", - "cosmos-policy-aloha-predict2-2b" + "Cosmos-Policy-ALOHA-Predict2-2B" ], "model_types": [ "robotics" @@ -23064,9 +21989,7 @@ { "name": "nvidia/cosmos-policy-robocasa-predict2-2b", "alias": [ - "nvidia/Cosmos-Policy-RoboCasa-Predict2-2B", - "Cosmos-Policy-RoboCasa-Predict2-2B", - "cosmos-policy-robocasa-predict2-2b" + "Cosmos-Policy-RoboCasa-Predict2-2B" ], "model_types": [ "robotics" @@ -23075,9 +21998,7 @@ { "name": "nvidia/cosmos-policy-libero-predict2-2b", "alias": [ - "nvidia/Cosmos-Policy-LIBERO-Predict2-2B", - "Cosmos-Policy-LIBERO-Predict2-2B", - "cosmos-policy-libero-predict2-2b" + "Cosmos-Policy-LIBERO-Predict2-2B" ], "model_types": [ "robotics" @@ -23086,9 +22007,7 @@ { "name": "nvidia/gr00t-n1.6-droid", "alias": [ - "nvidia/GR00T-N1.6-DROID", - "GR00T-N1.6-DROID", - "gr00t-n1.6-droid" + "GR00T-N1.6-DROID" ], "model_types": [ "other" @@ -23097,9 +22016,7 @@ { "name": "nvidia/qwen3-235b-a22b-thinking-2507-nvfp4", "alias": [ - "nvidia/Qwen3-235B-A22B-Thinking-2507-NVFP4", - "Qwen3-235B-A22B-Thinking-2507-NVFP4", - "qwen3-235b-a22b-thinking-2507-nvfp4" + "Qwen3-235B-A22B-Thinking-2507-NVFP4" ], "max_tokens": 262144, "model_types": [ @@ -23113,9 +22030,7 @@ { "name": "nvidia/qwen3-235b-a22b-instruct-2507-nvfp4", "alias": [ - "nvidia/Qwen3-235B-A22B-Instruct-2507-NVFP4", - "Qwen3-235B-A22B-Instruct-2507-NVFP4", - "qwen3-235b-a22b-instruct-2507-nvfp4" + "Qwen3-235B-A22B-Instruct-2507-NVFP4" ], "max_tokens": 262144, "model_types": [ @@ -23125,9 +22040,7 @@ { "name": "nvidia/c-radiov2-h", "alias": [ - "nvidia/C-RADIOv2-H", - "C-RADIOv2-H", - "c-radiov2-h" + "C-RADIOv2-H" ], "model_types": [ "embedding", @@ -23137,9 +22050,7 @@ { "name": "nvidia/c-radiov2-l", "alias": [ - "nvidia/C-RADIOv2-L", - "C-RADIOv2-L", - "c-radiov2-l" + "C-RADIOv2-L" ], "model_types": [ "embedding", @@ -23149,9 +22060,7 @@ { "name": "nvidia/c-radiov3-g", "alias": [ - "nvidia/C-RADIOv3-g", - "C-RADIOv3-g", - "c-radiov3-g" + "C-RADIOv3-g" ], "model_types": [ "embedding", @@ -23161,9 +22070,7 @@ { "name": "nvidia/c-radiov3-h", "alias": [ - "nvidia/C-RADIOv3-H", - "C-RADIOv3-H", - "c-radiov3-h" + "C-RADIOv3-H" ], "model_types": [ "embedding", @@ -23173,9 +22080,7 @@ { "name": "nvidia/c-radiov3-l", "alias": [ - "nvidia/C-RADIOv3-L", - "C-RADIOv3-L", - "c-radiov3-l" + "C-RADIOv3-L" ], "model_types": [ "embedding", @@ -23185,9 +22090,7 @@ { "name": "nvidia/c-radiov3-b", "alias": [ - "nvidia/C-RADIOv3-B", - "C-RADIOv3-B", - "c-radiov3-b" + "C-RADIOv3-B" ], "model_types": [ "embedding", @@ -23197,9 +22100,7 @@ { "name": "nvidia/c-radiov4-h", "alias": [ - "nvidia/C-RADIOv4-H", - "C-RADIOv4-H", - "c-radiov4-h" + "C-RADIOv4-H" ], "model_types": [ "embedding", @@ -23209,9 +22110,7 @@ { "name": "nvidia/c-radiov4-so400m", "alias": [ - "nvidia/C-RADIOv4-SO400M", - "C-RADIOv4-SO400M", - "c-radiov4-so400m" + "C-RADIOv4-SO400M" ], "model_types": [ "embedding", @@ -23221,9 +22120,7 @@ { "name": "nvidia/c-radiov2-b", "alias": [ - "nvidia/C-RADIOv2-B", - "C-RADIOv2-B", - "c-radiov2-b" + "C-RADIOv2-B" ], "model_types": [ "embedding", @@ -23242,9 +22139,7 @@ { "name": "nvidia/gpt-oss-120b-eagle3-short-context", "alias": [ - "nvidia/gpt-oss-120b-Eagle3-short-context", - "gpt-oss-120b-Eagle3-short-context", - "gpt-oss-120b-eagle3-short-context" + "gpt-oss-120b-Eagle3-short-context" ], "max_tokens": 131072, "model_types": [ @@ -23254,9 +22149,7 @@ { "name": "nvidia/gpt-oss-120b-eagle3-throughput", "alias": [ - "nvidia/gpt-oss-120b-Eagle3-throughput", - "gpt-oss-120b-Eagle3-throughput", - "gpt-oss-120b-eagle3-throughput" + "gpt-oss-120b-Eagle3-throughput" ], "max_tokens": 131072, "model_types": [ @@ -23266,9 +22159,7 @@ { "name": "nvidia/qwen3-235b-a22b-eagle3", "alias": [ - "nvidia/Qwen3-235B-A22B-Eagle3", - "Qwen3-235B-A22B-Eagle3", - "qwen3-235b-a22b-eagle3" + "Qwen3-235B-A22B-Eagle3" ], "max_tokens": 262144, "model_types": [ @@ -23278,9 +22169,7 @@ { "name": "nvidia/gpt-oss-120b-eagle3-long-context", "alias": [ - "nvidia/gpt-oss-120b-Eagle3-long-context", - "gpt-oss-120b-Eagle3-long-context", - "gpt-oss-120b-eagle3-long-context" + "gpt-oss-120b-Eagle3-long-context" ], "max_tokens": 131072, "model_types": [ @@ -23290,9 +22179,7 @@ { "name": "nvidia/gn16-tuned-arena-gr1-manipulation", "alias": [ - "nvidia/GN16-Tuned-Arena-GR1-Manipulation", - "GN16-Tuned-Arena-GR1-Manipulation", - "gn16-tuned-arena-gr1-manipulation" + "GN16-Tuned-Arena-GR1-Manipulation" ], "model_types": [ "robotics" @@ -23301,9 +22188,7 @@ { "name": "nvidia/qwen3-8b-dms-8x", "alias": [ - "nvidia/Qwen3-8B-DMS-8x", - "Qwen3-8B-DMS-8x", - "qwen3-8b-dms-8x" + "Qwen3-8B-DMS-8x" ], "max_tokens": 262144, "model_types": [ @@ -23313,9 +22198,7 @@ { "name": "nvidia/kvzap-mlp-llama-3.1-8b-instruct", "alias": [ - "nvidia/KVzap-mlp-Llama-3.1-8B-Instruct", - "KVzap-mlp-Llama-3.1-8B-Instruct", - "kvzap-mlp-llama-3.1-8b-instruct" + "KVzap-mlp-Llama-3.1-8B-Instruct" ], "model_types": [ "other" @@ -23324,9 +22207,7 @@ { "name": "nvidia/kvzap-mlp-qwen3-32b", "alias": [ - "nvidia/KVzap-mlp-Qwen3-32B", - "KVzap-mlp-Qwen3-32B", - "kvzap-mlp-qwen3-32b" + "KVzap-mlp-Qwen3-32B" ], "max_tokens": 262144, "model_types": [ @@ -23336,9 +22217,7 @@ { "name": "nvidia/kvzap-mlp-qwen3-8b", "alias": [ - "nvidia/KVzap-mlp-Qwen3-8B", - "KVzap-mlp-Qwen3-8B", - "kvzap-mlp-qwen3-8b" + "KVzap-mlp-Qwen3-8B" ], "max_tokens": 262144, "model_types": [ @@ -23348,9 +22227,7 @@ { "name": "nvidia/kvzap-linear-llama-3.1-8b-instruct", "alias": [ - "nvidia/KVzap-linear-Llama-3.1-8B-Instruct", - "KVzap-linear-Llama-3.1-8B-Instruct", - "kvzap-linear-llama-3.1-8b-instruct" + "KVzap-linear-Llama-3.1-8B-Instruct" ], "model_types": [ "other" @@ -23359,9 +22236,7 @@ { "name": "nvidia/kvzap-linear-qwen3-32b", "alias": [ - "nvidia/KVzap-linear-Qwen3-32B", - "KVzap-linear-Qwen3-32B", - "kvzap-linear-qwen3-32b" + "KVzap-linear-Qwen3-32B" ], "max_tokens": 262144, "model_types": [ @@ -23371,9 +22246,7 @@ { "name": "nvidia/kvzap-linear-qwen3-8b", "alias": [ - "nvidia/KVzap-linear-Qwen3-8B", - "KVzap-linear-Qwen3-8B", - "kvzap-linear-qwen3-8b" + "KVzap-linear-Qwen3-8B" ], "max_tokens": 262144, "model_types": [ @@ -23383,9 +22256,7 @@ { "name": "nvidia/deepseek-v3.2-nvfp4", "alias": [ - "nvidia/DeepSeek-V3.2-NVFP4", - "DeepSeek-V3.2-NVFP4", - "deepseek-v3.2-nvfp4" + "DeepSeek-V3.2-NVFP4" ], "max_tokens": 163840, "model_types": [ @@ -23399,9 +22270,7 @@ { "name": "nvidia/riva-translate-4b-instruct-v1.1", "alias": [ - "nvidia/Riva-Translate-4B-Instruct-v1.1", - "Riva-Translate-4B-Instruct-v1.1", - "riva-translate-4b-instruct-v1.1" + "Riva-Translate-4B-Instruct-v1.1" ], "model_types": [ "chat" @@ -23410,9 +22279,7 @@ { "name": "nvidia/nemotron-4-mini-hindi-4b-base", "alias": [ - "nvidia/Nemotron-4-Mini-Hindi-4B-Base", - "Nemotron-4-Mini-Hindi-4B-Base", - "nemotron-4-mini-hindi-4b-base" + "Nemotron-4-Mini-Hindi-4B-Base" ], "max_tokens": 262144, "model_types": [ @@ -23422,9 +22289,7 @@ { "name": "nvidia/deepseek-v3.1-nvfp4", "alias": [ - "nvidia/DeepSeek-V3.1-NVFP4", - "DeepSeek-V3.1-NVFP4", - "deepseek-v3.1-nvfp4" + "DeepSeek-V3.1-NVFP4" ], "max_tokens": 163840, "model_types": [ @@ -23438,9 +22303,7 @@ { "name": "nvidia/qwen2.5-vl-7b-surg-cholect50", "alias": [ - "nvidia/Qwen2.5-VL-7B-Surg-CholecT50", - "Qwen2.5-VL-7B-Surg-CholecT50", - "qwen2.5-vl-7b-surg-cholect50" + "Qwen2.5-VL-7B-Surg-CholecT50" ], "max_tokens": 131072, "model_types": [ @@ -23452,9 +22315,7 @@ { "name": "nvidia/rnapro-private-best-500m", "alias": [ - "nvidia/RNAPro-Private-Best-500M", - "RNAPro-Private-Best-500M", - "rnapro-private-best-500m" + "RNAPro-Private-Best-500M" ], "model_types": [ "other" @@ -23463,9 +22324,7 @@ { "name": "nvidia/rnapro-public-best-500m", "alias": [ - "nvidia/RNAPro-Public-Best-500M", - "RNAPro-Public-Best-500M", - "rnapro-public-best-500m" + "RNAPro-Public-Best-500M" ], "model_types": [ "other" @@ -23474,9 +22333,7 @@ { "name": "nvidia/nemotron-flash-3b-instruct", "alias": [ - "nvidia/Nemotron-Flash-3B-Instruct", - "Nemotron-Flash-3B-Instruct", - "nemotron-flash-3b-instruct" + "Nemotron-Flash-3B-Instruct" ], "max_tokens": 262144, "model_types": [ @@ -23486,9 +22343,7 @@ { "name": "nvidia/nemotron-flash-3b", "alias": [ - "nvidia/Nemotron-Flash-3B", - "Nemotron-Flash-3B", - "nemotron-flash-3b" + "Nemotron-Flash-3B" ], "max_tokens": 262144, "model_types": [ @@ -23498,9 +22353,7 @@ { "name": "nvidia/nemotron-flash-1b", "alias": [ - "nvidia/Nemotron-Flash-1B", - "Nemotron-Flash-1B", - "nemotron-flash-1b" + "Nemotron-Flash-1B" ], "max_tokens": 262144, "model_types": [ @@ -23510,9 +22363,7 @@ { "name": "nvidia/nv-reasyn-eb-174m-v2", "alias": [ - "nvidia/NV-ReaSyn-EB-174M-v2", - "NV-ReaSyn-EB-174M-v2", - "nv-reasyn-eb-174m-v2" + "NV-ReaSyn-EB-174M-v2" ], "model_types": [ "other" @@ -23521,9 +22372,7 @@ { "name": "nvidia/nv-reasyn-ar-166m-v2", "alias": [ - "nvidia/NV-ReaSyn-AR-166M-v2", - "NV-ReaSyn-AR-166M-v2", - "nv-reasyn-ar-166m-v2" + "NV-ReaSyn-AR-166M-v2" ], "model_types": [ "other" @@ -23532,9 +22381,7 @@ { "name": "nvidia/nv-reasyn-ar-166m-v1", "alias": [ - "nvidia/NV-ReaSyn-AR-166M-v1", - "NV-ReaSyn-AR-166M-v1", - "nv-reasyn-ar-166m-v1" + "NV-ReaSyn-AR-166M-v1" ], "model_types": [ "other" @@ -23543,9 +22390,7 @@ { "name": "nvidia/nvidia-nemotron-nano-9b-v2-nvfp4", "alias": [ - "nvidia/NVIDIA-Nemotron-Nano-9B-v2-NVFP4", - "NVIDIA-Nemotron-Nano-9B-v2-NVFP4", - "nvidia-nemotron-nano-9b-v2-nvfp4" + "NVIDIA-Nemotron-Nano-9B-v2-NVFP4" ], "max_tokens": 262144, "model_types": [ @@ -23555,9 +22400,7 @@ { "name": "nvidia/nvidia-nemotron-nano-9b-v2-fp8", "alias": [ - "nvidia/NVIDIA-Nemotron-Nano-9B-v2-FP8", - "NVIDIA-Nemotron-Nano-9B-v2-FP8", - "nvidia-nemotron-nano-9b-v2-fp8" + "NVIDIA-Nemotron-Nano-9B-v2-FP8" ], "max_tokens": 262144, "model_types": [ @@ -23576,9 +22419,7 @@ { "name": "nvidia/qwen2.5-cascaderl-rm-72b", "alias": [ - "nvidia/Qwen2.5-CascadeRL-RM-72B", - "Qwen2.5-CascadeRL-RM-72B", - "qwen2.5-cascaderl-rm-72b" + "Qwen2.5-CascadeRL-RM-72B" ], "model_types": [ "chat" @@ -23587,9 +22428,7 @@ { "name": "nvidia/nemotron-cascade-8b-thinking", "alias": [ - "nvidia/Nemotron-Cascade-8B-Thinking", - "Nemotron-Cascade-8B-Thinking", - "nemotron-cascade-8b-thinking" + "Nemotron-Cascade-8B-Thinking" ], "max_tokens": 262144, "model_types": [ @@ -23603,9 +22442,7 @@ { "name": "nvidia/nemotron-cascade-8b", "alias": [ - "nvidia/Nemotron-Cascade-8B", - "Nemotron-Cascade-8B", - "nemotron-cascade-8b" + "Nemotron-Cascade-8B" ], "max_tokens": 262144, "model_types": [ @@ -23619,9 +22456,7 @@ { "name": "nvidia/nemotron-cascade-14b-thinking", "alias": [ - "nvidia/Nemotron-Cascade-14B-Thinking", - "Nemotron-Cascade-14B-Thinking", - "nemotron-cascade-14b-thinking" + "Nemotron-Cascade-14B-Thinking" ], "max_tokens": 262144, "model_types": [ @@ -23653,9 +22488,7 @@ { "name": "nvidia/nemotron-cascade-8b-intermediate-ckpts", "alias": [ - "nvidia/Nemotron-Cascade-8B-Intermediate-ckpts", - "Nemotron-Cascade-8B-Intermediate-ckpts", - "nemotron-cascade-8b-intermediate-ckpts" + "Nemotron-Cascade-8B-Intermediate-ckpts" ], "max_tokens": 262144, "model_types": [ @@ -23669,9 +22502,7 @@ { "name": "nvidia/qwen3-nemotron-14b-brrm", "alias": [ - "nvidia/Qwen3-Nemotron-14B-BRRM", - "Qwen3-Nemotron-14B-BRRM", - "qwen3-nemotron-14b-brrm" + "Qwen3-Nemotron-14B-BRRM" ], "max_tokens": 262144, "model_types": [ @@ -23681,9 +22512,7 @@ { "name": "nvidia/qwen3-nemotron-8b-brrm", "alias": [ - "nvidia/Qwen3-Nemotron-8B-BRRM", - "Qwen3-Nemotron-8B-BRRM", - "qwen3-nemotron-8b-brrm" + "Qwen3-Nemotron-8B-BRRM" ], "max_tokens": 262144, "model_types": [ @@ -23711,9 +22540,7 @@ { "name": "nvidia/gr00t-n1.6-3b", "alias": [ - "nvidia/GR00T-N1.6-3B", - "GR00T-N1.6-3B", - "gr00t-n1.6-3b" + "GR00T-N1.6-3B" ], "model_types": [ "other" @@ -24506,6 +23333,11369 @@ "audio", "3d_generation" ] + }, + { + "name": "dall-e-3", + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "gpt-3.5-turbo", + "max_tokens": 4000, + "model_types": [ + "chat" + ], + "alias": [ + "openai/gpt-3.5-turbo" + ] + }, + { + "name": "gpt-3.5-turbo-1106", + "max_tokens": 4000, + "model_types": [ + "chat" + ], + "alias": [ + "openai/gpt-3.5-turbo-1106" + ] + }, + { + "name": "gpt-3.5-turbo-16k", + "max_tokens": 16000, + "model_types": [ + "chat" + ], + "alias": [ + "openai/gpt-3.5-turbo-16k" + ] + }, + { + "name": "gpt-4", + "max_tokens": 8000, + "model_types": [ + "chat", + "vision", + "image2text" + ], + "alias": [ + "gpt-4-all", + "openai/gpt-4" + ] + }, + { + "name": "gpt-4-0125-preview", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "gpt-4-0613", + "max_tokens": 16000, + "model_types": [ + "chat" + ], + "alias": [ + "openai/gpt-4-0613" + ] + }, + { + "name": "gpt-4-1106-preview", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "gpt-4-32k", + "max_tokens": 32000, + "model_types": [ + "chat" + ] + }, + { + "name": "gpt-4-32k-0613", + "max_tokens": 32000, + "model_types": [ + "chat" + ] + }, + { + "name": "tts-1", + "model_types": [ + "tts", + "chat" + ], + "alias": [ + "openai/tts-1" + ] + }, + { + "name": "tts-1-1106", + "model_types": [ + "tts", + "chat" + ], + "alias": [ + "openai/tts-1-1106" + ] + }, + { + "name": "tts-1-hd", + "model_types": [ + "tts", + "chat" + ], + "alias": [ + "openai/tts-1-hd" + ] + }, + { + "name": "tts-1-hd-1106", + "model_types": [ + "tts", + "chat" + ], + "alias": [ + "openai/tts-1-hd-1106" + ] + }, + { + "name": "gpt-3.5-turbo-0125", + "max_tokens": 16000, + "model_types": [ + "chat" + ], + "alias": [ + "openai/gpt-3.5-turbo-0125" + ] + }, + { + "name": "gpt-3.5-turbo-instruct", + "max_tokens": 4000, + "model_types": [ + "chat" + ] + }, + { + "name": "gpt-4-gizmo-*", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "text-embedding-3-large", + "model_types": [ + "embedding", + "chat" + ], + "alias": [ + "openai/text-embedding-3-large" + ] + }, + { + "name": "text-embedding-3-small", + "model_types": [ + "embedding", + "chat" + ], + "alias": [ + "openai/text-embedding-3-small" + ] + }, + { + "name": "text-embedding-ada-002", + "model_types": [ + "embedding", + "chat" + ], + "alias": [ + "openai/text-embedding-ada-002" + ] + }, + { + "name": "claude-3-haiku-20240307", + "alias": [ + "claude-3-haiku" + ], + "max_tokens": 200000, + "model_types": [ + "chat" + ] + }, + { + "name": "glm-4-0520", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "glm-4v", + "max_tokens": 32000, + "model_types": [ + "chat", + "image2text", + "vision" + ] + }, + { + "name": "Baichuan-Text-Embedding", + "model_types": [ + "embedding" + ] + }, + { + "name": "Baichuan2-53B", + "max_tokens": 32000, + "model_types": [ + "chat" + ] + }, + { + "name": "Baichuan2-Turbo", + "max_tokens": 32000, + "model_types": [ + "chat" + ] + }, + { + "name": "Baichuan2-Turbo-192k", + "max_tokens": 192000, + "model_types": [ + "chat" + ] + }, + { + "name": "moonshot-v1-128k", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "moonshot-v1-32k", + "max_tokens": 32000, + "model_types": [ + "chat" + ] + }, + { + "name": "moonshot-v1-8k", + "max_tokens": 8000, + "model_types": [ + "chat" + ] + }, + { + "name": "whisper-1", + "model_types": [ + "asr", + "speech2text" + ] + }, + { + "name": "tavily", + "model_types": [ + "chat" + ] + }, + { + "name": "searchapi", + "model_types": [ + "chat" + ] + }, + { + "name": "clipdrop", + "model_types": [ + "chat" + ] + }, + { + "name": "vectorizer", + "model_types": [ + "chat" + ] + }, + { + "name": "ernie-4.0-8k", + "max_tokens": 8000, + "model_types": [ + "chat" + ] + }, + { + "name": "stable-diffusion", + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "gpt-4-turbo", + "max_tokens": 128000, + "model_types": [ + "chat", + "vision", + "image2text" + ], + "alias": [ + "openai/gpt-4-turbo" + ] + }, + { + "name": "302", + "alias": [ + "302 API" + ], + "model_types": [ + "chat" + ] + }, + { + "name": "gpt-4o", + "max_tokens": 128000, + "model_types": [ + "chat", + "vision", + "image2text" + ], + "alias": [ + "gpt-4o-all", + "openai/gpt-4o" + ] + }, + { + "name": "glm-4-air", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "glm-4-flash", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "zhipu-embedding-2", + "model_types": [ + "embedding" + ] + }, + { + "name": "Doubao-pro-32k", + "max_tokens": 32000, + "model_types": [ + "chat" + ], + "alias": [ + "doubao-pro-32k-character-240528", + "doubao-pro-32k-functioncall-240515", + "doubao-pro-32k-browsing-240615", + "doubao-pro-32k-240615", + "doubao-pro-32k-functioncall-240815", + "doubao-pro-32k-240828", + "doubao-pro-32k-character-240828", + "doubao-pro-32k-browsing-240828", + "doubao-pro-32k-functioncall-preview", + "doubao-pro-32k-functioncall-241028", + "doubao-pro-32k-browsing-241115", + "doubao-pro-32k-character-241215", + "doubao-pro-32k-241215" + ], + "max_completion_tokens": 16384 + }, + { + "name": "Doubao-pro-128k", + "max_tokens": 128000, + "model_types": [ + "chat" + ], + "alias": [ + "doubao-pro-128k-240515", + "doubao-pro-128k-240628" + ] + }, + { + "name": "claude-3-5-sonnet-20240620", + "max_tokens": 200000, + "model_types": [ + "chat" + ] + }, + { + "name": "luma", + "model_types": [ + "chat" + ] + }, + { + "name": "step-1v-32k", + "max_tokens": 32000, + "model_types": [ + "chat" + ] + }, + { + "name": "step-1v-8k", + "max_tokens": 8000, + "model_types": [ + "chat" + ] + }, + { + "name": "yi-vision", + "alias": [ + "yi-vision-v2" + ], + "max_tokens": 16000, + "model_types": [ + "chat", + "image2text", + "vision" + ] + }, + { + "name": "generalv3.5", + "alias": [ + "Spark Max" + ], + "max_tokens": 8000, + "model_types": [ + "chat" + ] + }, + { + "name": "ernie-4.0-turbo-8k", + "alias": [ + "ERNIE-4.0-Turbo" + ], + "max_tokens": 8000, + "model_types": [ + "chat" + ] + }, + { + "name": "Baichuan3-Turbo", + "max_tokens": 32000, + "model_types": [ + "chat" + ] + }, + { + "name": "Baichuan3-Turbo-128k", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "Baichuan4", + "max_tokens": 32000, + "model_types": [ + "chat" + ] + }, + { + "name": "runway", + "model_types": [ + "chat" + ] + }, + { + "name": "doc2x", + "model_types": [ + "chat" + ] + }, + { + "name": "glif", + "model_types": [ + "chat" + ] + }, + { + "name": "SenseChat-5", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "SenseChat-Turbo", + "max_tokens": 32000, + "model_types": [ + "chat" + ] + }, + { + "name": "codegeex-4", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "glm-4-airx", + "max_tokens": 8000, + "model_types": [ + "chat" + ] + }, + { + "name": "gpt-4o-mini", + "model_types": [ + "chat" + ], + "alias": [ + "openai/gpt-4o-mini" + ] + }, + { + "name": "gpt-4o-mini-2024-07-18", + "max_tokens": 128000, + "model_types": [ + "chat" + ], + "alias": [ + "openai/gpt-4o-mini-2024-07-18" + ] + }, + { + "name": "llama3.1-405b", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "azure_tts", + "model_types": [ + "tts" + ] + }, + { + "name": "llama3.1-70b", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "llama3.1-8b", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "BAAI/bge-large-zh-v1.5", + "model_types": [ + "embedding" + ] + }, + { + "name": "BAAI/bge-large-en-v1.5", + "model_types": [ + "embedding" + ], + "max_tokens": 512, + "max_dimension": 1024 + }, + { + "name": "mistral-large-2", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "deepl-en", + "max_tokens": 32000, + "model_types": [ + "chat" + ] + }, + { + "name": "deepl-zh", + "max_tokens": 32000, + "model_types": [ + "chat" + ] + }, + { + "name": "deepl-ja", + "max_tokens": 32000, + "model_types": [ + "chat" + ] + }, + { + "name": "step-2-16k", + "alias": [ + "step-2-mini" + ], + "max_tokens": 16000, + "model_types": [ + "chat" + ] + }, + { + "name": "klingai", + "model_types": [ + "chat" + ] + }, + { + "name": "gpt-4-plus", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "exaai", + "model_types": [ + "chat" + ] + }, + { + "name": "flux", + "alias": [ + "ClarityAI/flux", + "deepgram/flux", + "Deepgram Flux" + ], + "model_types": [ + "text-to-image", + "image_generation", + "asr", + "speech2text" + ], + "max_tokens": 448 + }, + { + "name": "cogvideox", + "model_types": [ + "video_generation" + ] + }, + { + "name": "abab6.5s-chat", + "alias": [ + "abab6.5s" + ], + "max_tokens": 245000, + "model_types": [ + "chat" + ] + }, + { + "name": "gpt-4o-2024-08-06", + "max_tokens": 128000, + "model_types": [ + "chat" + ], + "alias": [ + "openai/gpt-4o-2024-08-06" + ] + }, + { + "name": "farui-plus", + "max_tokens": 12000, + "model_types": [ + "chat" + ] + }, + { + "name": "doubao_tts_hd", + "model_types": [ + "tts" + ] + }, + { + "name": "bochaai", + "model_types": [ + "chat" + ] + }, + { + "name": "netease-youdao/bce-reranker-base_v1", + "model_types": [ + "rerank" + ], + "alias": [ + "netease-youdao/bce-reranker-base-v1" + ] + }, + { + "name": "netease-youdao/bce-embedding-base_v1", + "model_types": [ + "embedding" + ] + }, + { + "name": "chatgpt-4o-latest", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "glm-4-long", + "max_tokens": 1000000, + "model_types": [ + "chat" + ] + }, + { + "name": "hunyuan-lite", + "max_tokens": 250000, + "model_types": [ + "chat" + ] + }, + { + "name": "hunyuan-standard", + "max_tokens": 30000, + "model_types": [ + "chat" + ] + }, + { + "name": "hunyuan-standard-256K", + "max_tokens": 250000, + "model_types": [ + "chat" + ] + }, + { + "name": "hunyuan-pro", + "max_tokens": 28000, + "model_types": [ + "chat" + ] + }, + { + "name": "hunyuan-code", + "max_tokens": 4000, + "model_types": [ + "chat" + ] + }, + { + "name": "hunyuan-role", + "max_tokens": 4000, + "model_types": [ + "chat" + ] + }, + { + "name": "hunyuan-functioncall", + "max_tokens": 28000, + "model_types": [ + "chat" + ] + }, + { + "name": "hunyuan-vision", + "max_tokens": 4000, + "model_types": [ + "chat", + "image2text", + "vision" + ] + }, + { + "name": "ideogram", + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "gpt-3.5-sonnet-cursor", + "alias": [ + "claude-3.5-sonnet", + "gpt-3.5-sonnet-20241022-cursor", + "gpt-3.5-sonnet-20240620-cursor", + "gpt-4o-sonnet-cursor" + ], + "max_tokens": 200000, + "model_types": [ + "chat" + ] + }, + { + "name": "glm-4-plus", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "glm-4v-plus", + "max_tokens": 32000, + "model_types": [ + "chat", + "image2text", + "vision" + ] + }, + { + "name": "minimaxi_video-01", + "model_types": [ + "video_generation" + ] + }, + { + "name": "deepl", + "model_types": [ + "chat" + ] + }, + { + "name": "suno-api", + "model_types": [ + "chat" + ] + }, + { + "name": "fish-audio", + "model_types": [ + "chat" + ] + }, + { + "name": "llama3.2-90b", + "max_tokens": 131072, + "model_types": [ + "chat" + ] + }, + { + "name": "llama3.2-11b", + "max_tokens": 131072, + "model_types": [ + "chat" + ] + }, + { + "name": "gpt-4o-2024-05-13", + "max_tokens": 128000, + "model_types": [ + "chat", + "vision", + "image2text" + ], + "alias": [ + "openai/gpt-4o-2024-05-13" + ] + }, + { + "name": "gpt-4o-realtime-preview", + "model_types": [ + "chat" + ] + }, + { + "name": "gpt-4o-realtime-preview-2024-10-01", + "model_types": [ + "chat", + "video_generation" + ] + }, + { + "name": "minimaxi_text2voice", + "model_types": [ + "video_generation" + ] + }, + { + "name": "gpt-4o-audio-preview", + "max_tokens": 128000, + "model_types": [ + "chat", + "image2text", + "vision", + "tts" + ] + }, + { + "name": "gpt-4o-audio-preview-2024-10-01", + "max_tokens": 128000, + "model_types": [ + "chat", + "image2text", + "vision" + ] + }, + { + "name": "dubbingx", + "max_tokens": 32768, + "model_types": [ + "chat" + ] + }, + { + "name": "pika", + "max_tokens": 32768, + "model_types": [ + "chat" + ] + }, + { + "name": "yi-lightning", + "model_types": [ + "chat" + ] + }, + { + "name": "claude-3-5-sonnet-20241022", + "max_tokens": 200000, + "model_types": [ + "chat" + ] + }, + { + "name": "hedra", + "model_types": [ + "chat" + ] + }, + { + "name": "claude-3-5-sonnet-latest", + "max_tokens": 200000, + "model_types": [ + "chat" + ] + }, + { + "name": "recraft-v3", + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "claude-3-5-haiku-20241022", + "max_tokens": 200000, + "model_types": [ + "chat" + ] + }, + { + "name": "gpt-4-turbo-2024-04-09", + "max_tokens": 128000, + "model_types": [ + "chat", + "vision", + "image2text" + ], + "alias": [ + "openai/gpt-4-turbo-2024-04-09" + ] + }, + { + "name": "pixtral-large-2411", + "max_tokens": 128000, + "model_types": [ + "chat", + "image2text", + "vision" + ] + }, + { + "name": "mistral-large-2411", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "pix", + "max_tokens": 32768, + "model_types": [ + "chat" + ] + }, + { + "name": "gpt-4o-2024-11-20", + "max_tokens": 128000, + "model_types": [ + "chat" + ], + "alias": [ + "openai/gpt-4o-2024-11-20" + ] + }, + { + "name": "gpt-4o-plus", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "ernie-4.0-turbo-128k", + "max_tokens": 8000, + "model_types": [ + "chat" + ] + }, + { + "name": "Luma-Photon", + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "Doubao-vision-pro-32k", + "max_tokens": 32000, + "model_types": [ + "chat", + "image2text", + "vision" + ], + "alias": [ + "doubao-vision-pro-32k-241028" + ], + "max_completion_tokens": 4096 + }, + { + "name": "abab7-chat-preview", + "alias": [ + "abab7-preview" + ], + "max_tokens": 245000, + "model_types": [ + "chat" + ] + }, + { + "name": "coder-claude-3-5-sonnet-20240620", + "max_tokens": 200000, + "model_types": [ + "chat" + ] + }, + { + "name": "coder-claude-3-5-sonnet-20241022", + "max_tokens": 200000, + "model_types": [ + "chat" + ] + }, + { + "name": "minimaxi_music", + "model_types": [ + "chat" + ] + }, + { + "name": "llama3.3-70b", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "runway_exapnd", + "model_types": [ + "chat" + ] + }, + { + "name": "o1-plus", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "bge-large-zh-v1.5", + "model_types": [ + "embedding" + ] + }, + { + "name": "bge-large-en-v1.5", + "model_types": [ + "embedding" + ] + }, + { + "name": "tripo3d", + "model_types": [ + "chat" + ] + }, + { + "name": "vidu", + "model_types": [ + "chat" + ] + }, + { + "name": "Doubao-Vision-Lite-32k", + "max_tokens": 32000, + "model_types": [ + "chat", + "image2text", + "vision" + ], + "alias": [ + "doubao-vision-lite-32k-241015" + ], + "max_completion_tokens": 4096 + }, + { + "name": "o1", + "max_tokens": 200000, + "model_types": [ + "chat" + ], + "alias": [ + "o1-all" + ] + }, + { + "name": "general_v2.1_L", + "model_types": [ + "chat" + ] + }, + { + "name": "general_v2.0_L", + "model_types": [ + "chat" + ] + }, + { + "name": "general_v2.0", + "model_types": [ + "chat" + ] + }, + { + "name": "general_v2.0_L_seededit", + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "general_v2.0_L_character", + "model_types": [ + "chat" + ] + }, + { + "name": "o1-2024-12-17", + "max_tokens": 200000, + "model_types": [ + "chat" + ] + }, + { + "name": "gpt-4o-realtime-preview-2024-12-17", + "model_types": [ + "chat" + ] + }, + { + "name": "gpt-4o-mini-realtime-preview-2024-12-17", + "model_types": [ + "chat" + ] + }, + { + "name": "gpt-4o-mini-realtime-preview", + "model_types": [ + "chat" + ] + }, + { + "name": "doubao", + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "glm-zero-preview", + "max_tokens": 16000, + "model_types": [ + "chat" + ] + }, + { + "name": "kolors-virtual-try-on-v1", + "model_types": [ + "chat" + ] + }, + { + "name": "kolors-virtual-try-on-v1-5", + "model_types": [ + "chat" + ] + }, + { + "name": "text-moderation-latest", + "model_types": [ + "chat" + ] + }, + { + "name": "Qwen/Qwen2.5-72B-Instruct-128K", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "internlm/internlm2_5-7b-chat", + "max_tokens": 32000, + "model_types": [ + "chat" + ] + }, + { + "name": "THUDM/glm-4-9b-chat", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "Pro/Qwen/Qwen2.5-Coder-7B-Instruct", + "max_tokens": 32000, + "model_types": [ + "chat" + ] + }, + { + "name": "Pro/Qwen/Qwen2.5-7B-Instruct", + "max_tokens": 32000, + "model_types": [ + "chat" + ] + }, + { + "name": "Pro/Qwen/Qwen2-7B-Instruct", + "max_tokens": 32000, + "model_types": [ + "chat" + ] + }, + { + "name": "Pro/THUDM/glm-4-9b-chat", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "moonshot-v1-8k-vision-preview", + "max_tokens": 8000, + "model_types": [ + "chat", + "image2text", + "vision" + ] + }, + { + "name": "moonshot-v1-32k-vision-preview", + "max_tokens": 32000, + "model_types": [ + "chat", + "image2text", + "vision" + ] + }, + { + "name": "moonshot-v1-128k-vision-preview", + "max_tokens": 128000, + "model_types": [ + "chat", + "image2text", + "vision" + ] + }, + { + "name": "claude-3-5-haiku-latest", + "max_tokens": 200000, + "model_types": [ + "chat" + ] + }, + { + "name": "claude-3-5-haiku", + "max_tokens": 200000, + "model_types": [ + "chat" + ] + }, + { + "name": "step-2-16k-exp", + "max_tokens": 16000, + "model_types": [ + "chat" + ] + }, + { + "name": "memobase", + "model_types": [ + "chat" + ] + }, + { + "name": "deepseek-reasoner", + "alias": [ + "deepseek/deepseek-reasoner" + ], + "max_tokens": 128000, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "Doubao-1.5-vision-pro-32k", + "max_tokens": 32000, + "model_types": [ + "chat", + "image2text", + "vision" + ] + }, + { + "name": "Doubao-1.5-pro-32k", + "max_tokens": 32000, + "model_types": [ + "chat" + ] + }, + { + "name": "Doubao-1.5-lite-32k", + "max_tokens": 32000, + "model_types": [ + "chat" + ] + }, + { + "name": "Doubao-1.5-pro-256k", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "sonar-pro", + "max_tokens": 200000, + "model_types": [ + "chat" + ] + }, + { + "name": "sonar", + "max_tokens": 200000, + "model_types": [ + "chat" + ], + "alias": [ + "perplexity/sonar" + ] + }, + { + "name": "step-1o-vision-32k", + "max_tokens": 32000, + "model_types": [ + "chat", + "image2text", + "vision" + ] + }, + { + "name": "sonar-reasoning", + "max_tokens": 127000, + "model_types": [ + "chat" + ] + }, + { + "name": "o3-mini", + "max_tokens": 128000, + "model_types": [ + "chat" + ], + "alias": [ + "o3-mini-all" + ] + }, + { + "name": "o3-mini-2025-01-31", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "deepseek-r1-huoshan", + "max_tokens": 64000, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "deepseek-v3-huoshan", + "max_tokens": 64000, + "model_types": [ + "chat" + ] + }, + { + "name": "deepseek-r1-baidu", + "max_tokens": 64000, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "deepseek-v3-baidu", + "max_tokens": 64000, + "model_types": [ + "chat" + ] + }, + { + "name": "minimaxi_video-01-live2d", + "model_types": [ + "video_generation" + ] + }, + { + "name": "minimaxi_S2V-01", + "model_types": [ + "chat" + ] + }, + { + "name": "deepseek-r1-aliyun", + "max_tokens": 64000, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "deepseek-v3-aliyun", + "max_tokens": 64000, + "model_types": [ + "chat" + ] + }, + { + "name": "zzkj", + "alias": [ + "WiseDiag-Z1" + ], + "max_tokens": 32000, + "model_types": [ + "chat" + ] + }, + { + "name": "zzkj-think", + "alias": [ + "WiseDiag-Z1 Think" + ], + "max_tokens": 32000, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "zzkj-lite", + "alias": [ + "WiseDiag-Z1 Lite" + ], + "max_tokens": 32000, + "model_types": [ + "chat" + ] + }, + { + "name": "zzkj-genetics", + "alias": [ + "WiseDiag-Genetics" + ], + "max_tokens": 32000, + "model_types": [ + "chat" + ] + }, + { + "name": "sonar-reasoning-pro", + "max_tokens": 127000, + "model_types": [ + "chat" + ] + }, + { + "name": "grok-4.3", + "max_tokens": 1000000, + "model_types": [ + "chat", + "vision", + "image2text" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + }, + "alias": [ + "xai/grok-4.3", + "grok-4.3-latest", + "grok-latest", + "grok-3", + "grok-3-latest", + "grok-3-beta", + "grok-3-fast", + "grok-3-fast-latest", + "grok-3-fast-beta", + "grok-3-mini", + "grok-3-mini-latest", + "grok-3-mini-beta", + "grok-3-mini-fast", + "grok-3-mini-fast-latest", + "grok-3-mini-fast-beta", + "grok-3-mini-high", + "grok-3-mini-high-beta", + "grok-3-mini-fast-high", + "grok-3-mini-fast-high-beta", + "grok-4-0709", + "grok-4", + "grok-4-latest", + "grok-4-fast-reasoning", + "grok-4-fast", + "grok-4-fast-reasoning-latest", + "grok-4-fast-non-reasoning", + "grok-4-fast-non-reasoning-latest", + "grok-4-1-fast-reasoning", + "grok-4-1-fast", + "grok-4-1-fast-reasoning-latest", + "grok-4-1-fast-non-reasoning", + "grok-4-1-fast-non-reasoning-latest", + "grok-4.1-fast", + "grok-4.2", + "grok-4.2-fast" + ] + }, + { + "name": "claude-3-7-sonnet-20250219", + "max_tokens": 200000, + "model_types": [ + "chat" + ] + }, + { + "name": "claude-3-7-sonnet-latest", + "max_tokens": 200000, + "model_types": [ + "chat", + "image2text", + "vision", + "ocr" + ], + "alias": [ + "anthropic/claude-3-7-sonnet-latest" + ] + }, + { + "name": "claude-3-7-sonnet-20250219-thinking", + "max_tokens": 200000, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "kimi-latest", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "sonar-deep-research", + "max_tokens": 127000, + "model_types": [ + "chat" + ] + }, + { + "name": "hunyuan-turbos-20250226", + "max_tokens": 24000, + "model_types": [ + "chat" + ] + }, + { + "name": "gpt-3.7-sonnet-20250219-cursor", + "alias": [ + "claude-3.7-sonnet" + ], + "max_tokens": 200000, + "model_types": [ + "chat" + ] + }, + { + "name": "qwq-plus", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "minimaxi-image-01", + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "cogview-4", + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "cogview-4-250304", + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "mistral-small-latest", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "mistral-large-latest", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "pixtral-large-latest", + "max_tokens": 128000, + "model_types": [ + "chat", + "image2text", + "vision" + ] + }, + { + "name": "mistral-small-2503", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "doubao-seededit", + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "hunyuan-t1-latest", + "max_tokens": 64000, + "model_types": [ + "chat" + ] + }, + { + "name": "hunyuan-t1-20250321", + "max_tokens": 64000, + "model_types": [ + "chat" + ] + }, + { + "name": "ernie-4.5-8k-preview", + "max_tokens": 8000, + "model_types": [ + "chat" + ] + }, + { + "name": "qvq-max", + "max_tokens": 128000, + "model_types": [ + "chat", + "vision", + "image2text" + ] + }, + { + "name": "baidubce-irag-1.0", + "model_types": [ + "chat" + ] + }, + { + "name": "gpt-4o-transcribe", + "max_tokens": 16000, + "model_types": [ + "chat", + "asr", + "speech2text" + ] + }, + { + "name": "gpt-4o-mini-transcribe", + "max_tokens": 16000, + "model_types": [ + "chat", + "asr", + "speech2text" + ] + }, + { + "name": "gpt-4o-mini-tts", + "model_types": [ + "tts", + "chat" + ], + "alias": [ + "openai/gpt-4o-mini-tts" + ] + }, + { + "name": "gpt-4o-image-generation", + "max_tokens": 128000, + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "step-r1-v-mini", + "max_tokens": 100000, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "high_aes_general_v30l_zt2i", + "model_types": [ + "chat" + ] + }, + { + "name": "general_v3.0", + "model_types": [ + "chat" + ] + }, + { + "name": "glm-z1-air", + "max_tokens": 32000, + "model_types": [ + "chat" + ] + }, + { + "name": "glm-z1-airx", + "max_tokens": 32000, + "model_types": [ + "chat" + ] + }, + { + "name": "glm-z1-flash", + "max_tokens": 32000, + "model_types": [ + "chat" + ] + }, + { + "name": "glm-4-air-250414", + "max_tokens": 32000, + "model_types": [ + "chat" + ] + }, + { + "name": "glm-4-flash-250414", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "gpt-4.1", + "max_tokens": 1000000, + "model_types": [ + "chat" + ], + "alias": [ + "openai/gpt-4.1" + ] + }, + { + "name": "gpt-4.1-2025-04-14", + "max_tokens": 1000000, + "model_types": [ + "chat" + ], + "alias": [ + "openai/gpt-4.1-2025-04-14" + ] + }, + { + "name": "gpt-4.1-mini", + "max_tokens": 1000000, + "model_types": [ + "chat" + ], + "alias": [ + "openai/gpt-4.1-mini" + ] + }, + { + "name": "gpt-4.1-mini-2025-04-14", + "max_tokens": 1000000, + "model_types": [ + "chat" + ], + "alias": [ + "openai/gpt-4.1-mini-2025-04-14" + ] + }, + { + "name": "gpt-4.1-nano", + "max_tokens": 1000000, + "model_types": [ + "chat" + ], + "alias": [ + "openai/gpt-4.1-nano" + ] + }, + { + "name": "gpt-4.1-nano-2025-04-14", + "max_tokens": 1000000, + "model_types": [ + "chat" + ], + "alias": [ + "openai/gpt-4.1-nano-2025-04-14" + ] + }, + { + "name": "THUDM/GLM-Z1-32B-0414", + "max_tokens": 32000, + "model_types": [ + "chat" + ] + }, + { + "name": "THUDM/GLM-Z1-Rumination-32B-0414", + "max_tokens": 32000, + "model_types": [ + "chat" + ] + }, + { + "name": "THUDM/GLM-4-9B-0414", + "max_tokens": 32000, + "model_types": [ + "chat" + ] + }, + { + "name": "o3", + "max_tokens": 200000, + "model_types": [ + "chat", + "vision", + "image2text" + ], + "alias": [ + "o3-all" + ] + }, + { + "name": "o4-mini", + "max_tokens": 200000, + "model_types": [ + "chat", + "vision", + "image2text" + ], + "alias": [ + "o4-mini-all" + ] + }, + { + "name": "o4-mini-2025-04-16", + "max_tokens": 200000, + "model_types": [ + "chat", + "vision", + "image2text" + ] + }, + { + "name": "o3-2025-04-16", + "max_tokens": 200000, + "model_types": [ + "chat", + "vision", + "image2text" + ] + }, + { + "name": "doubao-1-5-thinking-pro-250415", + "alias": [ + "Doubao-1.5-Thinking-Pro", + "doubao-1-5-thinking-pro", + "doubao-1-5-thinking-pro-m-250415", + "doubao-1-5-thinking-pro-m-250428" + ], + "max_tokens": 96000, + "model_types": [ + "chat", + "vision", + "image2text" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + }, + "max_completion_tokens": 16384 + }, + { + "name": "doubao-1-5-thinking-pro-vision-250415", + "alias": [ + "Doubao-1.5-Thinking-Pro-Vision" + ], + "max_tokens": 96000, + "model_types": [ + "chat", + "image2text", + "vision" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "firecrawl", + "model_types": [ + "chat" + ] + }, + { + "name": "gpt-image-1", + "max_tokens": 32000, + "model_types": [ + "text-to-image", + "image_generation", + "image", + "image_edit", + "chat" + ], + "alias": [ + "gpt-image-1-all", + "openai/gpt-image-1" + ] + }, + { + "name": "gpt-4o-search-preview", + "max_tokens": 128000, + "model_types": [ + "chat" + ], + "alias": [ + "openai/gpt-4o-search-preview" + ] + }, + { + "name": "gpt-4o-mini-search-preview", + "max_tokens": 128000, + "model_types": [ + "chat" + ], + "alias": [ + "openai/gpt-4o-mini-search-preview" + ] + }, + { + "name": "doubao-1.5-ui-tars-250328", + "alias": [ + "doubao-1-5-ui-tars", + "doubao-1-5-ui-tars-250428" + ], + "max_tokens": 32000, + "model_types": [ + "chat", + "vision", + "image2text" + ], + "max_completion_tokens": 16384, + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "llama-4-scout", + "alias": [ + "meta-llama/llama-4-scout" + ], + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "llama-4-maverick", + "alias": [ + "meta-llama/llama-4-maverick" + ], + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "mistral-medium-latest", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "Phi-4-mini-reasoning", + "max_tokens": 32000, + "model_types": [ + "chat" + ] + }, + { + "name": "Phi-4-reasoning", + "max_tokens": 32000, + "model_types": [ + "chat" + ] + }, + { + "name": "SenseNova-V6-Pro", + "max_tokens": 32000, + "model_types": [ + "chat" + ] + }, + { + "name": "SenseNova-V6-Turbo", + "max_tokens": 32000, + "model_types": [ + "chat" + ] + }, + { + "name": "SenseNova-V6-Reasoner", + "max_tokens": 32000, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "ernie-x1-turbo-32k", + "max_tokens": 32000, + "model_types": [ + "chat" + ] + }, + { + "name": "ernie-4.5-turbo-vl-32k", + "max_tokens": 8000, + "model_types": [ + "chat", + "image2text", + "vision" + ] + }, + { + "name": "ernie-4.5-turbo-128k", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "higgsfield", + "model_types": [ + "chat" + ] + }, + { + "name": "doubao-1-5-thinking-vision-pro-250428", + "alias": [ + "Doubao-1.5-Thinking-Vision-Pro-0428", + "doubao-1-5-thinking-vision-pro" + ], + "max_tokens": 128000, + "model_types": [ + "chat", + "image2text", + "vision" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + }, + "max_completion_tokens": 16384 + }, + { + "name": "MAI-DS-R1", + "max_tokens": 64000, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "higgsfield-shortads", + "model_types": [ + "chat" + ] + }, + { + "name": "devstral-small-2505", + "max_tokens": 128000, + "model_types": [ + "chat" + ], + "alias": [ + "mistralai/Devstral-Small-2505", + "Devstral Small 2505" + ] + }, + { + "name": "claude-sonnet-4-20250514", + "max_tokens": 200000, + "model_types": [ + "chat" + ] + }, + { + "name": "claude-opus-4-20250514", + "max_tokens": 200000, + "model_types": [ + "chat" + ] + }, + { + "name": "claude-sonnet-4-20250514-thinking", + "max_tokens": 200000, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "claude-opus-4-20250514-thinking", + "max_tokens": 200000, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "kling-v1-6", + "model_types": [ + "chat" + ] + }, + { + "name": "deepseek-r1-huoshan-0528", + "max_tokens": 128000, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "hedra-app", + "model_types": [ + "chat" + ] + }, + { + "name": "doubao-seedance-1-0-lite-t2v-250428", + "model_types": [ + "video_generation" + ], + "alias": [ + "doubao-seedance-1-0-lite-t2v" + ] + }, + { + "name": "doubao-seedance-1-0-lite-i2v-250428", + "model_types": [ + "video_generation" + ], + "alias": [ + "doubao-seedance-1-0-lite-i2v" + ] + }, + { + "name": "kling-v1", + "model_types": [ + "chat" + ] + }, + { + "name": "kling-v1-5", + "model_types": [ + "chat" + ] + }, + { + "name": "kling-v2-master", + "model_types": [ + "chat" + ], + "alias": [ + "kling/kling-v2-master" + ] + }, + { + "name": "deepseek/deepseek-v3-0324", + "max_tokens": 128000, + "model_types": [ + "chat" + ], + "alias": [ + "DeepSeek V3 0324" + ], + "max_completion_tokens": 65536 + }, + { + "name": "deepseek/deepseek-prover-v2-671b", + "max_tokens": 160000, + "model_types": [ + "chat" + ], + "alias": [ + "Deepseek Prover V2 671B" + ], + "max_completion_tokens": 160000 + }, + { + "name": "deepseek/deepseek-r1-turbo", + "max_tokens": 64000, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + }, + "alias": [ + "DeepSeek R1 (Turbo)" + ], + "max_completion_tokens": 16000 + }, + { + "name": "deepseek/deepseek-v3-turbo", + "max_tokens": 64000, + "model_types": [ + "chat" + ], + "alias": [ + "deepseek-v3-turbo", + "DeepSeek V3 (Turbo)" + ], + "max_completion_tokens": 16000 + }, + { + "name": "deepseek/deepseek-v3/community", + "max_tokens": 64000, + "model_types": [ + "chat" + ], + "alias": [ + "community" + ], + "max_completion_tokens": 8000 + }, + { + "name": "deepseek/deepseek-r1/community", + "max_tokens": 64000, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + }, + "max_completion_tokens": 8000 + }, + { + "name": "deepseek/deepseek-r1-distill-llama-8b", + "max_tokens": 32000, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "o3-pro", + "max_tokens": 200000, + "model_types": [ + "chat", + "vision", + "image2text" + ], + "alias": [ + "o3-pro-all" + ] + }, + { + "name": "o3-pro-2025-06-10", + "max_tokens": 200000, + "model_types": [ + "chat" + ] + }, + { + "name": "doubao-seedance-1-0-pro-250528", + "model_types": [ + "video_generation" + ], + "alias": [ + "doubao-seedance-1-0-pro" + ] + }, + { + "name": "doubao-seed-1-6-thinking-250615", + "max_tokens": 256000, + "model_types": [ + "chat", + "vision", + "image2text" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + }, + "alias": [ + "doubao-seed-1-6-thinking" + ], + "max_completion_tokens": 16384 + }, + { + "name": "doubao-seed-1-6-250615", + "max_tokens": 256000, + "model_types": [ + "chat", + "vision", + "image2text" + ], + "alias": [ + "doubao-seed-1-6", + "doubao-seed-1-6-251015" + ], + "max_completion_tokens": 32768, + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "doubao-seed-1-6-flash-250615", + "max_tokens": 256000, + "model_types": [ + "chat", + "vision", + "image2text" + ], + "alias": [ + "doubao-seed-1-6-flash", + "doubao-seed-1-6-flash-250828" + ], + "max_completion_tokens": 32768, + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "doubao-seedream-3-0-t2i-250415", + "model_types": [ + "text-to-image", + "image_generation" + ], + "alias": [ + "doubao-seedream-3-0-t2i" + ] + }, + { + "name": "codex-mini-latest", + "max_tokens": 200000, + "model_types": [ + "chat" + ] + }, + { + "name": "MiniMax-M1", + "max_tokens": 1000000, + "model_types": [ + "chat" + ] + }, + { + "name": "Tongyi-Zhiwen/QwenLong-L1-32B", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "Pro/Qwen/Qwen2.5-VL-7B-Instruct", + "max_tokens": 32000, + "model_types": [ + "chat", + "image2text", + "vision" + ] + }, + { + "name": "T2V-01", + "model_types": [ + "video_generation" + ] + }, + { + "name": "T2V-01-Director", + "model_types": [ + "video_generation" + ] + }, + { + "name": "I2V-01", + "model_types": [ + "video_generation" + ] + }, + { + "name": "I2V-01-live", + "model_types": [ + "video_generation" + ] + }, + { + "name": "I2V-01-Director", + "model_types": [ + "video_generation" + ] + }, + { + "name": "chanjing-video", + "model_types": [ + "video_generation" + ] + }, + { + "name": "chanjing-cicada1.0", + "model_types": [ + "chat" + ] + }, + { + "name": "chanjing-cicada3.0", + "model_types": [ + "chat" + ] + }, + { + "name": "v0-1.5-md", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "v0-1.5-lg", + "max_tokens": 512000, + "model_types": [ + "chat" + ] + }, + { + "name": "v0-1.0-md", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "kling-v2-1", + "model_types": [ + "chat" + ] + }, + { + "name": "kling-v2-1-master", + "model_types": [ + "chat" + ], + "alias": [ + "kling/kling-v2-1-master" + ] + }, + { + "name": "omni-moderation-latest", + "model_types": [ + "chat" + ] + }, + { + "name": "gpt-4-sonnet-20250514-cursor", + "max_tokens": 200000, + "model_types": [ + "chat" + ] + }, + { + "name": "gpt-4-opus-4-20250514-cursor", + "max_tokens": 200000, + "model_types": [ + "chat" + ] + }, + { + "name": "gpt-4-opus-20250514-cursor", + "max_tokens": 200000, + "model_types": [ + "chat" + ] + }, + { + "name": "o3-deep-research", + "max_tokens": 200000, + "model_types": [ + "chat" + ] + }, + { + "name": "o3-deep-research-2025-06-26", + "max_tokens": 200000, + "model_types": [ + "chat" + ] + }, + { + "name": "o4-mini-deep-research", + "max_tokens": 200000, + "model_types": [ + "chat" + ] + }, + { + "name": "o4-mini-deep-research-2025-06-26", + "max_tokens": 200000, + "model_types": [ + "chat" + ] + }, + { + "name": "higgsfield-soul", + "model_types": [ + "chat" + ] + }, + { + "name": "baidu/ERNIE-4.5-300B-A47B", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "doubao-1.5-vision-pro-250328", + "max_tokens": 128000, + "model_types": [ + "chat", + "image2text", + "vision" + ], + "alias": [ + "doubao-1-5-vision-pro" + ], + "max_completion_tokens": 16384 + }, + { + "name": "doubao-1.5-vision-lite-250315", + "max_tokens": 128000, + "model_types": [ + "chat", + "image2text", + "vision" + ], + "alias": [ + "doubao-1-5-vision-lite" + ], + "max_completion_tokens": 16384 + }, + { + "name": "seededit_v3.0", + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "gpt-4o-audio-preview-2025-06-03", + "max_tokens": 128000, + "model_types": [ + "chat", + "image2text", + "vision" + ] + }, + { + "name": "gpt-4o-audio-preview-2024-12-17", + "max_tokens": 128000, + "model_types": [ + "chat", + "image2text", + "vision", + "tts" + ] + }, + { + "name": "glm-4.1v-thinking-flash", + "max_tokens": 64000, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "glm-4.1v-thinking-flashx", + "max_tokens": 64000, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "sophnet/DeepSeek-R1-0528", + "max_tokens": 128000, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "sophnet/DeepSeek-R1", + "max_tokens": 64000, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "sophnet/DeepSeek-V3-Fast", + "max_tokens": 32000, + "model_types": [ + "chat" + ] + }, + { + "name": "sophnet/DeepSeek-v3", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "sophnet/DeepSeek-Prover-V2", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "sophnet/Qwen3-14B", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "sophnet/Qwen3-235B-A22B", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "sophnet/QwQ-32B", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "sophnet/Qwen2.5-72B-Instruct", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "sophnet/Qwen2.5-32B-Instruct", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "sophnet/Qwen2.5-7B-Instruct", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "sophnet/DeepSeek-R1-Distill-Llama-70B", + "max_tokens": 32000, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "sophnet/DeepSeek-R1-Distill-Qwen-32B", + "max_tokens": 32000, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "sophnet/DeepSeek-R1-Distill-Qwen-7B", + "max_tokens": 32000, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "sophnet/Qwen2.5-VL-72B-Instruct", + "max_tokens": 128000, + "model_types": [ + "chat", + "image2text", + "vision" + ] + }, + { + "name": "sophnet/Qwen2.5-VL-32B-Instruct", + "max_tokens": 128000, + "model_types": [ + "chat", + "image2text", + "vision" + ] + }, + { + "name": "sophnet/Qwen2.5-VL-7B-Instruct", + "max_tokens": 128000, + "model_types": [ + "chat", + "image2text", + "vision" + ] + }, + { + "name": "sophnet/Qwen2-VL-72B-Instruct", + "max_tokens": 32000, + "model_types": [ + "chat", + "image2text", + "vision" + ] + }, + { + "name": "sophnet/Qwen2-VL-7B-Instruct", + "max_tokens": 32000, + "model_types": [ + "chat", + "image2text", + "vision" + ] + }, + { + "name": "kimi-k2-0711-preview", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "devstral-small-2507", + "max_tokens": 128000, + "model_types": [ + "chat" + ], + "alias": [ + "mistralai/Devstral-Small-2507" + ] + }, + { + "name": "devstral-medium-2507", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "sophnet/Kimi-K2", + "alias": [ + "sophnet/Kimi-K2Kimi-K2" + ], + "max_tokens": 64000, + "model_types": [ + "chat" + ] + }, + { + "name": "higgsfield-character", + "model_types": [ + "chat" + ] + }, + { + "name": "doubao-seededit-3-0-i2i-250628", + "model_types": [ + "text-to-image", + "image_generation" + ], + "alias": [ + "doubao-seededit-3-0-i2i" + ] + }, + { + "name": "glm-4.5-x", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "glm-4.5-airx", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "glm-4.5-flash", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "sf/zai-org/GLM-4.5-Air", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "step-3", + "max_tokens": 64000, + "model_types": [ + "chat" + ] + }, + { + "name": "playai-tts", + "model_types": [ + "tts" + ] + }, + { + "name": "kimi-k2-turbo-preview", + "max_tokens": 256000, + "model_types": [ + "chat" + ] + }, + { + "name": "runway-aleph", + "model_types": [ + "chat" + ] + }, + { + "name": "sophnet/Qwen3-Coder", + "max_tokens": 1000000, + "model_types": [ + "chat" + ] + }, + { + "name": "sophnet/Qwen3-32B", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "sophnet/Qwen3-235B-A22B-Instruct-2507", + "max_tokens": 262000, + "model_types": [ + "chat" + ] + }, + { + "name": "baidu/ernie-4.5-vl-424b-a47b", + "max_tokens": 123000, + "model_types": [ + "chat", + "image2text", + "vision" + ], + "alias": [ + "ernie-4.5-vl-424b-a47b", + "ERNIE 4.5 VL 424B A47B" + ], + "max_completion_tokens": 16000, + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "baidu/ernie-4.5-0.3b", + "max_tokens": 120000, + "model_types": [ + "chat" + ], + "alias": [ + "ernie-4.5-0.3b" + ], + "max_completion_tokens": 8000 + }, + { + "name": "baidu/ernie-4.5-21B-a3b", + "max_tokens": 120000, + "model_types": [ + "chat" + ], + "alias": [ + "ernie-4.5-21B-a3b", + "ERNIE 4.5 21B A3B" + ], + "max_completion_tokens": 8000 + }, + { + "name": "THUDM/GLM-4.1V-9B-Thinking", + "max_tokens": 64000, + "model_types": [ + "chat", + "vision", + "image2text" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + }, + "max_completion_tokens": 32000 + }, + { + "name": "claude-opus-4-1-20250805", + "max_tokens": 200000, + "model_types": [ + "chat" + ], + "alias": [ + "anthropic/claude-opus-4-1-20250805" + ] + }, + { + "name": "claude-opus-4-1-20250805-thinking", + "max_tokens": 200000, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "cc-sonnet-4-20250514", + "max_tokens": 200000, + "model_types": [ + "chat" + ] + }, + { + "name": "gpt-5-2025-08-07", + "max_tokens": 400000, + "model_types": [ + "chat" + ], + "alias": [ + "openai/gpt-5-2025-08-07" + ] + }, + { + "name": "gpt-5-mini", + "max_tokens": 400000, + "model_types": [ + "chat", + "vision", + "image2text" + ], + "alias": [ + "openai/gpt-5-mini" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "gpt-5-mini-2025-08-07", + "max_tokens": 400000, + "model_types": [ + "chat" + ], + "alias": [ + "openai/gpt-5-mini-2025-08-07" + ] + }, + { + "name": "gpt-5-nano", + "max_tokens": 400000, + "model_types": [ + "chat", + "vision", + "image2text" + ], + "alias": [ + "openai/gpt-5-nano" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "gpt-5-nano-2025-08-07", + "max_tokens": 400000, + "model_types": [ + "chat" + ], + "alias": [ + "openai/gpt-5-nano-2025-08-07" + ] + }, + { + "name": "gpt-5-chat-latest", + "max_tokens": 400000, + "model_types": [ + "chat" + ], + "alias": [ + "openai/gpt-5-chat-latest" + ] + }, + { + "name": "gpt-5-thinking", + "max_tokens": 400000, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + }, + "alias": [ + "gpt-5-thinking-all" + ] + }, + { + "name": "speech-02-hd", + "model_types": [ + "chat", + "tts" + ] + }, + { + "name": "speech-01-hd", + "model_types": [ + "chat" + ] + }, + { + "name": "speech-02-turbo", + "model_types": [ + "chat", + "tts" + ] + }, + { + "name": "speech-01-turbo", + "model_types": [ + "chat" + ] + }, + { + "name": "speech-01-turbo-240228", + "model_types": [ + "chat" + ] + }, + { + "name": "speech-2.5-turbo-preview", + "model_types": [ + "chat" + ] + }, + { + "name": "speech-2.5-hd-preview", + "model_types": [ + "chat" + ] + }, + { + "name": "SenseNova-V6-5-Turbo", + "max_tokens": 32000, + "model_types": [ + "chat" + ] + }, + { + "name": "SenseNova-V6-5-Pro", + "max_tokens": 32000, + "model_types": [ + "chat" + ] + }, + { + "name": "doubao-seed-1-6-flash-250715", + "max_tokens": 256000, + "model_types": [ + "chat", + "vision", + "image2text" + ], + "max_completion_tokens": 32768, + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "doubao-seed-1-6-thinking-250715", + "max_tokens": 256000, + "model_types": [ + "chat", + "vision", + "image2text" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + }, + "max_completion_tokens": 32768 + }, + { + "name": "jina-deepsearch-v1", + "model_types": [ + "chat" + ] + }, + { + "name": "kimi-k2-250711", + "max_tokens": 128000, + "model_types": [ + "chat" + ], + "max_completion_tokens": 32768 + }, + { + "name": "Baichuan-M2", + "max_tokens": 32000, + "model_types": [ + "chat" + ] + }, + { + "name": "Baichuan4-Air", + "max_tokens": 32000, + "model_types": [ + "chat" + ] + }, + { + "name": "Baichuan4-Turbo", + "max_tokens": 32000, + "model_types": [ + "chat" + ] + }, + { + "name": "hunyuan-turbos-20250716", + "max_tokens": 32000, + "model_types": [ + "chat" + ] + }, + { + "name": "hunyuan-t1-20250711", + "max_tokens": 28000, + "model_types": [ + "chat" + ] + }, + { + "name": "slides_glm_agent", + "model_types": [ + "chat" + ] + }, + { + "name": "deepcogito/cogito-v2-preview-deepseek-671b", + "max_tokens": 64000, + "model_types": [ + "chat" + ] + }, + { + "name": "deepcogito/cogito-v2-preview-llama-405B", + "max_tokens": 64000, + "model_types": [ + "chat" + ] + }, + { + "name": "deepcogito/cogito-v2-preview-llama-70B", + "max_tokens": 64000, + "model_types": [ + "chat" + ] + }, + { + "name": "u1-pro", + "max_tokens": 32000, + "model_types": [ + "chat" + ] + }, + { + "name": "u1", + "max_tokens": 32000, + "model_types": [ + "chat" + ] + }, + { + "name": "deepseek-v3.1-huoshan", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "deepseek-v3.1-thinking", + "max_tokens": 128000, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "deepseek/deepseek-v3.1", + "max_tokens": 163840, + "model_types": [ + "chat" + ], + "alias": [ + "DeepSeek V3.1" + ], + "max_completion_tokens": 32768, + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "cc-opus-4-1-20250805", + "max_tokens": 200000, + "model_types": [ + "chat" + ] + }, + { + "name": "cc-3-5-haiku-20241022", + "max_tokens": 200000, + "model_types": [ + "chat" + ] + }, + { + "name": "grok-build-0.1", + "max_tokens": 256000, + "model_types": [ + "chat", + "vision", + "image2text" + ], + "alias": [ + "xai/grok-build-0.1", + "grok-code-fast-1", + "grok-code-fast", + "grok-code-fast-1-0825" + ] + }, + { + "name": "gpt-realtime", + "max_tokens": 32000, + "model_types": [ + "chat" + ] + }, + { + "name": "gpt-realtime-2025-08-28", + "max_tokens": 32000, + "model_types": [ + "chat", + "video_generation" + ] + }, + { + "name": "dop-lite", + "model_types": [ + "chat" + ] + }, + { + "name": "dop-preview", + "model_types": [ + "chat" + ] + }, + { + "name": "dop-turbo", + "model_types": [ + "chat" + ] + }, + { + "name": "higgsfield-api-soul", + "model_types": [ + "chat" + ] + }, + { + "name": "higgsfield-api-speak", + "model_types": [ + "chat" + ] + }, + { + "name": "kimi-k2-0905-preview", + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "ByteDance-Seed/Seed-OSS-36B-Instruct", + "max_tokens": 256000, + "model_types": [ + "chat" + ] + }, + { + "name": "higgsfield-apps", + "model_types": [ + "chat" + ] + }, + { + "name": "Pro/moonshotai/Kimi-K2-Instruct-0905", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "sophnet/DeepSeek-V3.1-Fast", + "max_tokens": 163000, + "model_types": [ + "chat" + ] + }, + { + "name": "sophnet/DeepSeek-V3.1", + "max_tokens": 163000, + "model_types": [ + "chat" + ] + }, + { + "name": "sophnet/Qwen3-30B-A3B-Instruct-2507", + "max_tokens": 256000, + "model_types": [ + "chat" + ] + }, + { + "name": "sophnet/Seed-OSS-36B-Instruct", + "max_tokens": 512000, + "model_types": [ + "chat" + ] + }, + { + "name": "sophnet/LongCat-Flash-Chat", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "sophnet/Kimi-K2-0905", + "max_tokens": 256000, + "model_types": [ + "chat" + ] + }, + { + "name": "sophnet/Qwen3-30B-A3B-Thinking-2507", + "max_tokens": 256000, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "doubao-seedream-4-0-250828", + "model_types": [ + "text-to-image", + "image_generation", + "image", + "image_edit" + ], + "alias": [ + "doubao-seedream-4-0" + ] + }, + { + "name": "inclusionAI/Ling-mini-2.0", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "sf/zai-org/GLM-4.5V", + "max_tokens": 64000, + "model_types": [ + "chat" + ] + }, + { + "name": "gpt-5-codex-low", + "max_tokens": 400000, + "model_types": [ + "chat" + ] + }, + { + "name": "gpt-5-codex-medium", + "max_tokens": 400000, + "model_types": [ + "chat" + ] + }, + { + "name": "gpt-5-codex-high", + "max_tokens": 400000, + "model_types": [ + "chat" + ] + }, + { + "name": "sophnet/Qwen3-Next-80B-A3B-Instruct", + "max_tokens": 256000, + "model_types": [ + "chat" + ] + }, + { + "name": "sophnet/Qwen3-Next-80B-A3B-Thinking", + "max_tokens": 256000, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "sophnet2", + "alias": [ + "sophnet-img" + ], + "model_types": [ + "chat" + ] + }, + { + "name": "sophnet/GLM-4.5V", + "max_tokens": 66000, + "model_types": [ + "chat" + ] + }, + { + "name": "sophnet/Qwen3-VL-235B-A22B-Thinking", + "max_tokens": 128000, + "model_types": [ + "chat", + "image2text", + "vision" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "sophnet/Qwen3-VL-235B-A22B-Instruct", + "max_tokens": 128000, + "model_types": [ + "chat", + "image2text", + "vision" + ] + }, + { + "name": "sophnet/Qwen3-235B-A22B-Thinking-2507", + "max_tokens": 80000, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "deepseek-v3.2-exp-thinking", + "max_tokens": 128000, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "claude-sonnet-4-5-20250929", + "max_tokens": 200000, + "model_types": [ + "chat" + ], + "alias": [ + "anthropic/claude-sonnet-4-5-20250929" + ] + }, + { + "name": "claude-sonnet-4-5-20250929-thinking", + "max_tokens": 200000, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "cc-sonnet-4-5-20250929", + "max_tokens": 200000, + "model_types": [ + "chat" + ] + }, + { + "name": "Kwaipilot/KAT-Dev", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "inclusionAI/Ring-flash-2.0", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "inclusionAI/Ling-flash-2.0", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "doubao-seed-1-6-vision-250815", + "max_tokens": 256000, + "model_types": [ + "chat", + "image2text", + "vision" + ], + "alias": [ + "doubao-seed-1-6-vision" + ], + "max_completion_tokens": 32768, + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "sora-2", + "max_tokens": 60000, + "model_types": [ + "chat", + "video_generation" + ], + "alias": [ + "openai/sora-2", + "Sora 2" + ] + }, + { + "name": "gpt-realtime-mini", + "max_tokens": 32000, + "model_types": [ + "chat" + ] + }, + { + "name": "gpt-realtime-mini-2025-10-06", + "max_tokens": 32000, + "model_types": [ + "chat" + ] + }, + { + "name": "gpt-image-1-mini", + "max_tokens": 32000, + "model_types": [ + "text-to-image", + "image_generation", + "image", + "image_edit", + "chat" + ], + "alias": [ + "openai/gpt-image-1-mini" + ] + }, + { + "name": "gpt-5-pro", + "max_tokens": 400000, + "model_types": [ + "chat" + ], + "alias": [ + "openai/gpt-5-pro" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "gpt-5-pro-2025-10-06", + "max_tokens": 400000, + "model_types": [ + "chat" + ], + "alias": [ + "openai/gpt-5-pro-2025-10-06" + ] + }, + { + "name": "Pro/deepseek-ai/DeepSeek-V3.2-Exp", + "max_tokens": 160000, + "model_types": [ + "chat" + ] + }, + { + "name": "sf/zai-org/GLM-4.6", + "max_tokens": 198000, + "model_types": [ + "chat" + ] + }, + { + "name": "sophnet/DeepSeek-V3.2-Exp", + "max_tokens": 163000, + "model_types": [ + "chat" + ] + }, + { + "name": "sophnet/GLM-4.6", + "max_tokens": 202000, + "model_types": [ + "chat" + ] + }, + { + "name": "cc-haiku-4-5-20251001", + "max_tokens": 200000, + "model_types": [ + "chat" + ] + }, + { + "name": "s1", + "max_tokens": 32000, + "model_types": [ + "chat" + ] + }, + { + "name": "kling-v2-5-turbo", + "model_types": [ + "chat" + ], + "alias": [ + "kling/kling-v2-5-turbo" + ] + }, + { + "name": "claude-haiku-4-5-20251001-thinking", + "max_tokens": 200000, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "viduq2", + "model_types": [ + "chat", + "image", + "image_edit" + ] + }, + { + "name": "doubao-seedance-1-0-pro-fast-251015", + "model_types": [ + "video_generation" + ], + "alias": [ + "doubao-seedance-1-0-pro-fast" + ] + }, + { + "name": "Baichuan-M2-Plus", + "max_tokens": 32000, + "model_types": [ + "chat" + ] + }, + { + "name": "KAT-Coder-Air-V1", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "KAT-Coder-Pro-V1", + "max_tokens": 256000, + "model_types": [ + "chat" + ] + }, + { + "name": "KAT-Coder-Exp-72B-1010", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "MiniMax-Hailuo-2.3", + "model_types": [ + "chat", + "video_generation", + "video_understanding" + ] + }, + { + "name": "MiniMax-Hailuo-2.3-Fast", + "model_types": [ + "chat" + ] + }, + { + "name": "speech-2.6-turbo", + "model_types": [ + "chat", + "tts" + ], + "alias": [ + "minimax/speech-2.6-turbo", + "Minimax Speech 2.6 Turbo" + ], + "max_tokens": 448 + }, + { + "name": "speech-2.6-hd", + "model_types": [ + "chat", + "tts" + ] + }, + { + "name": "minimax-image-01", + "model_types": [ + "text-to-image", + "image_generation" + ], + "alias": [ + "minimaxi-image-01-live", + "minimax-image-01-live" + ] + }, + { + "name": "gpt-4o-transcribe-diarize", + "max_tokens": 16000, + "model_types": [ + "chat" + ] + }, + { + "name": "voyage-3-large", + "model_types": [ + "chat" + ] + }, + { + "name": "voyage-context-3", + "model_types": [ + "chat" + ] + }, + { + "name": "voyage-3.5", + "model_types": [ + "chat" + ] + }, + { + "name": "voyage-3.5-lite", + "model_types": [ + "chat" + ] + }, + { + "name": "voyage-code-3", + "model_types": [ + "chat" + ] + }, + { + "name": "voyage-finance-2", + "model_types": [ + "chat" + ] + }, + { + "name": "voyage-law-2", + "model_types": [ + "chat" + ] + }, + { + "name": "voyage-code-2", + "model_types": [ + "chat" + ] + }, + { + "name": "rerank-2.5", + "model_types": [ + "rerank" + ] + }, + { + "name": "rerank-2.5-lite", + "model_types": [ + "rerank" + ] + }, + { + "name": "music-2.0", + "model_types": [ + "chat" + ] + }, + { + "name": "music-1.5", + "model_types": [ + "chat" + ] + }, + { + "name": "kimi-k2-thinking", + "max_tokens": 262144, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "kimi-k2-thinking-turbo", + "max_tokens": 262144, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "doubao-seed-code-preview-251028", + "max_tokens": 256000, + "model_types": [ + "chat", + "vision", + "image2text" + ], + "alias": [ + "doubao-seed-code" + ], + "max_completion_tokens": 32768, + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "kimi-for-coding", + "max_tokens": 256000, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "doubao-seed-code-preview-latest", + "max_tokens": 256000, + "model_types": [ + "chat" + ] + }, + { + "name": "gpt-5.1-plus", + "max_tokens": 400000, + "model_types": [ + "chat" + ] + }, + { + "name": "gpt-5.1-thinking-plus", + "max_tokens": 400000, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "gpt-5.1-2025-11-13", + "max_tokens": 400000, + "model_types": [ + "chat" + ], + "alias": [ + "openai/gpt-5.1-2025-11-13" + ] + }, + { + "name": "gpt-5.1-chat-latest", + "max_tokens": 128000, + "model_types": [ + "chat" + ], + "alias": [ + "openai/gpt-5.1-chat-latest" + ] + }, + { + "name": "ernie-x1.1-preview", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "ernie-5.0-thinking-latest", + "max_tokens": 128000, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "ernie-5.0-thinking-preview", + "max_tokens": 128000, + "model_types": [ + "chat", + "vision", + "image2text" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + }, + "alias": [ + "baidu/ernie-5.0-thinking-preview" + ], + "max_completion_tokens": 64000 + }, + { + "name": "grok-4.1", + "max_tokens": 200000, + "model_types": [ + "chat" + ] + }, + { + "name": "claude-opus-4-5-20251101", + "max_tokens": 200000, + "model_types": [ + "chat" + ], + "alias": [ + "anthropic/claude-opus-4-5-20251101", + "anthropic/claude-opus-4-5", + "claude-opus-4-5", + "anthropic/claude-opus-4.5", + "claude-opus-4.5" + ] + }, + { + "name": "cc-opus-4-5-20251101", + "max_tokens": 200000, + "model_types": [ + "chat" + ] + }, + { + "name": "deepseek-v3.2-thinking", + "max_tokens": 128000, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "doubao-seedream-4-5-251128", + "model_types": [ + "text-to-image", + "image_generation", + "image", + "image_edit" + ], + "alias": [ + "doubao-seedream-4-5" + ] + }, + { + "name": "gpt-5.2-2025-12-11", + "max_tokens": 400000, + "model_types": [ + "chat" + ], + "alias": [ + "openai/gpt-5.2-2025-12-11" + ] + }, + { + "name": "gpt-5.2-chat-latest", + "max_tokens": 128000, + "model_types": [ + "chat" + ], + "alias": [ + "openai/gpt-5.2-chat-latest" + ] + }, + { + "name": "gpt-5.2-pro", + "max_tokens": 400000, + "model_types": [ + "chat" + ], + "alias": [ + "openai/gpt-5.2-pro" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "claude-opus-4-5-20251101-thinking", + "max_tokens": 200000, + "model_types": [ + "chat" + ] + }, + { + "name": "glm-asr-2512", + "model_types": [ + "asr", + "speech2text" + ] + }, + { + "name": "glm-tts-clone", + "model_types": [ + "tts" + ] + }, + { + "name": "mistral-large-2512", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "ministral-14b-2512", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "ministral-8b-2512", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "ministral-3b-2512", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "devstral-2512", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "gpt-4o-mini-tts-2025-12-15", + "model_types": [ + "tts", + "chat" + ], + "alias": [ + "openai/gpt-4o-mini-tts-2025-12-15" + ] + }, + { + "name": "gpt-image-1.5", + "max_tokens": 32000, + "model_types": [ + "text-to-image", + "image_generation", + "image", + "image_edit", + "chat" + ], + "alias": [ + "gpt-image-1.5-all", + "openai/gpt-image-1.5", + "GPT Image 1.5" + ] + }, + { + "name": "doubao-seed-1-8-251215", + "max_tokens": 224000, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "glm-for-coding", + "max_tokens": 200000, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "higgsfield-soul-standard", + "model_types": [ + "chat" + ] + }, + { + "name": "higgsfield-dop-standard", + "model_types": [ + "chat" + ] + }, + { + "name": "glm-4.7-preview", + "max_tokens": 200000, + "model_types": [ + "chat" + ] + }, + { + "name": "glm-4.7-coding-preview", + "max_tokens": 200000, + "model_types": [ + "chat" + ] + }, + { + "name": "MiniMax-M2.1-highspeed", + "max_tokens": 1000000, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "doubao-seedance-1-5-pro-251215", + "model_types": [ + "video_generation" + ], + "alias": [ + "doubao-seedance-1-5-pro" + ] + }, + { + "name": "qwq-plus-latest", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "qwq-plus-2025-03-05", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "qvq-max-latest", + "max_tokens": 128000, + "model_types": [ + "chat", + "vision", + "image2text" + ] + }, + { + "name": "qvq-max-2025-05-15", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "qvq-max-2025-03-25", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "qvq-plus", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "qvq-plus-latest", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "qvq-plus-2025-05-15", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "qwen-plus-2024-07-23", + "max_tokens": 32000, + "model_types": [ + "chat" + ] + }, + { + "name": "qwen-max-2024-04-28", + "max_tokens": 131072, + "model_types": [ + "chat" + ] + }, + { + "name": "qwen-max-2024-04-03", + "max_tokens": 131072, + "model_types": [ + "chat" + ] + }, + { + "name": "qwen-turbo-2025-02-11", + "max_tokens": 1000000, + "model_types": [ + "chat" + ] + }, + { + "name": "qwen-turbo-2024-06-24", + "max_tokens": 8000, + "model_types": [ + "chat" + ] + }, + { + "name": "tongyi-intent-detect-v3", + "max_tokens": 8000, + "model_types": [ + "chat" + ] + }, + { + "name": "sophnet/DeepSeek-V3.2-Fast", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "sophnet/DeepSeek-Math-V2", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "sophnet/DeepSeek-V3.2", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "sophnet/DeepSeek-V3-0324", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "sophnet/MiMo-V2-Flash", + "max_tokens": 256000, + "model_types": [ + "chat" + ] + }, + { + "name": "sophnet/MiniMax-M2.1", + "max_tokens": 1000000, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "sophnet/MiniMax-M2", + "max_tokens": 1000000, + "model_types": [ + "chat" + ] + }, + { + "name": "sophnet/GLM-4.7", + "max_tokens": 202000, + "model_types": [ + "chat" + ] + }, + { + "name": "sophnet/GLM-4.6V", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "sophnet/Kimi-K2-Thinking", + "max_tokens": 256000, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "sophnet/LongCat-Flash-Thinking", + "max_tokens": 128000, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "xiaomimimo/mimo-v2-flash", + "max_tokens": 262144, + "model_types": [ + "chat" + ], + "alias": [ + "mimo-v2-flash" + ], + "max_completion_tokens": 32000, + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "moonshotai/kimi-k2-thinking", + "max_tokens": 128000, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + }, + "alias": [ + "Kimi K2 Thinking" + ], + "max_completion_tokens": 262144 + }, + { + "name": "kat-coder", + "max_tokens": 256000, + "model_types": [ + "chat" + ], + "max_completion_tokens": 128000 + }, + { + "name": "moonshotai/kimi-k2-0905", + "max_tokens": 262144, + "model_types": [ + "chat" + ], + "alias": [ + "kimi-k2-0905", + "Kimi K2 0905" + ], + "max_completion_tokens": 262144 + }, + { + "name": "baidu/ernie-4.5-vl-28b-a3b", + "max_tokens": 30000, + "model_types": [ + "chat", + "image2text", + "vision" + ], + "alias": [ + "ernie-4.5-vl-28b-a3b", + "ERNIE 4.5 VL 28B A3B" + ], + "max_completion_tokens": 8000, + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "Pro/moonshotai/Kimi-K2-Thinking", + "max_tokens": 256000, + "model_types": [ + "chat" + ] + }, + { + "name": "Pro/THUDM/GLM-4.1V-9B-Thinking", + "max_tokens": 64000, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "ascend-tribe/pangu-pro-moe", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "Pro/deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "s2", + "alias": [ + "s3" + ], + "max_tokens": 32000, + "model_types": [ + "chat" + ] + }, + { + "name": "u2", + "max_tokens": 32000, + "model_types": [ + "chat" + ] + }, + { + "name": "minimax-for-coding", + "max_tokens": 200000, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "glm-4.7-flashx", + "max_tokens": 200000, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "Baichuan-M3", + "max_tokens": 32000, + "model_types": [ + "chat" + ] + }, + { + "name": "qwen3-rerank", + "max_tokens": 30000, + "model_types": [ + "rerank" + ] + }, + { + "name": "M2-her", + "max_tokens": 1000000, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + }, + "alias": [ + "minimax/m2-her" + ] + }, + { + "name": "music-2.5", + "model_types": [ + "chat" + ] + }, + { + "name": "Pro/moonshotai/Kimi-K2.5", + "max_tokens": 256000, + "model_types": [ + "chat" + ] + }, + { + "name": "deepseek/deepseek-ocr-2", + "max_tokens": 8192, + "model_types": [ + "chat", + "image2text", + "vision", + "ocr" + ], + "alias": [ + "DeepSeek-OCR 2" + ], + "max_completion_tokens": 8192 + }, + { + "name": "speech-2.8-hd", + "model_types": [ + "chat", + "tts" + ] + }, + { + "name": "speech-2.8-turbo", + "model_types": [ + "chat", + "tts" + ], + "alias": [ + "minimax/speech-2.8-turbo", + "Minimax Speech 2.8 Turbo" + ], + "max_tokens": 448 + }, + { + "name": "Pro/zai-org/GLM-5", + "max_tokens": 198000, + "model_types": [ + "chat" + ] + }, + { + "name": "MiniMax-M2.5-highspeed", + "max_tokens": 204800, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + }, + "alias": [ + "minimax/minimax-m2.5-highspeed", + "MiniMax M2.5-highspeed" + ], + "max_completion_tokens": 131100 + }, + { + "name": "doubao-seed-2-0-pro-260215", + "max_tokens": 256000, + "model_types": [ + "chat", + "vision", + "image2text" + ], + "alias": [ + "doubao-seed-2-0-pro" + ], + "max_completion_tokens": 131072, + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "doubao-seed-2-0-lite-260215", + "max_tokens": 256000, + "model_types": [ + "chat", + "vision", + "image2text", + "audio", + "speech2text" + ], + "alias": [ + "doubao-seed-2-0-lite", + "doubao-seed-2-0-lite-260428" + ], + "max_completion_tokens": 131072, + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "doubao-seed-2-0-mini-260215", + "max_tokens": 256000, + "model_types": [ + "chat", + "vision", + "image2text", + "audio", + "speech2text" + ], + "alias": [ + "doubao-seed-2-0-mini", + "doubao-seed-2-0-mini-260428" + ], + "max_completion_tokens": 131072, + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "doubao-seed-2-0-code-preview-260215", + "max_tokens": 256000, + "model_types": [ + "chat", + "vision", + "image2text" + ], + "alias": [ + "doubao-seed-2-0-code" + ], + "max_completion_tokens": 131072, + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "sophnet/GLM-5", + "max_tokens": 202000, + "model_types": [ + "chat" + ] + }, + { + "name": "claude-sonnet-4-6-thinking", + "max_tokens": 1000000, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "cc-sonnet-4-6", + "max_tokens": 1000000, + "model_types": [ + "chat" + ] + }, + { + "name": "doubao-seedream-5-0-260128", + "model_types": [ + "text-to-image", + "image_generation" + ], + "alias": [ + "doubao-seedream-5-0" + ] + }, + { + "name": "kling-v2-6", + "model_types": [ + "chat" + ], + "alias": [ + "kling/kling-v2-6" + ] + }, + { + "name": "gpt-5.3-chat-latest", + "max_tokens": 128000, + "model_types": [ + "chat" + ], + "alias": [ + "openai/gpt-5.3-chat-latest" + ] + }, + { + "name": "gpt-5.4-pro-2026-03-05", + "alias": [ + "gpt-5.4-pro", + "openai/gpt-5.4-pro", + "openai/gpt-5.4-pro-2026-03-05" + ], + "max_tokens": 1050000, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "kling-image-o1", + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "kling-v3-omni", + "model_types": [ + "chat" + ], + "alias": [ + "kling/kling-v3-omni" + ] + }, + { + "name": "glm-5-turbo", + "max_tokens": 200000, + "model_types": [ + "chat" + ], + "alias": [ + "zai-org/glm-5-turbo" + ], + "max_completion_tokens": 131072, + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "gpt-5.4-nano", + "max_tokens": 400000, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + }, + "alias": [ + "openai/gpt-5.4-nano" + ] + }, + { + "name": "music-2.5+", + "model_types": [ + "chat" + ] + }, + { + "name": "MiniMax-M2.7-highspeed", + "max_tokens": 204800, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + }, + "alias": [ + "minimax/minimax-m2.7-highspeed", + "MiniMax M2.7-highspeed" + ], + "max_completion_tokens": 131072 + }, + { + "name": "gpt-5.4-mini-2026-03-17", + "max_tokens": 400000, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + }, + "alias": [ + "openai/gpt-5.4-mini-2026-03-17" + ] + }, + { + "name": "gpt-5.4-nano-2026-03-17", + "max_tokens": 400000, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + }, + "alias": [ + "openai/gpt-5.4-nano-2026-03-17" + ] + }, + { + "name": "mimo-v2-pro", + "max_tokens": 1000000, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + }, + "alias": [ + "xiaomimimo/mimo-v2-pro" + ], + "max_completion_tokens": 131072 + }, + { + "name": "mimo-v2-omni", + "max_tokens": 256000, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "glm-5v-turbo", + "max_tokens": 200000, + "model_types": [ + "chat", + "vision", + "image2text" + ], + "alias": [ + "zai-org/glm-5v-turbo" + ], + "max_completion_tokens": 131072, + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "doubao-seedance-2-0-fast-260128", + "model_types": [ + "video_generation" + ], + "alias": [ + "doubao-seedance-2-0-fast" + ] + }, + { + "name": "doubao-seedance-2-0-260128", + "model_types": [ + "video_generation" + ], + "alias": [ + "doubao-seedance-2-0" + ] + }, + { + "name": "claude-opus-4-7", + "max_tokens": 1000000, + "model_types": [ + "chat", + "image2text", + "vision", + "ocr" + ], + "alias": [ + "anthropic/claude-opus-4-7", + "anthropic/claude-opus-4.7", + "claude-opus-4.7" + ] + }, + { + "name": "cc-opus-4-7", + "max_tokens": 200000, + "model_types": [ + "chat" + ] + }, + { + "name": "claude-opus-4-7-thinking", + "max_tokens": 1000000, + "model_types": [ + "chat" + ] + }, + { + "name": "chat-latest", + "max_tokens": 400000, + "model_types": [ + "chat" + ] + }, + { + "name": "sensenova-6.7-flash-lite", + "max_tokens": 32000, + "model_types": [ + "chat" + ] + }, + { + "name": "cc-opus-4-8", + "max_tokens": 200000, + "model_types": [ + "chat" + ] + }, + { + "name": "Bria/video_mask_by_key_points", + "alias": [ + "video_mask_by_key_points" + ], + "model_types": [ + "video_generation" + ] + }, + { + "name": "meta-llama/Llama-3.3-70B-Instruct-Turbo", + "alias": [ + "Llama-3.3-70B-Instruct-Turbo", + "Meta Llama 3.3 70B Instruct Turbo" + ], + "max_tokens": 131072, + "model_types": [ + "chat" + ] + }, + { + "name": "Qwen/Qwen3-TTS-VoiceDesign", + "alias": [ + "Qwen3-TTS-VoiceDesign" + ], + "model_types": [ + "tts" + ] + }, + { + "name": "PrunaAI/p-image", + "alias": [ + "p-image" + ], + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "Wan-AI/Wan2.6-T2V", + "alias": [ + "Wan2.6-T2V" + ], + "model_types": [ + "video_generation" + ] + }, + { + "name": "openai/whisper-timestamped-medium.en", + "alias": [ + "whisper-timestamped-medium.en" + ], + "model_types": [ + "asr", + "speech2text" + ] + }, + { + "name": "deepseek-ai/Janus-Pro-1B", + "alias": [ + "Janus-Pro-1B" + ], + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "ByteDance/Seedance-2.0", + "alias": [ + "Seedance-2.0", + "ByteDance Seedance 2.0" + ], + "model_types": [ + "video_generation" + ] + }, + { + "name": "Bria/video_eraser", + "alias": [ + "video_eraser" + ], + "model_types": [ + "video_generation" + ] + }, + { + "name": "Sao10K/L3.3-70B-Euryale-v2.3", + "alias": [ + "L3.3-70B-Euryale-v2.3" + ], + "max_tokens": 131072, + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/Llama-3.3-Nemotron-Super-49B-v1.5", + "alias": [ + "Llama-3.3-Nemotron-Super-49B-v1.5" + ], + "max_tokens": 131072, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "sentence-transformers/clip-ViT-B-32-multilingual-v1", + "alias": [ + "clip-ViT-B-32-multilingual-v1" + ], + "max_tokens": 512, + "max_dimension": 512, + "model_types": [ + "embedding" + ] + }, + { + "name": "stabilityai/sd3.5-medium", + "alias": [ + "sd3.5-medium" + ], + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "Qwen/Qwen3-Embedding-0.6B-batch", + "alias": [ + "Qwen3-Embedding-0.6B-batch" + ], + "max_tokens": 32768, + "max_dimension": 1024, + "model_types": [ + "embedding" + ] + }, + { + "name": "mistralai/Mixtral-8x7B-Instruct-v0.1", + "alias": [ + "Mixtral-8x7B-Instruct-v0.1", + "Mixtral-8x7B Instruct v0.1" + ], + "max_tokens": 32768, + "model_types": [ + "chat" + ] + }, + { + "name": "runwayml/stable-diffusion-v1-5", + "alias": [ + "stable-diffusion-v1-5" + ], + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "Bria/erase", + "alias": [ + "erase" + ], + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "mistralai/Mixtral-8x22B-Instruct-v0.1", + "alias": [ + "Mixtral-8x22B-Instruct-v0.1", + "Mixtral 8X22b Instruct V0.1" + ], + "max_tokens": 65536, + "model_types": [ + "chat" + ] + }, + { + "name": "allenai/olmOCR-7B-1025", + "alias": [ + "olmOCR-7B-1025" + ], + "max_tokens": 16384, + "model_types": [ + "chat", + "image2text", + "vision" + ] + }, + { + "name": "Wan-AI/Wan2.6-Image-Edit", + "alias": [ + "Wan2.6-Image-Edit" + ], + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "mistralai/Voxtral-Small-24B-2507", + "alias": [ + "Voxtral-Small-24B-2507" + ], + "max_tokens": 32768, + "model_types": [ + "asr", + "speech2text" + ] + }, + { + "name": "Bria/fibo", + "alias": [ + "fibo" + ], + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "sesame/csm-1b", + "alias": [ + "csm-1b" + ], + "model_types": [ + "tts" + ] + }, + { + "name": "Sao10K/L3.1-70B-Euryale-v2.2", + "alias": [ + "L3.1-70B-Euryale-v2.2" + ], + "max_tokens": 131072, + "model_types": [ + "chat" + ] + }, + { + "name": "stabilityai/stable-diffusion-2-1", + "alias": [ + "stable-diffusion-2-1" + ], + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "inworld-ai/realtime-tts-2", + "alias": [ + "realtime-tts-2" + ], + "model_types": [ + "tts" + ] + }, + { + "name": "Bria/video_mask_by_prompt", + "alias": [ + "video_mask_by_prompt" + ], + "model_types": [ + "video_generation" + ] + }, + { + "name": "black-forest-labs/FLUX-1-Redux-dev", + "alias": [ + "FLUX-1-Redux-dev" + ], + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "XiaomiMiMo/MiMo-V2.5-tts-voicedesign", + "alias": [ + "MiMo-V2.5-tts-voicedesign" + ], + "model_types": [ + "tts" + ] + }, + { + "name": "ByteDance/Seedream-4.5", + "alias": [ + "Seedream-4.5" + ], + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "nvidia/Nemotron-3.5-ASR-Streaming-Multilingual-0.6b", + "alias": [ + "Nemotron-3.5-ASR-Streaming-Multilingual-0.6b" + ], + "model_types": [ + "asr", + "speech2text" + ] + }, + { + "name": "thenlper/gte-base", + "alias": [ + "gte-base" + ], + "max_tokens": 512, + "max_dimension": 768, + "model_types": [ + "embedding" + ] + }, + { + "name": "hexgrad/Kokoro-82M", + "alias": [ + "Kokoro-82M", + "Kokoro 82M" + ], + "model_types": [ + "tts" + ] + }, + { + "name": "intfloat/e5-base-v2", + "alias": [ + "e5-base-v2" + ], + "max_tokens": 512, + "max_dimension": 768, + "model_types": [ + "embedding" + ] + }, + { + "name": "ByteDance/Seed-2.0-mini", + "alias": [ + "Seed-2.0-mini" + ], + "max_tokens": 256000, + "model_types": [ + "chat", + "image2text", + "vision" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "Bria/remove_background", + "alias": [ + "remove_background" + ], + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "meta-llama/Meta-Llama-3.1-8B-Instruct", + "alias": [ + "Meta-Llama-3.1-8B-Instruct" + ], + "max_tokens": 131072, + "model_types": [ + "chat" + ] + }, + { + "name": "stabilityai/sd3.5", + "alias": [ + "sd3.5" + ], + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "thenlper/gte-large", + "alias": [ + "gte-large" + ], + "max_tokens": 512, + "max_dimension": 1024, + "model_types": [ + "embedding" + ] + }, + { + "name": "microsoft/WizardLM-2-8x22B", + "alias": [ + "WizardLM-2-8x22B", + "Wizardlm 2 8x22B" + ], + "max_tokens": 65536, + "model_types": [ + "chat" + ], + "max_completion_tokens": 8000 + }, + { + "name": "mistralai/Mistral-Small-3.1-24B-Instruct-2503", + "alias": [ + "Mistral-Small-3.1-24B-Instruct-2503" + ], + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "mattshumer/Reflection-Llama-3.1-70B", + "alias": [ + "Reflection-Llama-3.1-70B" + ], + "max_tokens": 8192, + "model_types": [ + "chat" + ] + }, + { + "name": "anthropic/claude-4-opus", + "alias": [ + "claude-4-opus" + ], + "max_tokens": 200000, + "model_types": [ + "chat", + "image2text", + "vision", + "ocr" + ] + }, + { + "name": "canopylabs/orpheus-3b-0.1-ft", + "alias": [ + "orpheus-3b-0.1-ft", + "Orpheus 3B 0.1 FT" + ], + "model_types": [ + "tts" + ] + }, + { + "name": "black-forest-labs/FLUX-1-schnell", + "alias": [ + "FLUX-1-schnell", + "black-forest-labs/FLUX.1-schnell", + "FLUX.1-schnell", + "FLUX.1 Schnell" + ], + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "ClarityAI/creative", + "alias": [ + "creative" + ], + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "Bria/blur_background", + "alias": [ + "blur_background" + ], + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "Bria/replace_background", + "alias": [ + "replace_background" + ], + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "nvidia/Nemotron-3-Nano-Omni-30B-A3B-Reasoning", + "alias": [ + "Nemotron-3-Nano-Omni-30B-A3B-Reasoning" + ], + "max_tokens": 262144, + "model_types": [ + "chat", + "image2text", + "vision" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "Phind/Phind-CodeLlama-34B-v2", + "alias": [ + "Phind-CodeLlama-34B-v2" + ], + "max_tokens": 4096, + "model_types": [ + "chat" + ] + }, + { + "name": "microsoft/Phi-3-medium-4k-instruct", + "alias": [ + "Phi-3-medium-4k-instruct" + ], + "max_tokens": 4096, + "model_types": [ + "chat" + ] + }, + { + "name": "meta-llama/Llama-4-Maverick-17B-128E-Instruct-Turbo", + "alias": [ + "Llama-4-Maverick-17B-128E-Instruct-Turbo" + ], + "max_tokens": 8192, + "model_types": [ + "chat" + ] + }, + { + "name": "Wan-AI/Wan2.6-I2V", + "alias": [ + "Wan2.6-I2V" + ], + "model_types": [ + "video_generation" + ] + }, + { + "name": "run-diffusion/Juggernaut-Flux", + "alias": [ + "Juggernaut-Flux" + ], + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "allenai/olmOCR-7B-0825", + "alias": [ + "olmOCR-7B-0825" + ], + "max_tokens": 16384, + "model_types": [ + "chat", + "image2text", + "vision" + ] + }, + { + "name": "anthropic/claude-4-sonnet", + "alias": [ + "claude-4-sonnet" + ], + "max_tokens": 200000, + "model_types": [ + "chat", + "image2text", + "vision", + "ocr" + ] + }, + { + "name": "nvidia/Nemotron-4-340B-Instruct", + "alias": [ + "Nemotron-4-340B-Instruct" + ], + "max_tokens": 4096, + "model_types": [ + "chat" + ] + }, + { + "name": "BAAI/bge-m3-multi", + "alias": [ + "bge-m3-multi" + ], + "max_tokens": 8192, + "max_dimension": 1024, + "model_types": [ + "embedding" + ] + }, + { + "name": "Wan-AI/Wan2.7-Image-Edit", + "alias": [ + "Wan2.7-Image-Edit" + ], + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "cognitivecomputations/dolphin-2.6-mixtral-8x7b", + "alias": [ + "dolphin-2.6-mixtral-8x7b" + ], + "max_tokens": 32768, + "model_types": [ + "chat" + ] + }, + { + "name": "mistralai/Mistral-Small-24B-Instruct-2501", + "alias": [ + "Mistral-Small-24B-Instruct-2501", + "Mistral Small (24B) Instruct 25.01" + ], + "max_tokens": 32768, + "model_types": [ + "chat" + ] + }, + { + "name": "black-forest-labs/FLUX-1-dev", + "alias": [ + "FLUX-1-dev" + ], + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "Wan-AI/Wan2.2-T2V-A14B", + "alias": [ + "Wan2.2-T2V-A14B", + "Wan 2.2 T2V" + ], + "model_types": [ + "video_generation" + ] + }, + { + "name": "ACE-Step/acestep-v15-xl-sft", + "alias": [ + "acestep-v15-xl-sft" + ], + "model_types": [ + "audio_generation" + ] + }, + { + "name": "Pixverse/Pixverse-T2V-HD", + "alias": [ + "Pixverse-T2V-HD" + ], + "model_types": [ + "video_generation" + ] + }, + { + "name": "openai/gpt-oss-120b-Turbo", + "alias": [ + "gpt-oss-120b-Turbo" + ], + "max_tokens": 131072, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "microsoft/Phi-4-multimodal-instruct", + "alias": [ + "Phi-4-multimodal-instruct" + ], + "max_tokens": 131072, + "model_types": [ + "chat", + "image2text", + "vision" + ] + }, + { + "name": "Bria/video_increase_resolution", + "alias": [ + "video_increase_resolution" + ], + "model_types": [ + "video_generation" + ] + }, + { + "name": "sentence-transformers/multi-qa-mpnet-base-dot-v1", + "alias": [ + "multi-qa-mpnet-base-dot-v1" + ], + "max_tokens": 512, + "max_dimension": 768, + "model_types": [ + "embedding" + ] + }, + { + "name": "Bria/Bria-3.2", + "alias": [ + "Bria-3.2" + ], + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "nvidia/NVIDIA-Nemotron-Nano-12B-v2-VL", + "alias": [ + "NVIDIA-Nemotron-Nano-12B-v2-VL" + ], + "max_tokens": 131072, + "model_types": [ + "chat", + "image2text", + "vision", + "ocr" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "NousResearch/Hermes-3-Llama-3.1-70B", + "alias": [ + "Hermes-3-Llama-3.1-70B" + ], + "max_tokens": 131072, + "model_types": [ + "chat" + ] + }, + { + "name": "cognitivecomputations/dolphin-2.9.1-llama-3-70b", + "alias": [ + "dolphin-2.9.1-llama-3-70b" + ], + "max_tokens": 8192, + "model_types": [ + "chat" + ] + }, + { + "name": "allenai/Olmo-3.1-32B-Instruct", + "alias": [ + "Olmo-3.1-32B-Instruct" + ], + "max_tokens": 65536, + "model_types": [ + "chat" + ] + }, + { + "name": "meta-llama/Meta-Llama-3.1-8B-Instruct-Turbo", + "alias": [ + "Meta-Llama-3.1-8B-Instruct-Turbo", + "Meta Llama 3.1 8B Instruct Turbo" + ], + "max_tokens": 131072, + "model_types": [ + "chat" + ] + }, + { + "name": "BAAI/bge-en-icl", + "alias": [ + "bge-en-icl" + ], + "max_tokens": 8192, + "max_dimension": 4096, + "model_types": [ + "embedding" + ] + }, + { + "name": "black-forest-labs/FLUX-pro", + "alias": [ + "FLUX-pro" + ], + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "shibing624/text2vec-base-chinese", + "alias": [ + "text2vec-base-chinese" + ], + "max_tokens": 512, + "max_dimension": 768, + "model_types": [ + "embedding" + ] + }, + { + "name": "ByteDance/Seed-1.8", + "alias": [ + "Seed-1.8" + ], + "max_tokens": 256000, + "model_types": [ + "chat", + "image2text", + "vision" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "mistralai/Mistral-7B-Instruct-v0.3", + "alias": [ + "Mistral-7B-Instruct-v0.3", + "Mistral (7B) Instruct v0.3" + ], + "max_tokens": 32768, + "model_types": [ + "chat" + ] + }, + { + "name": "NovaSky-AI/Sky-T1-32B-Preview", + "alias": [ + "Sky-T1-32B-Preview" + ], + "max_tokens": 32768, + "model_types": [ + "chat" + ] + }, + { + "name": "Wan-AI/Wan2.1-T2V-1.3B", + "alias": [ + "Wan2.1-T2V-1.3B" + ], + "model_types": [ + "video_generation" + ] + }, + { + "name": "PrunaAI/p-video", + "alias": [ + "p-video" + ], + "model_types": [ + "video_generation" + ] + }, + { + "name": "mistralai/Mistral-Nemo-Instruct-2407", + "alias": [ + "Mistral-Nemo-Instruct-2407" + ], + "max_tokens": 131072, + "model_types": [ + "chat" + ] + }, + { + "name": "FastVideo/LTX2-Distilled-Diffusers", + "alias": [ + "LTX2-Distilled-Diffusers" + ], + "model_types": [ + "video_generation" + ] + }, + { + "name": "run-diffusion/Juggernaut-Lightning-Flux", + "alias": [ + "Juggernaut-Lightning-Flux", + "Rundiffusion/Juggernaut-Lightning-Flux", + "Juggernaut Lightning Flux by RunDiffusion" + ], + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "intfloat/e5-large-v2", + "alias": [ + "e5-large-v2" + ], + "max_tokens": 512, + "max_dimension": 1024, + "model_types": [ + "embedding" + ] + }, + { + "name": "Zyphra/Zonos-v0.1-hybrid", + "alias": [ + "Zonos-v0.1-hybrid" + ], + "model_types": [ + "tts" + ] + }, + { + "name": "moonshotai/Kimi-K2.5-Turbo", + "alias": [ + "Kimi-K2.5-Turbo" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "Qwen/Qwen3-Coder-480B-A35B-Instruct-Turbo", + "alias": [ + "Qwen3-Coder-480B-A35B-Instruct-Turbo" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "black-forest-labs/FLUX-2-klein-9b", + "alias": [ + "FLUX-2-klein-9b" + ], + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "microsoft/WizardLM-2-7B", + "alias": [ + "WizardLM-2-7B" + ], + "max_tokens": 32768, + "model_types": [ + "chat" + ] + }, + { + "name": "NousResearch/Hermes-3-Llama-3.1-405B", + "alias": [ + "Hermes-3-Llama-3.1-405B" + ], + "max_tokens": 131072, + "model_types": [ + "chat" + ] + }, + { + "name": "Qwen/Qwen3-Embedding-4B-batch", + "alias": [ + "Qwen3-Embedding-4B-batch" + ], + "max_tokens": 32768, + "max_dimension": 2560, + "model_types": [ + "embedding" + ] + }, + { + "name": "XpucT/Deliberate", + "alias": [ + "Deliberate" + ], + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "Wan-AI/Wan2.7-I2V", + "alias": [ + "Wan2.7-I2V", + "Wan 2.7 I2V" + ], + "model_types": [ + "video_generation" + ] + }, + { + "name": "deepseek-ai/DeepSeek-V3-0324-Turbo", + "alias": [ + "DeepSeek-V3-0324-Turbo" + ], + "max_tokens": 32768, + "model_types": [ + "chat" + ] + }, + { + "name": "lizpreciatior/lzlv_70b_fp16_hf", + "alias": [ + "lzlv_70b_fp16_hf" + ], + "max_tokens": 4096, + "model_types": [ + "chat" + ] + }, + { + "name": "sentence-transformers/clip-ViT-B-32", + "alias": [ + "clip-ViT-B-32" + ], + "max_tokens": 77, + "max_dimension": 512, + "model_types": [ + "embedding" + ] + }, + { + "name": "sentence-transformers/paraphrase-MiniLM-L6-v2", + "alias": [ + "paraphrase-MiniLM-L6-v2" + ], + "max_tokens": 512, + "max_dimension": 384, + "model_types": [ + "embedding" + ] + }, + { + "name": "bosonai/HiggsAudioV2.5", + "alias": [ + "HiggsAudioV2.5" + ], + "model_types": [ + "tts" + ] + }, + { + "name": "Wan-AI/Wan2.7-R2V", + "alias": [ + "Wan2.7-R2V", + "Wan 2.7 R2V" + ], + "model_types": [ + "video_generation" + ] + }, + { + "name": "inworld-ai/inworld-tts-1.5-max", + "alias": [ + "inworld-tts-1.5-max" + ], + "model_types": [ + "tts" + ] + }, + { + "name": "mistralai/Mistral-7B-Instruct-v0.1", + "alias": [ + "Mistral-7B-Instruct-v0.1", + "Mistral (7B) Instruct v0.1" + ], + "max_tokens": 32768, + "model_types": [ + "chat" + ] + }, + { + "name": "openai/whisper-timestamped-medium", + "alias": [ + "whisper-timestamped-medium" + ], + "model_types": [ + "asr", + "speech2text" + ] + }, + { + "name": "deepseek-ai/Janus-Pro-7B", + "alias": [ + "Janus-Pro-7B" + ], + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "intfloat/multilingual-e5-large-instruct", + "alias": [ + "multilingual-e5-large-instruct", + "Multilingual E5 Large Instruct" + ], + "max_tokens": 512, + "max_dimension": 1024, + "model_types": [ + "embedding" + ] + }, + { + "name": "KoboldAI/LLaMA2-13B-Tiefighter", + "alias": [ + "LLaMA2-13B-Tiefighter" + ], + "max_tokens": 4096, + "model_types": [ + "chat" + ] + }, + { + "name": "microsoft/phi-4-reasoning-plus", + "alias": [ + "phi-4-reasoning-plus" + ], + "max_tokens": 32768, + "model_types": [ + "chat" + ] + }, + { + "name": "black-forest-labs/FLUX-2-dev", + "alias": [ + "FLUX-2-dev", + "black-forest-labs/FLUX.2-dev", + "FLUX.2-dev", + "FLUX.2 [dev]" + ], + "model_types": [ + "text-to-image", + "image_generation", + "image", + "image_edit" + ] + }, + { + "name": "openchat/openchat-3.6-8b", + "alias": [ + "openchat-3.6-8b" + ], + "max_tokens": 8192, + "model_types": [ + "chat" + ] + }, + { + "name": "Bria/video_remove_background", + "alias": [ + "video_remove_background" + ], + "model_types": [ + "video_generation" + ] + }, + { + "name": "mistralai/Mistral-7B-Instruct-v0.2", + "alias": [ + "Mistral-7B-Instruct-v0.2", + "mistral-7b" + ], + "max_tokens": 32768, + "model_types": [ + "chat" + ] + }, + { + "name": "CompVis/stable-diffusion-v1-4", + "alias": [ + "stable-diffusion-v1-4" + ], + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "inworld-ai/realtime-tts-1.5-mini", + "alias": [ + "realtime-tts-1.5-mini" + ], + "model_types": [ + "tts" + ] + }, + { + "name": "ClarityAI/crystal", + "alias": [ + "crystal" + ], + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "allenai/olmOCR-2", + "alias": [ + "olmOCR-2" + ], + "max_tokens": 16384, + "model_types": [ + "chat", + "image2text", + "vision" + ] + }, + { + "name": "Austism/chronos-hermes-13b-v2", + "alias": [ + "chronos-hermes-13b-v2" + ], + "max_tokens": 4096, + "model_types": [ + "chat" + ] + }, + { + "name": "bigcode/starcoder2-15b-instruct-v0.1", + "alias": [ + "starcoder2-15b-instruct-v0.1" + ], + "model_types": [ + "chat" + ] + }, + { + "name": "Qwen/Qwen3-Embedding-8B-batch", + "alias": [ + "Qwen3-Embedding-8B-batch" + ], + "max_tokens": 32768, + "max_dimension": 4096, + "model_types": [ + "embedding" + ] + }, + { + "name": "Bria/Bria-3.2-vector", + "alias": [ + "Bria-3.2-vector" + ], + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "Bria/enhance", + "alias": [ + "enhance" + ], + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "sentence-transformers/all-mpnet-base-v2", + "alias": [ + "all-mpnet-base-v2" + ], + "max_tokens": 512, + "max_dimension": 768, + "model_types": [ + "embedding" + ] + }, + { + "name": "Pixverse/Pixverse-6-I2V", + "alias": [ + "Pixverse-6-I2V" + ], + "model_types": [ + "video_generation" + ] + }, + { + "name": "meta-llama/Meta-Llama-3.1-405B-Instruct", + "alias": [ + "Meta-Llama-3.1-405B-Instruct" + ], + "max_tokens": 32768, + "model_types": [ + "chat" + ] + }, + { + "name": "intfloat/multilingual-e5-large", + "alias": [ + "multilingual-e5-large" + ], + "max_tokens": 512, + "max_dimension": 1024, + "model_types": [ + "embedding" + ] + }, + { + "name": "black-forest-labs/FLUX-1.1-pro", + "alias": [ + "FLUX-1.1-pro" + ], + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "meta-llama/Meta-Llama-3.1-70B-Instruct-Turbo", + "alias": [ + "Meta-Llama-3.1-70B-Instruct-Turbo", + "Meta Llama 3.1 70B Instruct Turbo" + ], + "max_tokens": 131072, + "model_types": [ + "chat" + ] + }, + { + "name": "ResembleAI/chatterbox", + "alias": [ + "chatterbox" + ], + "model_types": [ + "tts" + ] + }, + { + "name": "Wan-AI/Wan2.1-T2V-14B", + "alias": [ + "Wan2.1-T2V-14B" + ], + "model_types": [ + "video_generation" + ] + }, + { + "name": "nvidia/Llama-3.1-Nemotron-70B-Instruct", + "alias": [ + "Llama-3.1-Nemotron-70B-Instruct", + "nim/nvidia/llama-3.1-nemotron-70b-instruct" + ], + "max_tokens": 131072, + "model_types": [ + "chat" + ] + }, + { + "name": "black-forest-labs/FLUX-2-pro", + "alias": [ + "FLUX-2-pro", + "black-forest-labs/FLUX.2-pro", + "FLUX.2-pro", + "FLUX.2 [pro]" + ], + "model_types": [ + "text-to-image", + "image_generation", + "chat", + "image", + "image_edit" + ] + }, + { + "name": "ByteDance/Seedance-1.5-Pro", + "alias": [ + "Seedance-1.5-Pro" + ], + "model_types": [ + "video_generation" + ] + }, + { + "name": "Bria/gen_fill", + "alias": [ + "gen_fill" + ], + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "nvidia/NVIDIA-Nemotron-3-Super-120B-A12B", + "alias": [ + "NVIDIA-Nemotron-3-Super-120B-A12B" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "nvidia/NVIDIA-Nemotron-3-Ultra-550B-A55B", + "alias": [ + "NVIDIA-Nemotron-3-Ultra-550B-A55B" + ], + "max_tokens": 262144, + "model_types": [ + "chat", + "image2text", + "vision" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "Bria/expand", + "alias": [ + "expand" + ], + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "inworld-ai/realtime-tts-1.5-max", + "alias": [ + "realtime-tts-1.5-max" + ], + "model_types": [ + "tts" + ] + }, + { + "name": "ResembleAI/chatterbox-turbo", + "alias": [ + "chatterbox-turbo" + ], + "model_types": [ + "tts" + ] + }, + { + "name": "deepinfra/airoboros-70b", + "alias": [ + "airoboros-70b" + ], + "max_tokens": 4096, + "model_types": [ + "chat" + ] + }, + { + "name": "Wan-AI/Wan2.6-T2I", + "alias": [ + "Wan2.6-T2I" + ], + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "PrunaAI/p-video-avatar", + "alias": [ + "p-video-avatar" + ], + "model_types": [ + "video_generation" + ] + }, + { + "name": "stabilityai/sdxl-turbo", + "alias": [ + "sdxl-turbo" + ], + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "BAAI/bge-base-en-v1.5", + "alias": [ + "bge-base-en-v1.5", + "BAAI-Bge-Base-1.5" + ], + "max_tokens": 512, + "max_dimension": 768, + "model_types": [ + "embedding" + ] + }, + { + "name": "Zyphra/Zonos-v0.1-transformer", + "alias": [ + "Zonos-v0.1-transformer" + ], + "model_types": [ + "tts" + ] + }, + { + "name": "Bria/video_foreground_mask", + "alias": [ + "video_foreground_mask" + ], + "model_types": [ + "video_generation" + ] + }, + { + "name": "ByteDance/Seed-2.0-code", + "alias": [ + "Seed-2.0-code" + ], + "max_tokens": 256000, + "model_types": [ + "chat", + "image2text", + "vision" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "Pixverse/Pixverse-T2V", + "alias": [ + "Pixverse-T2V" + ], + "model_types": [ + "video_generation" + ] + }, + { + "name": "nvidia/Cosmos3-Nano", + "alias": [ + "Cosmos3-Nano" + ], + "model_types": [ + "video_generation" + ] + }, + { + "name": "sentence-transformers/all-MiniLM-L12-v2", + "alias": [ + "all-MiniLM-L12-v2" + ], + "max_tokens": 512, + "max_dimension": 384, + "model_types": [ + "embedding" + ] + }, + { + "name": "nvidia/Nemotron-3-Nano-30B-A3B", + "alias": [ + "Nemotron-3-Nano-30B-A3B", + "Nemotron 3 Nano 30B A3B" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + }, + "max_completion_tokens": 32768 + }, + { + "name": "Sao10K/L3-8B-Lunaris-v1", + "alias": [ + "L3-8B-Lunaris-v1" + ], + "max_tokens": 8192, + "model_types": [ + "chat" + ] + }, + { + "name": "black-forest-labs/FLUX-2-klein-4b", + "alias": [ + "FLUX-2-klein-4b" + ], + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "Sao10K/L3-70B-Euryale-v2.1", + "alias": [ + "L3-70B-Euryale-v2.1", + "L3 70B Euryale V2.1" + ], + "max_tokens": 8192, + "model_types": [ + "chat" + ], + "max_completion_tokens": 8192 + }, + { + "name": "deepseek-ai/DeepSeek-R1-0528-Turbo", + "alias": [ + "DeepSeek-R1-0528-Turbo" + ], + "max_tokens": 32768, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "black-forest-labs/FLUX.1-Kontext-dev", + "alias": [ + "FLUX.1-Kontext-dev" + ], + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "microsoft/phi-4", + "alias": [ + "phi-4" + ], + "max_tokens": 16384, + "model_types": [ + "chat" + ] + }, + { + "name": "allenai/olmOCR-2-7B-1025", + "alias": [ + "olmOCR-2-7B-1025" + ], + "max_tokens": 16384, + "model_types": [ + "chat", + "image2text", + "vision", + "ocr" + ] + }, + { + "name": "Bria/erase_foreground", + "alias": [ + "erase_foreground" + ], + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "sentence-transformers/all-MiniLM-L6-v2", + "alias": [ + "all-MiniLM-L6-v2" + ], + "max_tokens": 512, + "max_dimension": 384, + "model_types": [ + "embedding" + ] + }, + { + "name": "Gryphe/MythoMax-L2-13b", + "alias": [ + "MythoMax-L2-13b", + "Mythomax L2 13B" + ], + "max_tokens": 4096, + "model_types": [ + "chat" + ], + "max_completion_tokens": 3200 + }, + { + "name": "XiaomiMiMo/MiMo-V2.5-tts-voiceclone", + "alias": [ + "MiMo-V2.5-tts-voiceclone" + ], + "model_types": [ + "tts" + ] + }, + { + "name": "openchat/openchat_3.5", + "alias": [ + "openchat_3.5" + ], + "max_tokens": 8192, + "model_types": [ + "chat" + ] + }, + { + "name": "mistralai/Voxtral-Mini-3B-2507", + "alias": [ + "Voxtral-Mini-3B-2507" + ], + "max_tokens": 32768, + "model_types": [ + "asr", + "speech2text" + ] + }, + { + "name": "Gryphe/MythoMax-L2-13b-turbo", + "alias": [ + "MythoMax-L2-13b-turbo" + ], + "max_tokens": 4096, + "model_types": [ + "chat" + ] + }, + { + "name": "Sao10K/L3-8B-Lunaris-v1-Turbo", + "alias": [ + "L3-8B-Lunaris-v1-Turbo" + ], + "max_tokens": 8192, + "model_types": [ + "chat" + ] + }, + { + "name": "black-forest-labs/FLUX-2-max", + "alias": [ + "FLUX-2-max", + "black-forest-labs/FLUX.2-max", + "FLUX.2-max", + "FLUX.2 [max]" + ], + "model_types": [ + "text-to-image", + "image_generation", + "image", + "image_edit" + ] + }, + { + "name": "PrunaAI/p-image-Edit", + "alias": [ + "p-image-Edit" + ], + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "Bria/fibo_edit", + "alias": [ + "fibo_edit" + ], + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "Qwen/Qwen3-TTS", + "alias": [ + "Qwen3-TTS" + ], + "model_types": [ + "tts" + ] + }, + { + "name": "deepseek-ai/DeepSeek-R1-Turbo", + "alias": [ + "DeepSeek-R1-Turbo" + ], + "max_tokens": 40960, + "model_types": [ + "chat" + ] + }, + { + "name": "Pixverse/Pixverse-6-T2V", + "alias": [ + "Pixverse-6-T2V" + ], + "model_types": [ + "video_generation" + ] + }, + { + "name": "allenai/olmOCR-7B-0725-FP8", + "alias": [ + "olmOCR-7B-0725-FP8" + ], + "max_tokens": 16384, + "model_types": [ + "chat", + "image2text", + "vision" + ] + }, + { + "name": "openbmb/MiniCPM-Llama3-V-2_5", + "alias": [ + "MiniCPM-Llama3-V-2_5" + ], + "max_tokens": 8192, + "model_types": [ + "chat", + "image2text", + "vision" + ] + }, + { + "name": "meta-llama/Meta-Llama-3.1-70B-Instruct", + "alias": [ + "Meta-Llama-3.1-70B-Instruct" + ], + "max_tokens": 131072, + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/Nemotron-Content-Safety-3.5", + "alias": [ + "Nemotron-Content-Safety-3.5" + ], + "max_tokens": 131072, + "model_types": [ + "chat", + "image2text", + "vision", + "ocr" + ] + }, + { + "name": "ByteDance/Seed-2.0-pro", + "alias": [ + "Seed-2.0-pro" + ], + "max_tokens": 256000, + "model_types": [ + "chat", + "image2text", + "vision" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "mistralai/Mistral-Small-3.2-24B-Instruct-2506", + "alias": [ + "Mistral-Small-3.2-24B-Instruct-2506" + ], + "max_tokens": 128000, + "model_types": [ + "chat", + "image2text", + "vision", + "ocr" + ] + }, + { + "name": "inworld-ai/inworld-tts-1.5-mini", + "alias": [ + "inworld-tts-1.5-mini" + ], + "model_types": [ + "tts" + ] + }, + { + "name": "ResembleAI/chatterbox-multilingual", + "alias": [ + "chatterbox-multilingual" + ], + "model_types": [ + "tts" + ] + }, + { + "name": "ByteDance/Seedream-4", + "alias": [ + "Seedream-4" + ], + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "fishaudio/s2-pro", + "alias": [ + "s2-pro" + ], + "model_types": [ + "tts", + "audio" + ] + }, + { + "name": "fishaudio/s1-mini", + "alias": [ + "s1-mini" + ], + "model_types": [ + "tts", + "audio" + ] + }, + { + "name": "fishaudio/fish-speech-1.5", + "alias": [ + "fish-speech-1.5" + ], + "model_types": [ + "tts", + "audio" + ] + }, + { + "name": "fishaudio/fish-speech-1.4", + "alias": [ + "fish-speech-1.4" + ], + "model_types": [ + "tts", + "audio" + ] + }, + { + "name": "fishaudio/fish-agent-v0.1-3b", + "alias": [ + "fish-agent-v0.1-3b" + ], + "model_types": [ + "audio" + ] + }, + { + "name": "fishaudio/fish-speech-1.2-sft", + "alias": [ + "fish-speech-1.2-sft" + ], + "model_types": [ + "tts", + "audio" + ] + }, + { + "name": "fishaudio/fish-speech-1.2", + "alias": [ + "fish-speech-1.2" + ], + "model_types": [ + "tts", + "audio" + ] + }, + { + "name": "fishaudio/fish-speech-1", + "alias": [ + "fish-speech-1" + ], + "model_types": [ + "tts", + "audio" + ] + }, + { + "name": "fishaudio/speech-lm-v1", + "alias": [ + "speech-lm-v1" + ], + "model_types": [ + "tts", + "audio" + ] + }, + { + "name": "claude-opus-4-6", + "model_types": [ + "chat", + "vision", + "image2text", + "ocr" + ], + "alias": [ + "anthropic/claude-opus-4-6", + "anthropic/claude-opus-4.6", + "claude-opus-4.6" + ], + "max_tokens": 200000 + }, + { + "name": "opendatalab/mineru2.5-pro-2605-1.2b", + "alias": [ + "MinerU2.5-Pro-2605-1.2B" + ], + "max_tokens": 131072, + "model_types": [ + "chat", + "vision", + "image2text", + "ocr" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "opendatalab/mineru2.5-pro-2604-1.2b", + "alias": [ + "MinerU2.5-Pro-2604-1.2B" + ], + "max_tokens": 131072, + "model_types": [ + "chat", + "vision", + "image2text", + "ocr" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "opendatalab/mineru2.5-2509-1.2b", + "alias": [ + "MinerU2.5-2509-1.2B" + ], + "max_tokens": 131072, + "model_types": [ + "chat", + "vision", + "image2text", + "ocr" + ] + }, + { + "name": "opendatalab/mineru-html", + "alias": [ + "MinerU-HTML" + ], + "max_tokens": 131072, + "model_types": [ + "chat" + ] + }, + { + "name": "opendatalab/mineru-diffusion-v1-0320-2.5b", + "alias": [ + "MinerU-Diffusion-V1-0320-2.5B" + ], + "model_types": [ + "vision", + "image2text", + "ocr" + ] + }, + { + "name": "opendatalab/pdf-extract-kit-1.0", + "alias": [ + "PDF-Extract-Kit-1.0" + ], + "model_types": [ + "ocr", + "vision", + "image2text" + ] + }, + { + "name": "opendatalab/mineru-html-v1.1-hunyuan0.5b-compact", + "alias": [ + "MinerU-HTML-v1.1-hunyuan0.5B-compact" + ], + "max_tokens": 32768, + "model_types": [ + "chat" + ] + }, + { + "name": "opendatalab/chartverse-8b", + "alias": [ + "ChartVerse-8B" + ], + "max_tokens": 131072, + "model_types": [ + "chat", + "vision", + "image2text" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "opendatalab/chartverse-4b", + "alias": [ + "ChartVerse-4B" + ], + "max_tokens": 131072, + "model_types": [ + "chat", + "vision", + "image2text" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "opendatalab/chartverse-2b", + "alias": [ + "ChartVerse-2B" + ], + "max_tokens": 131072, + "model_types": [ + "chat", + "vision", + "image2text" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "opendatalab/chartverse-coder", + "alias": [ + "ChartVerse-Coder" + ], + "max_tokens": 131072, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "opendatalab/trivia-3b", + "alias": [ + "TRivia-3B" + ], + "max_tokens": 131072, + "model_types": [ + "chat", + "vision", + "image2text" + ] + }, + { + "name": "opendatalab/belt_road_hungarian_beta1", + "alias": [ + "belt_road_hungarian_beta1" + ], + "max_tokens": 131072, + "model_types": [ + "chat", + "translation" + ] + }, + { + "name": "opendatalab/belt_road_hungarian_beta2", + "alias": [ + "belt_road_hungarian_beta2" + ], + "max_tokens": 131072, + "model_types": [ + "chat", + "translation" + ] + }, + { + "name": "opendatalab/mineru2.0-2505-0.9b", + "alias": [ + "MinerU2.0-2505-0.9B" + ], + "max_tokens": 131072, + "model_types": [ + "chat", + "vision", + "image2text", + "ocr" + ] + }, + { + "name": "opendatalab/meta-rater-1b-professionalism", + "alias": [ + "meta-rater-1b-professionalism" + ], + "max_tokens": 1024, + "model_types": [ + "chat" + ] + }, + { + "name": "opendatalab/meta-rater-1b-cleanliness", + "alias": [ + "meta-rater-1b-cleanliness" + ], + "max_tokens": 1024, + "model_types": [ + "chat" + ] + }, + { + "name": "opendatalab/meta-rater-1b-25raters", + "alias": [ + "meta-rater-1b-25raters" + ], + "max_tokens": 1024, + "model_types": [ + "chat" + ] + }, + { + "name": "opendatalab/meta-rater-1b-readability", + "alias": [ + "meta-rater-1b-readability" + ], + "max_tokens": 1024, + "model_types": [ + "chat" + ] + }, + { + "name": "opendatalab/meta-rater-1b-reasoning", + "alias": [ + "meta-rater-1b-reasoning" + ], + "max_tokens": 1024, + "model_types": [ + "chat" + ] + }, + { + "name": "opendatalab/meta-rater-1b-random", + "alias": [ + "meta-rater-1b-random" + ], + "max_tokens": 1024, + "model_types": [ + "chat" + ] + }, + { + "name": "opendatalab/meta-rater-3b-random", + "alias": [ + "meta-rater-3b-random" + ], + "max_tokens": 1024, + "model_types": [ + "chat" + ] + }, + { + "name": "opendatalab/meta-rater-3b-25raters", + "alias": [ + "meta-rater-3b-25raters" + ], + "max_tokens": 1024, + "model_types": [ + "chat" + ] + }, + { + "name": "opendatalab/meta-rater-7b-random", + "alias": [ + "meta-rater-7b-random" + ], + "max_tokens": 1024, + "model_types": [ + "chat" + ] + }, + { + "name": "opendatalab/meta-rater-7b-25raters", + "alias": [ + "meta-rater-7b-25raters" + ], + "max_tokens": 1024, + "model_types": [ + "chat" + ] + }, + { + "name": "opendatalab/meta-rater-cleanliness-rating", + "alias": [ + "meta-rater-cleanliness-rating" + ], + "max_tokens": 4096, + "model_types": [ + "classification" + ] + }, + { + "name": "opendatalab/meta-rater-readability-rating", + "alias": [ + "meta-rater-readability-rating" + ], + "max_tokens": 4096, + "model_types": [ + "classification" + ] + }, + { + "name": "opendatalab/meta-rater-professionalism-rating", + "alias": [ + "meta-rater-professionalism-rating" + ], + "max_tokens": 4096, + "model_types": [ + "classification" + ] + }, + { + "name": "opendatalab/meta-rater-reasoning-rating", + "alias": [ + "meta-rater-reasoning-rating" + ], + "max_tokens": 4096, + "model_types": [ + "classification" + ] + }, + { + "name": "opendatalab/pdf-extract-kit", + "alias": [ + "PDF-Extract-Kit" + ], + "model_types": [ + "ocr", + "vision", + "image2text" + ] + }, + { + "name": "mj_custom_zoom", + "alias": [ + "mj-custom-zoom" + ], + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "kling-multi-elements", + "model_types": [ + "video_generation", + "video_understanding" + ] + }, + { + "name": "gpt-5.2-codex-2026-01-14", + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "o1-mini-all", + "model_types": [ + "chat", + "vision", + "image2text" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "pixverse-sound-effect", + "model_types": [ + "audio_generation" + ] + }, + { + "name": "pixverse-mimic", + "model_types": [ + "video_generation", + "video_understanding" + ] + }, + { + "name": "gpt-5.2-chat-2025-12-11", + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "mj_blend", + "alias": [ + "mj-blend" + ], + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "glm-4", + "model_types": [ + "chat" + ] + }, + { + "name": "pixverse-lipsync", + "model_types": [ + "tts" + ] + }, + { + "name": "o1-mini-2024-09-12", + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "pixverse-multi-transition", + "model_types": [ + "video_generation", + "video_understanding" + ] + }, + { + "name": "qwq-72b-preview", + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "mj_edits", + "alias": [ + "mj-edits" + ], + "model_types": [ + "chat" + ] + }, + { + "name": "pixverse-modify", + "model_types": [ + "video_generation", + "video_understanding" + ] + }, + { + "name": "happyhorse-1.0-t2v", + "model_types": [ + "video_generation" + ], + "alias": [ + "alibaba/happyhorse-1.0-t2v", + "HappyHorse 1.0 T2V" + ] + }, + { + "name": "ERNIE-3.5-8K", + "model_types": [ + "chat" + ] + }, + { + "name": "gpt-5.5-2026-04-24", + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "mj_high_variation", + "alias": [ + "mj-high-variation" + ], + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "gpt-4-turbo-preview", + "model_types": [ + "chat" + ] + }, + { + "name": "MiniMax-Voice-Design", + "model_types": [ + "tts" + ] + }, + { + "name": "suno_music_open", + "alias": [ + "suno-music-open" + ], + "model_types": [ + "audio_generation" + ] + }, + { + "name": "mj_video", + "alias": [ + "mj-video" + ], + "model_types": [ + "video_generation" + ] + }, + { + "name": "wan2.7-image-pro", + "model_types": [ + "image", + "image_edit", + "text-to-image", + "image_generation" + ] + }, + { + "name": "grok-4.2-image", + "model_types": [ + "text-to-image", + "image_generation" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "kling-image", + "model_types": [ + "image", + "image_edit" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "qwen3-coder", + "model_types": [ + "chat" + ] + }, + { + "name": "ERNIE-Functions-8K", + "model_types": [ + "chat" + ] + }, + { + "name": "mj_pan", + "alias": [ + "mj-pan" + ], + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "happyhorse-1.0-i2v", + "model_types": [ + "video_generation" + ], + "alias": [ + "alibaba/happyhorse-1.0-i2v", + "HappyHorse 1.0 I2V" + ] + }, + { + "name": "o1-pro-all", + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "suno_upload_open", + "alias": [ + "suno-upload-open" + ], + "model_types": [ + "video_generation" + ] + }, + { + "name": "viduq1", + "model_types": [ + "video_generation" + ] + }, + { + "name": "kling-avatar-image2video", + "model_types": [ + "video_generation", + "video_understanding" + ] + }, + { + "name": "kling-motion-control", + "model_types": [ + "video_generation", + "video_understanding" + ] + }, + { + "name": "vidu-tts", + "model_types": [ + "tts" + ] + }, + { + "name": "gpt-audio-2025-08-28", + "model_types": [ + "video_generation" + ] + }, + { + "name": "suno_lyrics_open", + "alias": [ + "suno-lyrics-open" + ], + "model_types": [ + "video_generation" + ] + }, + { + "name": "suno_persona_open", + "alias": [ + "suno-persona-open" + ], + "model_types": [ + "video_generation" + ] + }, + { + "name": "o1-preview-all", + "model_types": [ + "chat", + "vision", + "image2text" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "kling-audio", + "model_types": [ + "tts" + ] + }, + { + "name": "audio1.0", + "model_types": [ + "audio_generation" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "grok-4.20-0309-reasoning", + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + }, + "max_tokens": 1000000, + "alias": [ + "xai/grok-4.20-reasoning", + "grok-4.20-reasoning", + "grok-4.20-reasoning-latest", + "grok-4.20-reasoning-gv2", + "grok-4.20-beta-0309-reasoning", + "grok-4.20-beta-reasoning", + "grok-4.20-beta-latest-reasoning", + "grok-4.20-experimental-beta-0304-reasoning", + "grok-4.20-experimental-beta-reasoning-latest", + "grok-4-20-reasoning" + ] + }, + { + "name": "mj_upload", + "alias": [ + "mj-upload" + ], + "model_types": [ + "chat" + ] + }, + { + "name": "SparkDesk-v3.1", + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "tts-hd-1", + "model_types": [ + "tts" + ] + }, + { + "name": "viduq3-turbo", + "model_types": [ + "video_generation" + ] + }, + { + "name": "grok-video-3-10s", + "model_types": [ + "video_generation" + ] + }, + { + "name": "gpt-5.1-chat", + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "mj_modal", + "alias": [ + "mj-modal" + ], + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "Dolphin3.0-R1-Mistral-24B", + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "gpt-4o-mini-audio-preview", + "model_types": [ + "tts" + ] + }, + { + "name": "happyhorse-1.0-r2v", + "model_types": [ + "video_generation" + ], + "alias": [ + "alibaba/happyhorse-1.0-r2v", + "HappyHorse 1.0 R2V" + ] + }, + { + "name": "pixverse-swap", + "model_types": [ + "video_generation", + "video_understanding" + ] + }, + { + "name": "MiniMax-Voice-Clone", + "model_types": [ + "tts" + ] + }, + { + "name": "viduq2-pro", + "model_types": [ + "video_generation", + "video_understanding" + ] + }, + { + "name": "mj_reroll", + "alias": [ + "mj-reroll" + ], + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "ERNIE-Lite-8K", + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "mj_low_variation", + "alias": [ + "mj-low-variation" + ], + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "kling-custom-elements", + "model_types": [ + "video_generation" + ] + }, + { + "name": "grok-imagine-image-quality", + "model_types": [ + "text-to-image", + "image_generation" + ], + "alias": [ + "xai/grok-imagine-image-quality", + "grok-imagine-image-quality-20260403", + "grok-imagine-image-quality-latest", + "grok-imagine-image-pro" + ] + }, + { + "name": "babbage-002", + "model_types": [ + "chat" + ] + }, + { + "name": "qwen3-30b-a3b-think", + "model_types": [ + "chat" + ] + }, + { + "name": "llama-3-8b", + "model_types": [ + "chat" + ] + }, + { + "name": "gpt-5.3-chat", + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "qwen3-max-preview-n", + "model_types": [ + "chat" + ] + }, + { + "name": "gpt-5.1-codex-2025-11-13", + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "davinci-002", + "model_types": [ + "chat" + ] + }, + { + "name": "grok-3-reasoner", + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "kimi-k2", + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + }, + "alias": [ + "kimi-k2-thinking-251104" + ], + "max_tokens": 262144, + "max_completion_tokens": 32768 + }, + { + "name": "kimi-k2-250905", + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + }, + "max_tokens": 262144, + "max_completion_tokens": 32768 + }, + { + "name": "Embedding-V1", + "model_types": [ + "embedding" + ] + }, + { + "name": "gpt-5-chat", + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "gpt-5-codex-2025-09-15", + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "gpt-image-1-2025-04-15", + "model_types": [ + "chat" + ] + }, + { + "name": "SparkDesk-v3.5", + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "kling-video", + "model_types": [ + "video_generation" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "mj_upscale", + "alias": [ + "mj-upscale" + ], + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "gpt-realtime-1.5", + "model_types": [ + "chat" + ] + }, + { + "name": "gpt-4o-mini-tts-1", + "model_types": [ + "tts" + ] + }, + { + "name": "grok-4-image", + "model_types": [ + "text-to-image", + "image_generation" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "gpt-5.2-chat", + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "kling-video-extend", + "model_types": [ + "video_generation" + ] + }, + { + "name": "o3-mini-high-all", + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "wen-max-2025-01-25", + "model_types": [ + "chat" + ] + }, + { + "name": "pixverse-mask-selection", + "model_types": [ + "video_generation", + "video_understanding" + ] + }, + { + "name": "longcat-flash", + "model_types": [ + "chat" + ] + }, + { + "name": "z-image-turbo", + "model_types": [ + "text-to-image", + "image_generation" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "kimi-k2.7-code", + "model_types": [ + "video_generation", + "chat", + "vision", + "image2text" + ], + "alias": [ + "moonshotai/kimi-k2.7-code", + "Kimi K2.7 Code", + "kimi/kimi-k2.7-code" + ], + "max_tokens": 262144, + "max_completion_tokens": 262144, + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "pixverse-restyle", + "model_types": [ + "video_generation" + ] + }, + { + "name": "suno_concat_open", + "alias": [ + "suno-concat-open" + ], + "model_types": [ + "video_generation" + ] + }, + { + "name": "kling-effects", + "model_types": [ + "video_generation" + ] + }, + { + "name": "llama-3-70b", + "model_types": [ + "chat" + ] + }, + { + "name": "grok-4.1-image", + "model_types": [ + "text-to-image", + "image_generation" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "SparkDesk-v2.1", + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "viduq3-mix", + "model_types": [ + "video_generation" + ] + }, + { + "name": "llama-3-sonar-small-32k-chat", + "model_types": [ + "chat" + ] + }, + { + "name": "ERNIE-Tiny-8K", + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "MiniMax-File-Upload", + "model_types": [ + "chat" + ] + }, + { + "name": "kling-image-recognize", + "model_types": [ + "image_understanding", + "vision" + ] + }, + { + "name": "gpt-5.3-chat-2026-03-03", + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "kling-advanced-custom-elements", + "model_types": [ + "video_generation" + ] + }, + { + "name": "viduq1-classic", + "model_types": [ + "video_generation" + ] + }, + { + "name": "suno_upsample_open", + "alias": [ + "suno-upsample-open" + ], + "model_types": [ + "video_generation" + ] + }, + { + "name": "grok-video-3", + "model_types": [ + "video_generation" + ] + }, + { + "name": "pixverse-upload", + "model_types": [ + "chat" + ] + }, + { + "name": "viduq3-pro", + "model_types": [ + "video_generation" + ] + }, + { + "name": "o1-preview-2024-09-12", + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "flux.1-kontext-pro", + "model_types": [ + "text-to-image", + "image_generation", + "image", + "image_edit" + ], + "alias": [ + "black-forest-labs/FLUX.1-kontext-pro", + "FLUX.1 Kontext [pro]" + ] + }, + { + "name": "mj_variation", + "alias": [ + "mj-variation" + ], + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "kling-omni-image", + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "kling-omni-video", + "model_types": [ + "video_generation" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "grok-3-image", + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "mj_zoom", + "alias": [ + "mj-zoom" + ], + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "mj_imagine", + "alias": [ + "mj-imagine" + ], + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "mj_inpaint", + "alias": [ + "mj-inpaint" + ], + "model_types": [ + "image", + "image_edit" + ] + }, + { + "name": "gpt-5.2-pro-2025-12-11", + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + }, + "alias": [ + "openai/gpt-5.2-pro-2025-12-11" + ] + }, + { + "name": "kling-custom-voices", + "model_types": [ + "tts" + ] + }, + { + "name": "SparkDesk-v1.1", + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "ERNIE-Speed-8K", + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "viduq2-turbo", + "model_types": [ + "video_generation" + ] + }, + { + "name": "deepseek-v3-1-think-250821", + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "gpt-5.1-codex-max-2025-12-04", + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "o1-preview", + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "gpt-4o-mini-audio-preview-2024-12-17", + "model_types": [ + "tts" + ] + }, + { + "name": "wan2.5-i2v-preview", + "model_types": [ + "video_generation" + ] + }, + { + "name": "pixverse-image-template", + "model_types": [ + "video_generation" + ] + }, + { + "name": "gpt-5.3-codex-2026-02-24", + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "vidu2.0", + "model_types": [ + "video_generation" + ] + }, + { + "name": "o1-mini", + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "grok-3-reasoning", + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "gpt-5-chat-2025-08-07", + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "gpt-5-chat-2025-10-03", + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "gpt-audio", + "model_types": [ + "chat" + ] + }, + { + "name": "ERNIE-Character-8K", + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "kling-advanced-lip-sync", + "model_types": [ + "video_generation", + "video_understanding" + ] + }, + { + "name": "mj_describe", + "alias": [ + "mj-describe" + ], + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "happyhorse-1.0-video-edit", + "model_types": [ + "video_generation", + "video_understanding" + ] + }, + { + "name": "viduq3", + "model_types": [ + "video_generation" + ] + }, + { + "name": "grok-4.20-0309-non-reasoning", + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + }, + "max_tokens": 1000000, + "alias": [ + "xai/grok-4.20-non-reasoning", + "grok-4.20-non-reasoning", + "grok-4.20-non-reasoning-latest", + "grok-4.20-non-reasoning-gv2", + "grok-4.20-beta-0309-non-reasoning", + "grok-4.20-beta-non-reasoning", + "grok-4.20-beta-latest-non-reasoning", + "grok-4.20-experimental-beta-0304-non-reasoning", + "grok-4.20-experimental-beta-non-reasoning-latest", + "grok-4-20-non-reasoning" + ] + }, + { + "name": "ERNIE-Speed-128K", + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "gpt-4-vision-preview", + "model_types": [ + "chat", + "vision", + "image2text" + ] + }, + { + "name": "deepseek-r1-2025-01-20", + "model_types": [ + "chat" + ] + }, + { + "name": "grok-3-deepsearch", + "model_types": [ + "chat" + ] + }, + { + "name": "suno_uploads", + "alias": [ + "suno-uploads" + ], + "model_types": [ + "audio_generation" + ] + }, + { + "name": "pixverse-video", + "model_types": [ + "video_generation" + ] + }, + { + "name": "MiniMax-Hailuo-02", + "model_types": [ + "video_generation" + ] + }, + { + "name": "llama-3-sonar-large-32k-chat", + "model_types": [ + "chat" + ] + }, + { + "name": "gpt-5.1-chat-2025-11-13", + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "grok-imagine-image", + "model_types": [ + "text-to-image", + "image_generation", + "chat" + ], + "alias": [ + "grok/grok-imagine-image", + "xai/grok-imagine-image", + "grok-imagine-image-2026-03-02" + ] + }, + { + "name": "suno_upsample-tags", + "alias": [ + "suno-upsample-tags" + ], + "model_types": [ + "video_generation" + ] + }, + { + "name": "nvidia/nemotron-3-super-120b-a12b", + "alias": [ + "nemotron-3-super-120b-a12b" + ], + "model_types": [ + "chat" + ] + }, + { + "name": "canopylabs/orpheus-arabic-saudi", + "alias": [ + "orpheus-arabic-saudi" + ], + "max_tokens": 4000, + "max_completion_tokens": 50000, + "model_types": [ + "tts" + ] + }, + { + "name": "llama-3.1-8b-instant", + "max_tokens": 131072, + "max_completion_tokens": 131072, + "model_types": [ + "chat" + ] + }, + { + "name": "groq/compound", + "alias": [ + "compound" + ], + "max_tokens": 131072, + "max_completion_tokens": 8192, + "model_types": [ + "chat" + ] + }, + { + "name": "groq/compound-mini", + "alias": [ + "compound-mini" + ], + "max_tokens": 131072, + "max_completion_tokens": 8192, + "model_types": [ + "chat" + ] + }, + { + "name": "llama-3.3-70b-versatile", + "max_tokens": 131072, + "max_completion_tokens": 32768, + "model_types": [ + "chat" + ] + }, + { + "name": "canopylabs/orpheus-v1-english", + "alias": [ + "orpheus-v1-english" + ], + "max_tokens": 4000, + "max_completion_tokens": 50000, + "model_types": [ + "tts" + ] + }, + { + "name": "allam-2-7b", + "max_tokens": 4096, + "max_completion_tokens": 4096, + "model_types": [ + "chat" + ] + }, + { + "name": "baidu/cobuddy", + "alias": [ + "cobuddy" + ], + "max_tokens": 131072, + "max_completion_tokens": 65536, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "bunny", + "max_tokens": 262144, + "max_completion_tokens": 32768, + "model_types": [ + "chat" + ] + }, + { + "name": "zai-org/glm-4.7-h", + "alias": [ + "glm-4.7-h" + ], + "max_tokens": 204800, + "max_completion_tokens": 131072, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "paddlepaddle/paddleocr-vl", + "alias": [ + "paddleocr-vl" + ], + "max_tokens": 16384, + "max_completion_tokens": 16384, + "model_types": [ + "chat", + "vision", + "image2text", + "ocr" + ] + }, + { + "name": "kwaipilot/kat-coder-pro", + "alias": [ + "kat-coder-pro", + "Kat Coder Pro" + ], + "max_tokens": 256000, + "max_completion_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "nex-agi/nex-n2-pro", + "alias": [ + "nex-n2-pro" + ], + "max_tokens": 262144, + "max_completion_tokens": 262144, + "model_types": [ + "chat", + "vision", + "image2text" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "mistralai/mistral-nemo", + "alias": [ + "mistral-nemo", + "Mistral Nemo" + ], + "max_tokens": 60288, + "max_completion_tokens": 16000, + "model_types": [ + "chat" + ] + }, + { + "name": "meta-llama/llama-3-8b-instruct", + "alias": [ + "llama-3-8b-instruct", + "Llama 3 8B Instruct" + ], + "max_tokens": 8192, + "max_completion_tokens": 8192, + "model_types": [ + "chat" + ] + }, + { + "name": "meta-llama/llama-3-70b-instruct", + "alias": [ + "llama-3-70b-instruct", + "Llama3 70B Instruct" + ], + "max_tokens": 8192, + "max_completion_tokens": 8000, + "model_types": [ + "chat" + ] + }, + { + "name": "openchat/openchat-7b", + "alias": [ + "openchat-7b", + "OpenChat 7B" + ], + "max_tokens": 4096, + "max_completion_tokens": 4096, + "model_types": [ + "chat" + ] + }, + { + "name": "nousresearch/hermes-2-pro-llama-3-8b", + "alias": [ + "hermes-2-pro-llama-3-8b", + "Hermes 2 Pro Llama 3 8B" + ], + "max_tokens": 8192, + "max_completion_tokens": 8192, + "model_types": [ + "chat" + ] + }, + { + "name": "nousresearch/nous-hermes-llama2-13b", + "alias": [ + "nous-hermes-llama2-13b", + "Nous Hermes Llama2 13B" + ], + "max_tokens": 4096, + "max_completion_tokens": 32768, + "model_types": [ + "chat" + ] + }, + { + "name": "teknium/openhermes-2.5-mistral-7b", + "alias": [ + "openhermes-2.5-mistral-7b", + "Openhermes2.5 Mistral 7B" + ], + "max_tokens": 4096, + "max_completion_tokens": 8000, + "model_types": [ + "chat" + ] + }, + { + "name": "sao10k/l3-8b-lunaris", + "alias": [ + "l3-8b-lunaris", + "Sao10k L3 8B Lunaris" + ], + "max_tokens": 8192, + "max_completion_tokens": 8192, + "model_types": [ + "chat" + ] + }, + { + "name": "Sao10K/L3-8B-Stheno-v3.2", + "alias": [ + "L3-8B-Stheno-v3.2", + "L3 8B Stheno V3.2" + ], + "max_tokens": 8192, + "max_completion_tokens": 32000, + "model_types": [ + "chat" + ] + }, + { + "name": "inclusionai/ring-2.6-1t", + "alias": [ + "ring-2.6-1t" + ], + "max_tokens": 262144, + "max_completion_tokens": 65536, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "inclusionai/ling-2.6-flash", + "alias": [ + "ling-2.6-flash" + ], + "max_tokens": 262144, + "max_completion_tokens": 32768, + "model_types": [ + "chat" + ] + }, + { + "name": "inclusionai/ling-2.6-1t", + "alias": [ + "ling-2.6-1t" + ], + "max_tokens": 262144, + "max_completion_tokens": 32768, + "model_types": [ + "chat" + ] + }, + { + "name": "elephant", + "max_tokens": 262144, + "max_completion_tokens": 32768, + "model_types": [ + "chat" + ] + }, + { + "name": "ai_infer_test_3", + "max_tokens": 200000, + "max_completion_tokens": 200000, + "model_types": [ + "chat" + ] + }, + { + "name": "ai_infer_test_2", + "max_tokens": 200000, + "max_completion_tokens": 200000, + "model_types": [ + "chat" + ] + }, + { + "name": "ai_infer_test_1", + "max_tokens": 200000, + "max_completion_tokens": 200000, + "model_types": [ + "chat" + ] + }, + { + "name": "dev/glm46", + "alias": [ + "glm46" + ], + "max_tokens": 256000, + "max_completion_tokens": 256000, + "model_types": [ + "chat" + ] + }, + { + "name": "gt-4p", + "max_completion_tokens": 131072, + "model_types": [ + "chat", + "vision", + "image2text" + ] + }, + { + "name": "sao10k/l31-70b-euryale-v2.2", + "alias": [ + "l31-70b-euryale-v2.2", + "L31 70B Euryale V2.2" + ], + "max_tokens": 8192, + "max_completion_tokens": 8192, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "orcarouter/fusion", + "alias": [ + "fusion" + ], + "model_types": [ + "chat" + ] + }, + { + "name": "orcarouter/fusion-flash", + "alias": [ + "fusion-flash" + ], + "model_types": [ + "chat" + ] + }, + { + "name": "orcarouter/fusion-mini", + "alias": [ + "fusion-mini" + ], + "model_types": [ + "chat" + ] + }, + { + "name": "orcarouter/auto", + "alias": [ + "auto" + ], + "model_types": [ + "chat" + ] + }, + { + "name": "anthropic/claude-opus-4", + "alias": [ + "claude-opus-4" + ], + "model_types": [ + "chat" + ] + }, + { + "name": "anthropic/claude-opus-4.1", + "alias": [ + "claude-opus-4.1" + ], + "model_types": [ + "chat" + ] + }, + { + "name": "anthropic/claude-sonnet-4", + "alias": [ + "claude-sonnet-4" + ], + "model_types": [ + "chat" + ] + }, + { + "name": "byteplus/dreamina-seedance-2-0-260128", + "alias": [ + "dreamina-seedance-2-0-260128" + ], + "model_types": [ + "chat", + "video_generation" + ] + }, + { + "name": "kling/kling-v3", + "alias": [ + "kling-v3" + ], + "model_types": [ + "chat" + ] + }, + { + "name": "kling/kling-video-o1", + "alias": [ + "kling-video-o1" + ], + "model_types": [ + "chat" + ] + }, + { + "name": "openai/gpt-4o-mini-search-preview-2025-03-11", + "alias": [ + "gpt-4o-mini-search-preview-2025-03-11" + ], + "model_types": [ + "chat" + ] + }, + { + "name": "openai/gpt-4o-mini-tts-2025-03-20", + "alias": [ + "gpt-4o-mini-tts-2025-03-20" + ], + "model_types": [ + "chat" + ] + }, + { + "name": "openai/gpt-4o-search-preview-2025-03-11", + "alias": [ + "gpt-4o-search-preview-2025-03-11" + ], + "model_types": [ + "chat" + ] + }, + { + "name": "openai/gpt-5-search-api", + "alias": [ + "gpt-5-search-api" + ], + "model_types": [ + "chat" + ] + }, + { + "name": "openai/gpt-5-search-api-2025-10-14", + "alias": [ + "gpt-5-search-api-2025-10-14" + ], + "model_types": [ + "chat" + ] + }, + { + "name": "openai/gpt-5.5-2026-04-23", + "alias": [ + "gpt-5.5-2026-04-23" + ], + "model_types": [ + "chat" + ] + }, + { + "name": "openai/gpt-5.5-pro", + "alias": [ + "gpt-5.5-pro" + ], + "model_types": [ + "chat" + ] + }, + { + "name": "openai/gpt-5.5-pro-2026-04-23", + "alias": [ + "gpt-5.5-pro-2026-04-23" + ], + "model_types": [ + "chat" + ] + }, + { + "name": "minimax/minimax-m2.1-h", + "alias": [ + "minimax-m2.1-h" + ], + "max_tokens": 204800, + "max_completion_tokens": 131072, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "ppio-4b", + "alias": [ + "PPIO 4B" + ], + "max_tokens": 128000, + "max_completion_tokens": 8192, + "model_types": [ + "chat" + ] + }, + { + "name": "baidu/ernie-5.0-thinking-exp", + "alias": [ + "ernie-5.0-thinking-exp", + "Ernie 5.0 Thinking Exp" + ], + "max_tokens": 183000, + "max_completion_tokens": 64000, + "model_types": [ + "chat", + "vision", + "image2text" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "kwaipilot/kat-dev-72b-exp", + "alias": [ + "kat-dev-72b-exp" + ], + "max_tokens": 131072, + "max_completion_tokens": 65536, + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/nemotron-3-ultra-550b-a55b", + "alias": [ + "nemotron-3-ultra-550b-a55b", + "NVIDIA Nemotron 3 Ultra 550B A55B NVFP4" + ], + "max_tokens": 512288, + "model_types": [ + "chat" + ] + }, + { + "name": "pearl-ai/gemma-4-31b-it", + "alias": [ + "Pearl-ai Gemma-4-31B-it-pearl" + ], + "max_tokens": 262144, + "model_types": [ + "chat", + "vision", + "image2text" + ] + }, + { + "name": "Qwen/Qwen3-235B-A22B-Instruct-2507-tput", + "alias": [ + "Qwen3-235B-A22B-Instruct-2507-tput", + "Qwen3 235B A22B Instruct 2507 FP8 Throughput" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "Qwen/Qwen2.5-7B-Instruct-Turbo", + "alias": [ + "Qwen2.5-7B-Instruct-Turbo", + "Qwen2.5 7B Instruct Turbo" + ], + "max_tokens": 32768, + "model_types": [ + "chat" + ] + }, + { + "name": "meta-llama/Meta-Llama-3-8B-Instruct-Lite", + "alias": [ + "Meta-Llama-3-8B-Instruct-Lite", + "Meta Llama 3 8B Instruct Lite" + ], + "max_tokens": 8192, + "model_types": [ + "chat" + ] + }, + { + "name": "black-forest-labs/FLUX.1-kontext-max", + "alias": [ + "FLUX.1-kontext-max", + "FLUX.1 Kontext [max]" + ], + "model_types": [ + "image", + "image_edit" + ] + }, + { + "name": "black-forest-labs/FLUX.2-flex", + "alias": [ + "FLUX.2-flex", + "FLUX.2 [flex]" + ], + "model_types": [ + "image", + "image_edit" + ] + }, + { + "name": "black-forest-labs/FLUX.1.1-pro", + "alias": [ + "FLUX.1.1-pro", + "FLUX1.1 [pro]" + ], + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "arize-ai/qwen-2-1.5b-instruct", + "alias": [ + "qwen-2-1.5b-instruct", + "Arize AI Qwen 2 1.5B Instruct" + ], + "max_tokens": 32768, + "model_types": [ + "chat" + ] + }, + { + "name": "LiquidAI/LFM2-24B-A2B", + "alias": [ + "LFM2-24B-A2B" + ], + "max_tokens": 32768, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "essentialai/rnj-1-instruct", + "alias": [ + "rnj-1-instruct", + "EssentialAI Rnj-1 Instruct" + ], + "max_tokens": 32768, + "model_types": [ + "chat" + ] + }, + { + "name": "kwaivgI/kling-1.6-pro", + "alias": [ + "kling-1.6-pro", + "Kling 1.6 Pro" + ], + "model_types": [ + "video_generation" + ] + }, + { + "name": "Wan-AI/Wan2.6-image", + "alias": [ + "Wan2.6-image", + "Wan 2.6 Image" + ], + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "vidu/vidu-q1", + "alias": [ + "vidu-q1", + "Vidu Q1" + ], + "model_types": [ + "video_generation" + ] + }, + { + "name": "cartesia/sonic", + "alias": [ + "sonic", + "Cartesia Sonic" + ], + "model_types": [ + "tts" + ] + }, + { + "name": "ByteDance-Seed/Seedream-3.0", + "alias": [ + "Seedream-3.0", + "ByteDance Seedream 3.0" + ], + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "ByteDance-Seed/Seedream-4.0", + "alias": [ + "Seedream-4.0", + "ByteDance Seedream 4.0" + ], + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "kwaivgI/kling-2.1-master", + "alias": [ + "kling-2.1-master", + "Kling 2.1 Master" + ], + "model_types": [ + "video_generation" + ] + }, + { + "name": "ideogram/ideogram-3.0", + "alias": [ + "ideogram-3.0", + "Ideogram 3.0" + ], + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "kwaivgI/kling-2.1-pro", + "alias": [ + "kling-2.1-pro", + "Kling 2.1 Pro" + ], + "model_types": [ + "video_generation" + ] + }, + { + "name": "Wan-AI/Wan2.2-I2V-A14B", + "alias": [ + "Wan2.2-I2V-A14B", + "Wan 2.2 I2V" + ], + "model_types": [ + "video_generation" + ] + }, + { + "name": "kwaivgI/kling-2.0-master", + "alias": [ + "kling-2.0-master", + "Kling 2.0 Master" + ], + "model_types": [ + "video_generation" + ] + }, + { + "name": "kwaivgI/kling-2.1-standard", + "alias": [ + "kling-2.1-standard", + "Kling 2.1 Standard" + ], + "model_types": [ + "video_generation" + ] + }, + { + "name": "vidu/vidu-2.0", + "alias": [ + "vidu-2.0", + "Vidu 2.0" + ], + "model_types": [ + "video_generation" + ] + }, + { + "name": "openai/sora-2-pro", + "alias": [ + "sora-2-pro", + "Sora 2 Pro" + ], + "model_types": [ + "video_generation" + ] + }, + { + "name": "pixverse/pixverse-v5", + "alias": [ + "pixverse-v5", + "PixVerse v5" + ], + "model_types": [ + "video_generation" + ] + }, + { + "name": "stabilityai/stable-diffusion-xl-base-1.0", + "alias": [ + "stable-diffusion-xl-base-1.0", + "SD XL" + ], + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "ByteDance/Seedance-1.0-lite", + "alias": [ + "Seedance-1.0-lite", + "ByteDance Seedance 1.0 Lite" + ], + "model_types": [ + "video_generation" + ] + }, + { + "name": "cartesia/sonic-3", + "alias": [ + "sonic-3", + "Cartesia Sonic 3" + ], + "max_tokens": 448, + "model_types": [ + "tts" + ] + }, + { + "name": "ByteDance/Seedance-1.0-pro", + "alias": [ + "Seedance-1.0-pro", + "ByteDance Seedance 1.0 Pro" + ], + "model_types": [ + "video_generation" + ] + }, + { + "name": "HiDream-ai/HiDream-I1-Fast", + "alias": [ + "HiDream-I1-Fast" + ], + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "stabilityai/stable-diffusion-3-medium", + "alias": [ + "stable-diffusion-3-medium", + "Stable Diffusion 3" + ], + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "minimax/hailuo-02", + "alias": [ + "hailuo-02", + "MiniMax Hailuo 02" + ], + "model_types": [ + "video_generation" + ] + }, + { + "name": "RunDiffusion/Juggernaut-pro-flux", + "alias": [ + "Juggernaut-pro-flux", + "Juggernaut Pro Flux by RunDiffusion 1.0.0" + ], + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "HiDream-ai/HiDream-I1-Dev", + "alias": [ + "HiDream-I1-Dev" + ], + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "Lykon/DreamShaper", + "alias": [ + "DreamShaper" + ], + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "HiDream-ai/HiDream-I1-Full", + "alias": [ + "HiDream-I1-Full" + ], + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "kwaivgI/kling-1.6-standard", + "alias": [ + "kling-1.6-standard", + "Kling 1.6 Standard" + ], + "model_types": [ + "video_generation" + ] + }, + { + "name": "minimax/video-01-director", + "alias": [ + "video-01-director", + "MiniMax 01 Director" + ], + "model_types": [ + "video_generation" + ] + }, + { + "name": "cartesia/sonic-2", + "alias": [ + "sonic-2", + "Cartesia Sonic 2" + ], + "max_tokens": 448, + "model_types": [ + "tts" + ] + }, + { + "name": "pixverse/pixverse-v5.6", + "alias": [ + "pixverse-v5.6", + "PixVerse v5.6" + ], + "model_types": [ + "video_generation" + ] + }, + { + "name": "Wan-AI/wan2.7-t2v", + "alias": [ + "wan2.7-t2v", + "Wan 2.7 T2V" + ], + "model_types": [ + "video_generation" + ] + }, + { + "name": "vidu/vidu-q3", + "alias": [ + "vidu-q3", + "Vidu Q3" + ], + "model_types": [ + "video_generation" + ] + }, + { + "name": "vidu/vidu-q3-turbo", + "alias": [ + "vidu-q3-turbo", + "Vidu Q3 Turbo" + ], + "model_types": [ + "video_generation" + ] + }, + { + "name": "deepcogito/cogito-v2-1-671b", + "alias": [ + "cogito-v2-1-671b", + "Cogito v2.1 671B" + ], + "max_tokens": 163840, + "model_types": [ + "chat" + ] + }, + { + "name": "pixverse/pixverse-v6", + "alias": [ + "pixverse-v6", + "PixVerse v6" + ], + "model_types": [ + "video_generation" + ] + }, + { + "name": "ByteDance/Seedream-5.0-lite", + "alias": [ + "Seedream-5.0-lite", + "ByteDance Seedream 5.0 Lite" + ], + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "nvidia/nemotron-3-asr-streaming-0.6b", + "alias": [ + "nemotron-3-asr-streaming-0.6b", + "Nvidia Nemotron 3 ASR Streaming 0.6B" + ], + "max_tokens": 448, + "model_types": [ + "asr", + "speech2text" + ] + }, + { + "name": "ideogram/ideogram-4.0", + "alias": [ + "ideogram-4.0", + "Ideogram 4.0" + ], + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "facebook/cwm", + "alias": [ + "cwm", + "Facebook CWM" + ], + "max_tokens": 131072, + "model_types": [ + "chat" + ] + }, + { + "name": "deepgram/aura-2", + "alias": [ + "aura-2", + "Deepgram Aura 2" + ], + "max_tokens": 448, + "model_types": [ + "audio_generation" + ] + }, + { + "name": "nim/nv-mistralai/mistral-nemo-12b-instruct", + "alias": [ + "mistral-nemo-12b-instruct" + ], + "max_tokens": 16384, + "model_types": [ + "chat" + ] + }, + { + "name": "arcee-ai/trinity-mini", + "alias": [ + "trinity-mini", + "Trinity Mini" + ], + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "meta-llama/Meta-Llama-3-70B-Instruct-Turbo", + "alias": [ + "Meta-Llama-3-70B-Instruct-Turbo", + "Meta Llama 3 70B Instruct Turbo" + ], + "max_tokens": 8192, + "model_types": [ + "chat" + ] + }, + { + "name": "rime-labs/rime-arcana-v2", + "alias": [ + "rime-arcana-v2", + "Rime Labs Arcana v2" + ], + "model_types": [ + "audio_generation" + ] + }, + { + "name": "rime-labs/rime-arcana-v3", + "alias": [ + "rime-arcana-v3", + "Rime Labs Arcana v3" + ], + "model_types": [ + "audio_generation" + ] + }, + { + "name": "allenai/Molmo-7B-D-0924", + "alias": [ + "Molmo-7B-D-0924", + "Molmo 7B D 0924" + ], + "max_tokens": 4096, + "model_types": [ + "chat" + ] + }, + { + "name": "zai-org/GLM-4.7-fp4", + "alias": [ + "GLM-4.7-fp4", + "GLM 4.7 FP4" + ], + "max_tokens": 202752, + "model_types": [ + "chat" + ] + }, + { + "name": "Hcompany/Holo3-35B-A3B", + "alias": [ + "Holo3-35B-A3B", + "Holo3 35B A3b" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "meta-llama/Llama-4-Scout-17B-16E-Instruct-FP8-Lora", + "alias": [ + "Llama-4-Scout-17B-16E-Instruct-FP8-Lora", + "Llama 4 Scout 17B 16E Instruct Fp8 Lora" + ], + "max_tokens": 10485760, + "model_types": [ + "chat", + "vision", + "image2text" + ] + }, + { + "name": "deepgram/nova-3-en", + "alias": [ + "nova-3-en", + "Deepgram Nova 3" + ], + "max_tokens": 448, + "model_types": [ + "asr", + "speech2text" + ] + }, + { + "name": "deepcogito/cogito-v1-preview-llama-70B", + "alias": [ + "cogito-v1-preview-llama-70B", + "Cogito V1 Preview Llama 70B" + ], + "max_tokens": 131072, + "model_types": [ + "chat" + ] + }, + { + "name": "deepcogito/cogito-v1-preview-llama-70B-Turbo", + "alias": [ + "cogito-v1-preview-llama-70B-Turbo", + "Cogito V1 Preview Llama 70B Turbo" + ], + "max_tokens": 131072, + "model_types": [ + "chat" + ] + }, + { + "name": "rime-labs/rime-arcana-v3-turbo", + "alias": [ + "rime-arcana-v3-turbo", + "Rime Labs Arcana v3 Turbo" + ], + "max_tokens": 448, + "model_types": [ + "audio_generation" + ] + }, + { + "name": "deepcogito/cogito-v1-preview-llama-8B", + "alias": [ + "cogito-v1-preview-llama-8B", + "Cogito V1 Preview Llama 8B" + ], + "max_tokens": 131072, + "model_types": [ + "chat" + ] + }, + { + "name": "deepcogito/cogito-v1-preview-qwen-14B", + "alias": [ + "cogito-v1-preview-qwen-14B", + "Cogito V1 Preview Qwen 14B" + ], + "max_tokens": 131072, + "model_types": [ + "chat" + ] + }, + { + "name": "deepcogito/cogito-v1-preview-qwen-32B", + "alias": [ + "cogito-v1-preview-qwen-32B", + "Cogito V1 Preview Qwen 32B" + ], + "max_tokens": 131072, + "model_types": [ + "chat" + ] + }, + { + "name": "deepgram/nova-3-multi", + "alias": [ + "nova-3-multi", + "Deepgram Nova 3 Multilingual" + ], + "max_tokens": 448, + "model_types": [ + "asr", + "speech2text" + ] + }, + { + "name": "mistralai/Mixtral-8x7B-Instruct-v0.1-FP8-Lora", + "alias": [ + "Mixtral-8x7B-Instruct-v0.1-FP8-Lora", + "Mixtral 8x7B Instruct V0.1 FP8 Lora" + ], + "max_tokens": 32768, + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/NVIDIA-Nemotron-3-Super-120B-A12B-FP8", + "alias": [ + "NVIDIA-Nemotron-3-Super-120B-A12B-FP8", + "Nvidia Nemotron 3 Super 120B A12b Fp8" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "agentica-org/DeepCoder-14B-Preview", + "alias": [ + "DeepCoder-14B-Preview", + "Deepcoder 14B Preview" + ], + "max_tokens": 131072, + "model_types": [ + "chat" + ] + }, + { + "name": "mixedbread-ai/mxbai-rerank-large-v2", + "alias": [ + "mxbai-rerank-large-v2", + "Mxbai Rerank Large V2" + ], + "max_tokens": 32768, + "model_types": [ + "rerank" + ] + }, + { + "name": "nvidia/nemotron-3-nano-omni-30b-a3b-reasoning-fp8", + "alias": [ + "nemotron-3-nano-omni-30b-a3b-reasoning-fp8", + "Nemotron 3 Nano Omni 30B A3b Reasoning Fp8" + ], + "max_tokens": 131072, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "MiniMaxAI/MiniMax-M2.5-FP4", + "alias": [ + "MiniMax-M2.5-FP4", + "MiniMax M2.5 FP4" + ], + "max_tokens": 8192, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "togethercomputer/meta-llama-3.1-8B-Instruct-AWQ-INT4", + "alias": [ + "meta-llama-3.1-8B-Instruct-AWQ-INT4", + "Meta Llama 3.1 8B Instruct Awq Int4" + ], + "max_tokens": 131072, + "model_types": [ + "chat" + ] + }, + { + "name": "Qwen/Qwen3-30B-A3B-Instruct-2507-Lora", + "alias": [ + "Qwen3-30B-A3B-Instruct-2507-Lora", + "Qwen3 30B A3B Instruct 2507 Lora" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "Qwen/Qwen3-8B-Lora", + "alias": [ + "Qwen3-8B-Lora", + "Qwen3 8B Lora" + ], + "max_tokens": 40960, + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/Llama-3.1-Nemotron-70B-Instruct-HF", + "alias": [ + "Llama-3.1-Nemotron-70B-Instruct-HF", + "Llama 3.1 Nemotron 70B Instruct HF" + ], + "max_tokens": 32768, + "model_types": [ + "chat" + ] + }, + { + "name": "rime-labs/rime-mist-v2", + "alias": [ + "rime-mist-v2", + "Rime Labs Mist v2" + ], + "model_types": [ + "audio_generation" + ] + }, + { + "name": "sarvamai/sarvam-m", + "alias": [ + "sarvam-m", + "Sarvam M" + ], + "max_tokens": 32768, + "model_types": [ + "chat" + ] + }, + { + "name": "togethercomputer/EssentialAI-RNJ-1-Instruct", + "alias": [ + "EssentialAI-RNJ-1-Instruct" + ], + "max_tokens": 32768, + "model_types": [ + "chat" + ] + }, + { + "name": "meta-llama/Meta-Llama-3.1-8B", + "alias": [ + "Meta-Llama-3.1-8B", + "Meta Llama 3.1 8B" + ], + "max_tokens": 16384, + "model_types": [ + "chat" + ] + }, + { + "name": "meta-llama/Llama-3.3-70B-Instruct-FP8-Lora", + "alias": [ + "Llama-3.3-70B-Instruct-FP8-Lora", + "Llama 3.3 70B Instruct FP8 Lora" + ], + "max_tokens": 131072, + "model_types": [ + "chat" + ] + }, + { + "name": "nim/nvidia/llama-3.3-nemotron-super-49b-v1", + "alias": [ + "llama-3.3-nemotron-super-49b-v1" + ], + "max_tokens": 16384, + "model_types": [ + "chat" + ] + }, + { + "name": "Qwen/Qwen2.5-72B-Instruct-Turbo", + "alias": [ + "Qwen2.5-72B-Instruct-Turbo", + "Qwen2.5 72B Instruct Turbo" + ], + "max_tokens": 131072, + "model_types": [ + "chat" + ] + }, + { + "name": "Salesforce/Llama-Rank-V1", + "alias": [ + "Llama-Rank-V1", + "Salesforce Llama Rank V1 (8B)" + ], + "max_tokens": 8192, + "model_types": [ + "rerank" + ] + }, + { + "name": "zai-org/GLM-5-FP4", + "alias": [ + "GLM-5-FP4" + ], + "max_tokens": 202752, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "meta-llama/Llama-3-8b-chat-hf", + "alias": [ + "Llama-3-8b-chat-hf", + "Meta Llama 3 8B Instruct Reference" + ], + "max_tokens": 8192, + "model_types": [ + "chat" + ] + }, + { + "name": "mistralai/Magistral-Small-2506", + "alias": [ + "Magistral-Small-2506", + "Magistral Small 2506" + ], + "max_tokens": 40960, + "model_types": [ + "chat" + ] + }, + { + "name": "mistralai/Mistral-7B-v0.1", + "alias": [ + "Mistral-7B-v0.1", + "Mistral 7B v0.1" + ], + "max_tokens": 32768, + "model_types": [ + "chat" + ] + }, + { + "name": "meta-llama/Meta-Llama-3.1-70B", + "alias": [ + "Meta-Llama-3.1-70B", + "Llama 3.1 70B" + ], + "max_tokens": 131072, + "model_types": [ + "chat" + ] + }, + { + "name": "nim/mistralai/mixtral-8x22b-instruct-v01", + "alias": [ + "mixtral-8x22b-instruct-v01" + ], + "max_tokens": 16384, + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/NVIDIA-Nemotron-3-Super-120B-A12B-BF16", + "alias": [ + "NVIDIA-Nemotron-3-Super-120B-A12B-BF16", + "Nvidia Nemotron 3 Super 120B A12b Bf16" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "rime-labs/rime-mist-v3", + "alias": [ + "rime-mist-v3", + "Rime Labs Mist v3" + ], + "max_tokens": 448, + "model_types": [ + "audio_generation" + ] + }, + { + "name": "mistralai/Mixtral-8x7B-v0.1", + "alias": [ + "Mixtral-8x7B-v0.1", + "Mixtral 8X7b V0.1" + ], + "max_tokens": 32768, + "model_types": [ + "chat" + ] + }, + { + "name": "rime-labs/rime-mist-v3-omni", + "alias": [ + "rime-mist-v3-omni", + "Rime Labs Mist v3 Omni" + ], + "max_tokens": 448, + "model_types": [ + "audio_generation" + ] + }, + { + "name": "moonshotai/Kimi-K2.5-fp4", + "alias": [ + "Kimi-K2.5-fp4", + "Kimi K2.5 Fp4" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP4", + "alias": [ + "Llama-4-Maverick-17B-128E-Instruct-FP4", + "Llama 4 Maverick 17B 128E Instruct Nvfp4" + ], + "max_tokens": 1048576, + "model_types": [ + "chat", + "vision", + "image2text" + ] + }, + { + "name": "NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO", + "alias": [ + "Nous-Hermes-2-Mixtral-8x7B-DPO", + "Nous Hermes 2 Mixtral 8X7B Dpo" + ], + "max_tokens": 32768, + "model_types": [ + "chat" + ] + }, + { + "name": "Qwen/Qwen3.5-35B-A3B-Lora", + "alias": [ + "Qwen3.5-35B-A3B-Lora", + "Qwen3.5 35B A3b LoRa" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "Qwen/Qwen3.5-9B-FP8", + "alias": [ + "Qwen3.5-9B-FP8" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "mistralai/Ministral-3-14B-Instruct-2512", + "alias": [ + "Ministral-3-14B-Instruct-2512", + "Ministral 3 14B Instruct 2512" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "nim/mistralai/mixtral-8x7b-instruct-v01", + "alias": [ + "mixtral-8x7b-instruct-v01" + ], + "max_tokens": 16384, + "model_types": [ + "chat" + ] + }, + { + "name": "doubao-lite-128k-240428", + "alias": [ + "doubao-lite-128k", + "doubao-lite-128k-240828" + ], + "model_types": [ + "chat" + ], + "max_tokens": 131072, + "max_completion_tokens": 4096 + }, + { + "name": "doubao-lite-4k-240328", + "alias": [ + "doubao-lite-4k", + "doubao-lite-4k-character-240515", + "doubao-lite-4k-pretrain-character-240516", + "doubao-lite-4k-character-240828" + ], + "model_types": [ + "chat" + ], + "max_tokens": 4096, + "max_completion_tokens": 4096 + }, + { + "name": "doubao-lite-32k-240428", + "alias": [ + "doubao-lite-32k", + "doubao-lite-32k-240628", + "doubao-lite-32k-240828", + "doubao-lite-32k-character-241015", + "doubao-lite-32k-character-250228" + ], + "model_types": [ + "chat" + ], + "max_tokens": 32768, + "max_completion_tokens": 4096 + }, + { + "name": "doubao-pro-4k-240515", + "alias": [ + "doubao-pro-4k", + "doubao-pro-4k-character-240515", + "doubao-pro-4k-functioncall-240515", + "doubao-pro-4k-browsing-240524", + "doubao-pro-4k-functioncall-240615", + "doubao-pro-4k-character-240728" + ], + "model_types": [ + "chat" + ] + }, + { + "name": "doubao-embedding-text-240515", + "alias": [ + "doubao-embedding", + "doubao-embedding-text-240715" + ], + "model_types": [ + "embedding" + ] + }, + { + "name": "doubao-embedding-large-text-240915", + "alias": [ + "doubao-embedding-large", + "doubao-embedding-large-text-250515" + ], + "max_tokens": 4096, + "model_types": [ + "embedding" + ] + }, + { + "name": "doubao-seaweed-241128", + "alias": [ + "doubao-seaweed" + ], + "model_types": [ + "video_generation" + ] + }, + { + "name": "doubao-pro-256k-241115", + "alias": [ + "doubao-pro-256k" + ], + "model_types": [ + "chat" + ] + }, + { + "name": "doubao-1-5-lite-32k-250115", + "alias": [ + "doubao-1-5-lite-32k" + ], + "max_tokens": 32768, + "max_completion_tokens": 12288, + "model_types": [ + "chat" + ] + }, + { + "name": "doubao-1-5-pro-32k-250115", + "alias": [ + "doubao-1-5-pro-32k", + "doubao-1-5-pro-32k-character-250228", + "doubao-1-5-pro-32k-character-250715" + ], + "max_tokens": 131072, + "max_completion_tokens": 12288, + "model_types": [ + "chat" + ] + }, + { + "name": "doubao-1-5-vision-pro-32k-250115", + "alias": [ + "doubao-1-5-vision-pro-32k" + ], + "max_tokens": 32768, + "max_completion_tokens": 12288, + "model_types": [ + "chat", + "vision", + "image2text" + ] + }, + { + "name": "doubao-embedding-vision-241215", + "alias": [ + "doubao-embedding-vision", + "doubao-embedding-vision-250328", + "doubao-embedding-vision-250615", + "doubao-embedding-vision-251215" + ], + "model_types": [ + "embedding" + ], + "max_tokens": 131072 + }, + { + "name": "doubao-1-5-pro-256k-250115", + "alias": [ + "doubao-1-5-pro-256k" + ], + "max_tokens": 262144, + "max_completion_tokens": 12288, + "model_types": [ + "chat" + ] + }, + { + "name": "wan2-1-14b-i2v-250225", + "alias": [ + "wan2-1-14b", + "wan2-1-14b-t2v-250225", + "wan2-1-14b-flf2v-250417" + ], + "model_types": [ + "video_generation" + ] + }, + { + "name": "glm-4-5-air-20250728", + "alias": [ + "glm-4-5-air" + ], + "model_types": [ + "chat" + ] + }, + { + "name": "qwen2-5-72b-20240919", + "alias": [ + "qwen2-5-72b" + ], + "model_types": [ + "chat" + ] + }, + { + "name": "doubao-seed-translation-250915", + "alias": [ + "doubao-seed-translation" + ], + "max_tokens": 4096, + "max_completion_tokens": 3072, + "model_types": [ + "chat" + ] + }, + { + "name": "doubao-smart-router-250928", + "alias": [ + "doubao-smart-router" + ], + "model_types": [ + "chat" + ] + }, + { + "name": "doubao-seed-1-6-lite-251015", + "alias": [ + "doubao-seed-1-6-lite" + ], + "max_tokens": 262144, + "max_completion_tokens": 65536, + "model_types": [ + "chat", + "vision", + "image2text" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "doubao-seed3d-1-0-250928", + "alias": [ + "doubao-seed3d-1-0" + ], + "model_types": [ + "3d_generation" + ] + }, + { + "name": "qwen3-0-6b-20250429", + "alias": [ + "qwen3-0-6b" + ], + "model_types": [ + "chat" + ] + }, + { + "name": "glm-4-7-251222", + "alias": [ + "glm-4-7" + ], + "max_tokens": 204800, + "max_completion_tokens": 131072, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "doubao-seed-1-8-251228", + "alias": [ + "doubao-seed-1-8" + ], + "max_tokens": 262144, + "max_completion_tokens": 65536, + "model_types": [ + "chat", + "vision", + "image2text" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "doubao-seed-character-251128", + "alias": [ + "doubao-seed-character" + ], + "max_tokens": 131072, + "max_completion_tokens": 32768, + "model_types": [ + "chat" + ] + }, + { + "name": "hyper3d-gen2-260112", + "alias": [ + "hyper3d-gen2" + ], + "model_types": [ + "3d_generation" + ] + }, + { + "name": "hitem3d-2-0-251223", + "alias": [ + "hitem3d-2-0" + ], + "model_types": [ + "3d_generation" + ] + }, + { + "name": "doubao-seed3d-2-0-260328", + "alias": [ + "doubao-seed3d-2-0" + ], + "model_types": [ + "3d_generation" + ] + }, + { + "name": "solar-mini", + "model_types": [ + "chat" + ], + "alias": [ + "solar-mini-250422" + ] + }, + { + "name": "solar-pro2", + "model_types": [ + "chat" + ], + "alias": [ + "solar-pro2-251215" + ] + }, + { + "name": "solar-pro3", + "model_types": [ + "chat" + ], + "alias": [ + "solar-pro3-260323" + ] + }, + { + "name": "syn-pro", + "model_types": [ + "chat" + ], + "alias": [ + "syn-pro-251021" + ] + }, + { + "name": "step-tts-2", + "model_types": [ + "tts" + ] + }, + { + "name": "stepaudio-2.5-tts", + "model_types": [ + "tts" + ] + }, + { + "name": "stepaudio-2.5-asr", + "model_types": [ + "asr", + "speech2text" + ] + }, + { + "name": "step-image-edit-2", + "model_types": [ + "image", + "image_edit" + ] + }, + { + "name": "animate-anyone-detect-gen2", + "model_types": [ + "video_generation" + ] + }, + { + "name": "animate-anyone-gen2", + "model_types": [ + "video_generation" + ] + }, + { + "name": "animate-anyone-template-gen2", + "model_types": [ + "video_generation" + ] + }, + { + "name": "claude-opus-4.6-fast", + "model_types": [ + "chat" + ] + }, + { + "name": "claude-opus-4.7-fast", + "model_types": [ + "chat" + ] + }, + { + "name": "claude-opus-4.8-fast", + "model_types": [ + "chat" + ] + }, + { + "name": "doubao-seed-1.6-250615", + "model_types": [ + "chat" + ] + }, + { + "name": "dreamina-seedance-2-0-fast-260128", + "model_types": [ + "video_generation" + ] + }, + { + "name": "emo-detect-v1", + "model_types": [ + "video_generation" + ] + }, + { + "name": "emo-v1", + "model_types": [ + "video_generation" + ] + }, + { + "name": "fun-asr", + "model_types": [ + "asr", + "speech2text" + ] + }, + { + "name": "fun-asr-flash-8k-realtime", + "model_types": [ + "asr", + "speech2text" + ] + }, + { + "name": "fun-asr-mtl", + "model_types": [ + "asr", + "speech2text" + ] + }, + { + "name": "fun-asr-mtl-realtime", + "model_types": [ + "asr", + "speech2text" + ] + }, + { + "name": "fun-asr-realtime", + "model_types": [ + "asr", + "speech2text" + ] + }, + { + "name": "gpt-5.4-image-2", + "model_types": [ + "chat", + "vision", + "image2text" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "gpt-5-image", + "model_types": [ + "chat", + "vision", + "image2text" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "gpt-5-image-mini", + "model_types": [ + "chat", + "vision", + "image2text" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "gpt-oss-120b-250805", + "model_types": [ + "chat" + ] + }, + { + "name": "JIUTIAN-75B-32K", + "model_types": [ + "chat" + ] + }, + { + "name": "JIUTIAN-75B-8K-Chat", + "model_types": [ + "chat" + ] + }, + { + "name": "Kling-3.0", + "model_types": [ + "video_generation" + ] + }, + { + "name": "Kling-3.0-Omni", + "model_types": [ + "video_generation" + ] + }, + { + "name": "Kling-O1", + "model_types": [ + "video_generation" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "liveportrait", + "model_types": [ + "video_generation" + ] + }, + { + "name": "liveportrait-detect", + "model_types": [ + "video_generation" + ] + }, + { + "name": "paraformer-8k-v2", + "model_types": [ + "asr", + "speech2text" + ] + }, + { + "name": "paraformer-realtime-8k-v2", + "model_types": [ + "asr", + "speech2text" + ] + }, + { + "name": "paraformer-realtime-v2", + "model_types": [ + "asr", + "speech2text" + ] + }, + { + "name": "paraformer-v2", + "model_types": [ + "asr", + "speech2text" + ] + }, + { + "name": "qwen-flash-character", + "model_types": [ + "chat" + ] + }, + { + "name": "seed-1-8-251228", + "model_types": [ + "chat" + ] + }, + { + "name": "seed-2-0-code-preview-260328", + "model_types": [ + "chat" + ] + }, + { + "name": "seed-2-0-lite-260228", + "model_types": [ + "chat" + ] + }, + { + "name": "seed-2-0-lite-260428", + "model_types": [ + "chat" + ] + }, + { + "name": "seed-2-0-mini-260215", + "model_types": [ + "chat" + ] + }, + { + "name": "seed-2-0-mini-260428", + "model_types": [ + "chat" + ] + }, + { + "name": "seed-2-0-pro-260328", + "model_types": [ + "chat" + ] + }, + { + "name": "seedance-1-0-pro-250528", + "model_types": [ + "video_generation" + ] + }, + { + "name": "seedance-1-0-pro-fast-251015", + "model_types": [ + "video_generation" + ] + }, + { + "name": "seedance-1-5-pro-251215", + "model_types": [ + "video_generation" + ] + }, + { + "name": "Seedance 2.0", + "model_types": [ + "video_generation" + ] + }, + { + "name": "seedream-4-0-250828", + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "seedream-4-5-251128", + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "seedream-5-0-lite-260128", + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "wan2.2-animate-mix", + "model_types": [ + "video_generation" + ] + }, + { + "name": "wan2.2-animate-move", + "model_types": [ + "video_generation" + ] + }, + { + "name": "wan2.2-kf2v-flash", + "model_types": [ + "video_generation" + ] + }, + { + "name": "wan2.2-t2v-plus", + "model_types": [ + "video_generation" + ] + }, + { + "name": "wan2.5-i2i-preview", + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "wan2.6-i2v-flash", + "model_types": [ + "video_generation" + ] + }, + { + "name": "wan2.6-i2v-us", + "model_types": [ + "video_generation" + ] + }, + { + "name": "wan2.6-r2v", + "model_types": [ + "video_generation" + ] + }, + { + "name": "wan2.6-r2v-flash", + "model_types": [ + "video_generation" + ] + }, + { + "name": "wan2.7-image", + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "wan2.7-videoedit", + "model_types": [ + "video_generation" + ] + }, + { + "name": "wanx2.0-t2i-turbo", + "model_types": [ + "text-to-image", + "image_generation" + ] + }, + { + "name": "tokenhub-chat-test", + "model_types": [ + "chat" + ] + }, + { + "name": "grok-imagine-video", + "model_types": [ + "video_generation" + ], + "alias": [ + "xai/grok-imagine-video" + ] + }, + { + "name": "grok-imagine-video-1.5-preview", + "model_types": [ + "video_generation" + ], + "alias": [ + "xai/grok-imagine-video-1.5-preview", + "grok-imagine-video-1.5-2026-05-30" + ] + }, + { + "name": "grok-4.20-multi-agent-0309", + "max_tokens": 1000000, + "thinking": { + "default_value": true, + "clear_thinking": true + }, + "model_types": [ + "chat" + ], + "alias": [ + "xai/grok-4.20-multi-agent", + "grok-4.20-multi-agent", + "grok-4.20-multi-agent-latest", + "grok-4.20-multi-agent-beta-0309", + "grok-4.20-multi-agent-beta-latest", + "grok-4.20-multi-agent-experimental-beta-0304", + "grok-4.20-multi-agent-experimental-beta-latest" + ] } ] }