diff --git a/conf/all_models.json b/conf/all_models.json index 3710d26488..9c7389a154 100644 --- a/conf/all_models.json +++ b/conf/all_models.json @@ -7,7 +7,7 @@ "Embedding-3" ], "max_tokens": 8192, - "dimension": 2048, + "max_dimension": 2048, "dimensions": [ 256, 512, @@ -25,7 +25,7 @@ "Embedding-2" ], "max_tokens": 8192, - "dimension": 1024, + "max_dimension": 1024, "model_types": [ "embedding" ] @@ -3898,7 +3898,7 @@ "model_types": [ "embedding" ], - "dimension": 2560, + "max_dimension": 2560, "dimensions": [ 2560, 2048, @@ -5576,7 +5576,7 @@ "qwen3-vl-embedding-2b" ], "max_tokens": 32768, - "dimension": 2048, + "max_dimension": 2048, "model_types": [ "embedding" ] @@ -5588,7 +5588,7 @@ "qwen3-vl-embedding-8b" ], "max_tokens": 32768, - "dimension": 4096, + "max_dimension": 4096, "model_types": [ "embedding" ] @@ -6794,7 +6794,7 @@ "qwen3-embedding-0.6b-gguf" ], "max_tokens": 32768, - "dimension": 1024, + "max_dimension": 1024, "model_types": [ "embedding" ] @@ -6806,7 +6806,7 @@ "qwen3-embedding-4b-gguf" ], "max_tokens": 32768, - "dimension": 2560, + "max_dimension": 2560, "model_types": [ "embedding" ] @@ -6818,7 +6818,7 @@ "qwen3-embedding-8b-gguf" ], "max_tokens": 32768, - "dimension": 4096, + "max_dimension": 4096, "model_types": [ "embedding" ] @@ -6843,7 +6843,7 @@ "Qwen3-Embedding-8B" ], "max_tokens": 32768, - "dimension": 4096, + "max_dimension": 4096, "model_types": [ "embedding" ] @@ -6856,7 +6856,7 @@ "Qwen3-Embedding-4B" ], "max_tokens": 32768, - "dimension": 2560, + "max_dimension": 2560, "model_types": [ "embedding" ] @@ -6869,7 +6869,7 @@ "Qwen3-Embedding-0.6B" ], "max_tokens": 32768, - "dimension": 1024, + "max_dimension": 1024, "model_types": [ "embedding" ] @@ -10599,7 +10599,6 @@ { "name": "baidu/nava", "alias": [ - "baidu/nava", "baidu/NAVA", "nava" ], @@ -10610,7 +10609,6 @@ { "name": "baidu/ernie-image-aes", "alias": [ - "baidu/ernie-image-aes", "baidu/ERNIE-Image-Aes", "ernie-image-aes" ], @@ -10621,7 +10619,6 @@ { "name": "baidu/ernie-image-turbo", "alias": [ - "baidu/ernie-image-turbo", "baidu/ERNIE-Image-Turbo", "ernie-image-turbo" ], @@ -10632,7 +10629,6 @@ { "name": "baidu/ernie-image", "alias": [ - "baidu/ernie-image", "baidu/ERNIE-Image", "ernie-image" ], @@ -10643,7 +10639,6 @@ { "name": "baidu/qianfan-ocr", "alias": [ - "baidu/qianfan-ocr", "baidu/Qianfan-OCR", "qianfan-ocr" ], @@ -10657,7 +10652,6 @@ { "name": "baidu/qianfan-vl-70b", "alias": [ - "baidu/qianfan-vl-70b", "baidu/Qianfan-VL-70B", "qianfan-vl-70b" ], @@ -10675,7 +10669,6 @@ { "name": "baidu/qianfan-vl-8b", "alias": [ - "baidu/qianfan-vl-8b", "baidu/Qianfan-VL-8B", "qianfan-vl-8b" ], @@ -10693,7 +10686,6 @@ { "name": "baidu/qianfan-vl-3b", "alias": [ - "baidu/qianfan-vl-3b", "baidu/Qianfan-VL-3B", "qianfan-vl-3b" ], @@ -10707,7 +10699,6 @@ { "name": "baidu/ernie-4.5-vl-28b-a3b-pt", "alias": [ - "baidu/ernie-4.5-vl-28b-a3b-pt", "baidu/ERNIE-4.5-VL-28B-A3B-PT", "ernie-4.5-vl-28b-a3b-pt" ], @@ -10722,7 +10713,6 @@ { "name": "baidu/ernie-4.5-vl-28b-a3b-thinking", "alias": [ - "baidu/ernie-4.5-vl-28b-a3b-thinking", "baidu/ERNIE-4.5-VL-28B-A3B-Thinking", "ernie-4.5-vl-28b-a3b-thinking" ], @@ -10741,7 +10731,6 @@ { "name": "baidu/ernie-4.5-vl-28b-a3b-base-pt", "alias": [ - "baidu/ernie-4.5-vl-28b-a3b-base-pt", "baidu/ERNIE-4.5-VL-28B-A3B-Base-PT", "ernie-4.5-vl-28b-a3b-base-pt" ], @@ -10754,7 +10743,6 @@ { "name": "baidu/ernie-4.5-vl-424b-a47b-pt", "alias": [ - "baidu/ernie-4.5-vl-424b-a47b-pt", "baidu/ERNIE-4.5-VL-424B-A47B-PT", "ernie-4.5-vl-424b-a47b-pt" ], @@ -10769,7 +10757,6 @@ { "name": "baidu/ernie-4.5-vl-424b-a47b-base-pt", "alias": [ - "baidu/ernie-4.5-vl-424b-a47b-base-pt", "baidu/ERNIE-4.5-VL-424B-A47B-Base-PT", "ernie-4.5-vl-424b-a47b-base-pt" ], @@ -10782,7 +10769,6 @@ { "name": "baidu/ernie-4.5-21b-a3b-base-pt", "alias": [ - "baidu/ernie-4.5-21b-a3b-base-pt", "baidu/ERNIE-4.5-21B-A3B-Base-PT", "ernie-4.5-21b-a3b-base-pt" ], @@ -10794,7 +10780,6 @@ { "name": "baidu/ernie-4.5-300b-a47b-base-pt", "alias": [ - "baidu/ernie-4.5-300b-a47b-base-pt", "baidu/ERNIE-4.5-300B-A47B-Base-PT", "ernie-4.5-300b-a47b-base-pt" ], @@ -10806,7 +10791,6 @@ { "name": "baidu/ernie-4.5-21b-a3b-thinking", "alias": [ - "baidu/ernie-4.5-21b-a3b-thinking", "baidu/ERNIE-4.5-21B-A3B-Thinking", "ernie-4.5-21b-a3b-thinking" ], @@ -10822,7 +10806,6 @@ { "name": "baidu/ernie-4.5-21b-a3b-pt", "alias": [ - "baidu/ernie-4.5-21b-a3b-pt", "baidu/ERNIE-4.5-21B-A3B-PT", "ernie-4.5-21b-a3b-pt" ], @@ -10834,7 +10817,6 @@ { "name": "baidu/ernie-4.5-300b-a47b-pt", "alias": [ - "baidu/ernie-4.5-300b-a47b-pt", "baidu/ERNIE-4.5-300B-A47B-PT", "ernie-4.5-300b-a47b-pt" ], @@ -10846,7 +10828,6 @@ { "name": "baidu/ernie-4.5-300b-a47b-2bits-paddle", "alias": [ - "baidu/ernie-4.5-300b-a47b-2bits-paddle", "baidu/ERNIE-4.5-300B-A47B-2Bits-Paddle", "ernie-4.5-300b-a47b-2bits-paddle" ], @@ -10858,7 +10839,6 @@ { "name": "baidu/ernie-4.5-300b-a47b-2bits-tp4-paddle", "alias": [ - "baidu/ernie-4.5-300b-a47b-2bits-tp4-paddle", "baidu/ERNIE-4.5-300B-A47B-2Bits-TP4-Paddle", "ernie-4.5-300b-a47b-2bits-tp4-paddle" ], @@ -10870,7 +10850,6 @@ { "name": "baidu/ernie-4.5-300b-a47b-2bits-tp2-paddle", "alias": [ - "baidu/ernie-4.5-300b-a47b-2bits-tp2-paddle", "baidu/ERNIE-4.5-300B-A47B-2Bits-TP2-Paddle", "ernie-4.5-300b-a47b-2bits-tp2-paddle" ], @@ -10882,7 +10861,6 @@ { "name": "baidu/ernie-4.5-21b-a3b-paddle", "alias": [ - "baidu/ernie-4.5-21b-a3b-paddle", "baidu/ERNIE-4.5-21B-A3B-Paddle", "ernie-4.5-21b-a3b-paddle" ], @@ -10894,7 +10872,6 @@ { "name": "baidu/ernie-4.5-300b-a47b-paddle", "alias": [ - "baidu/ernie-4.5-300b-a47b-paddle", "baidu/ERNIE-4.5-300B-A47B-Paddle", "ernie-4.5-300b-a47b-paddle" ], @@ -10906,7 +10883,6 @@ { "name": "baidu/ernie-4.5-300b-a47b-base-paddle", "alias": [ - "baidu/ernie-4.5-300b-a47b-base-paddle", "baidu/ERNIE-4.5-300B-A47B-Base-Paddle", "ernie-4.5-300b-a47b-base-paddle" ], @@ -10918,7 +10894,6 @@ { "name": "baidu/ernie-4.5-300b-a47b-fp8-paddle", "alias": [ - "baidu/ernie-4.5-300b-a47b-fp8-paddle", "baidu/ERNIE-4.5-300B-A47B-FP8-Paddle", "ernie-4.5-300b-a47b-fp8-paddle" ], @@ -10930,7 +10905,6 @@ { "name": "baidu/ernie-4.5-300b-a47b-w4a8c8-tp4-paddle", "alias": [ - "baidu/ernie-4.5-300b-a47b-w4a8c8-tp4-paddle", "baidu/ERNIE-4.5-300B-A47B-W4A8C8-TP4-Paddle", "ernie-4.5-300b-a47b-w4a8c8-tp4-paddle" ], @@ -10942,7 +10916,6 @@ { "name": "baidu/ernie-4.5-0.3b-base-pt", "alias": [ - "baidu/ernie-4.5-0.3b-base-pt", "baidu/ERNIE-4.5-0.3B-Base-PT", "ernie-4.5-0.3b-base-pt" ], @@ -10954,7 +10927,6 @@ { "name": "baidu/ernie-4.5-0.3b-pt", "alias": [ - "baidu/ernie-4.5-0.3b-pt", "baidu/ERNIE-4.5-0.3B-PT", "ernie-4.5-0.3b-pt" ], @@ -10966,7 +10938,6 @@ { "name": "baidu/ernie-4.5-vl-424b-a47b-paddle", "alias": [ - "baidu/ernie-4.5-vl-424b-a47b-paddle", "baidu/ERNIE-4.5-VL-424B-A47B-Paddle", "ernie-4.5-vl-424b-a47b-paddle" ], @@ -10981,7 +10952,6 @@ { "name": "baidu/ernie-4.5-vl-28b-a3b-base-paddle", "alias": [ - "baidu/ernie-4.5-vl-28b-a3b-base-paddle", "baidu/ERNIE-4.5-VL-28B-A3B-Base-Paddle", "ernie-4.5-vl-28b-a3b-base-paddle" ], @@ -10994,7 +10964,6 @@ { "name": "baidu/ernie-4.5-21b-a3b-base-paddle", "alias": [ - "baidu/ernie-4.5-21b-a3b-base-paddle", "baidu/ERNIE-4.5-21B-A3B-Base-Paddle", "ernie-4.5-21b-a3b-base-paddle" ], @@ -11006,7 +10975,6 @@ { "name": "baidu/ernie-4.5-vl-28b-a3b-paddle", "alias": [ - "baidu/ernie-4.5-vl-28b-a3b-paddle", "baidu/ERNIE-4.5-VL-28B-A3B-Paddle", "ernie-4.5-vl-28b-a3b-paddle" ], @@ -11021,7 +10989,6 @@ { "name": "baidu/ernie-4.5-0.3b-base-paddle", "alias": [ - "baidu/ernie-4.5-0.3b-base-paddle", "baidu/ERNIE-4.5-0.3B-Base-Paddle", "ernie-4.5-0.3b-base-paddle" ], @@ -11033,7 +11000,6 @@ { "name": "baidu/ernie-4.5-0.3b-paddle", "alias": [ - "baidu/ernie-4.5-0.3b-paddle", "baidu/ERNIE-4.5-0.3B-Paddle", "ernie-4.5-0.3b-paddle" ], @@ -11045,7 +11011,6 @@ { "name": "baidu/ernie-4.5-vl-424b-a47b-base-paddle", "alias": [ - "baidu/ernie-4.5-vl-424b-a47b-base-paddle", "baidu/ERNIE-4.5-VL-424B-A47B-Base-Paddle", "ernie-4.5-vl-424b-a47b-base-paddle" ], @@ -11425,10 +11390,9 @@ { "name": "jinaai/jina-embeddings-v5-omni-small-text-matching", "alias": [ - "jinaai/jina-embeddings-v5-omni-small-text-matching", "jina-embeddings-v5-omni-small-text-matching" ], - "dimension": 1024, + "max_dimension": 1024, "dimensions": [ 32, 64, @@ -11448,10 +11412,9 @@ { "name": "jinaai/jina-embeddings-v5-omni-nano-retrieval", "alias": [ - "jinaai/jina-embeddings-v5-omni-nano-retrieval", "jina-embeddings-v5-omni-nano-retrieval" ], - "dimension": 1024, + "max_dimension": 1024, "dimensions": [ 32, 64, @@ -11471,10 +11434,9 @@ { "name": "jinaai/jina-embeddings-v5-omni-nano-classification", "alias": [ - "jinaai/jina-embeddings-v5-omni-nano-classification", "jina-embeddings-v5-omni-nano-classification" ], - "dimension": 1024, + "max_dimension": 1024, "dimensions": [ 32, 64, @@ -11494,10 +11456,9 @@ { "name": "jinaai/jina-embeddings-v5-omni-nano-clustering", "alias": [ - "jinaai/jina-embeddings-v5-omni-nano-clustering", "jina-embeddings-v5-omni-nano-clustering" ], - "dimension": 1024, + "max_dimension": 1024, "dimensions": [ 32, 64, @@ -11517,10 +11478,9 @@ { "name": "jinaai/jina-embeddings-v5-omni-nano-text-matching", "alias": [ - "jinaai/jina-embeddings-v5-omni-nano-text-matching", "jina-embeddings-v5-omni-nano-text-matching" ], - "dimension": 1024, + "max_dimension": 1024, "dimensions": [ 32, 64, @@ -11540,10 +11500,9 @@ { "name": "jinaai/jina-embeddings-v5-omni-nano", "alias": [ - "jinaai/jina-embeddings-v5-omni-nano", "jina-embeddings-v5-omni-nano" ], - "dimension": 1024, + "max_dimension": 1024, "dimensions": [ 32, 64, @@ -11563,10 +11522,9 @@ { "name": "jinaai/jina-embeddings-v5-omni-small-retrieval", "alias": [ - "jinaai/jina-embeddings-v5-omni-small-retrieval", "jina-embeddings-v5-omni-small-retrieval" ], - "dimension": 1024, + "max_dimension": 1024, "dimensions": [ 32, 64, @@ -11586,10 +11544,9 @@ { "name": "jinaai/jina-embeddings-v5-omni-small-classification", "alias": [ - "jinaai/jina-embeddings-v5-omni-small-classification", "jina-embeddings-v5-omni-small-classification" ], - "dimension": 1024, + "max_dimension": 1024, "dimensions": [ 32, 64, @@ -11609,10 +11566,9 @@ { "name": "jinaai/jina-embeddings-v5-omni-small-clustering", "alias": [ - "jinaai/jina-embeddings-v5-omni-small-clustering", "jina-embeddings-v5-omni-small-clustering" ], - "dimension": 1024, + "max_dimension": 1024, "dimensions": [ 32, 64, @@ -11632,10 +11588,9 @@ { "name": "jinaai/jina-embeddings-v5-omni-small", "alias": [ - "jinaai/jina-embeddings-v5-omni-small", "jina-embeddings-v5-omni-small" ], - "dimension": 1024, + "max_dimension": 1024, "dimensions": [ 32, 64, @@ -11655,10 +11610,9 @@ { "name": "jinaai/jina-embeddings-v5-omni-nano-mlx", "alias": [ - "jinaai/jina-embeddings-v5-omni-nano-mlx", "jina-embeddings-v5-omni-nano-mlx" ], - "dimension": 1024, + "max_dimension": 1024, "dimensions": [ 32, 64, @@ -11678,10 +11632,9 @@ { "name": "jinaai/jina-embeddings-v5-omni-small-mlx", "alias": [ - "jinaai/jina-embeddings-v5-omni-small-mlx", "jina-embeddings-v5-omni-small-mlx" ], - "dimension": 1024, + "max_dimension": 1024, "dimensions": [ 32, 64, @@ -11701,12 +11654,11 @@ { "name": "jinaai/jina-embeddings-v5-omni-small-text-matching-gguf", "alias": [ - "jinaai/jina-embeddings-v5-omni-small-text-matching-gguf", "jinaai/jina-embeddings-v5-omni-small-text-matching-GGUF", "jina-embeddings-v5-omni-small-text-matching-GGUF", "jina-embeddings-v5-omni-small-text-matching-gguf" ], - "dimension": 1024, + "max_dimension": 1024, "dimensions": [ 32, 64, @@ -11726,12 +11678,11 @@ { "name": "jinaai/jina-embeddings-v5-omni-small-clustering-gguf", "alias": [ - "jinaai/jina-embeddings-v5-omni-small-clustering-gguf", "jinaai/jina-embeddings-v5-omni-small-clustering-GGUF", "jina-embeddings-v5-omni-small-clustering-GGUF", "jina-embeddings-v5-omni-small-clustering-gguf" ], - "dimension": 1024, + "max_dimension": 1024, "dimensions": [ 32, 64, @@ -11751,12 +11702,11 @@ { "name": "jinaai/jina-embeddings-v5-omni-small-classification-gguf", "alias": [ - "jinaai/jina-embeddings-v5-omni-small-classification-gguf", "jinaai/jina-embeddings-v5-omni-small-classification-GGUF", "jina-embeddings-v5-omni-small-classification-GGUF", "jina-embeddings-v5-omni-small-classification-gguf" ], - "dimension": 1024, + "max_dimension": 1024, "dimensions": [ 32, 64, @@ -11776,12 +11726,11 @@ { "name": "jinaai/jina-embeddings-v5-omni-small-retrieval-gguf", "alias": [ - "jinaai/jina-embeddings-v5-omni-small-retrieval-gguf", "jinaai/jina-embeddings-v5-omni-small-retrieval-GGUF", "jina-embeddings-v5-omni-small-retrieval-GGUF", "jina-embeddings-v5-omni-small-retrieval-gguf" ], - "dimension": 1024, + "max_dimension": 1024, "dimensions": [ 32, 64, @@ -11801,12 +11750,11 @@ { "name": "jinaai/jina-embeddings-v5-omni-nano-text-matching-gguf", "alias": [ - "jinaai/jina-embeddings-v5-omni-nano-text-matching-gguf", "jinaai/jina-embeddings-v5-omni-nano-text-matching-GGUF", "jina-embeddings-v5-omni-nano-text-matching-GGUF", "jina-embeddings-v5-omni-nano-text-matching-gguf" ], - "dimension": 1024, + "max_dimension": 1024, "dimensions": [ 32, 64, @@ -11826,12 +11774,11 @@ { "name": "jinaai/jina-embeddings-v5-omni-nano-clustering-gguf", "alias": [ - "jinaai/jina-embeddings-v5-omni-nano-clustering-gguf", "jinaai/jina-embeddings-v5-omni-nano-clustering-GGUF", "jina-embeddings-v5-omni-nano-clustering-GGUF", "jina-embeddings-v5-omni-nano-clustering-gguf" ], - "dimension": 1024, + "max_dimension": 1024, "dimensions": [ 32, 64, @@ -11851,12 +11798,11 @@ { "name": "jinaai/jina-embeddings-v5-omni-nano-classification-gguf", "alias": [ - "jinaai/jina-embeddings-v5-omni-nano-classification-gguf", "jinaai/jina-embeddings-v5-omni-nano-classification-GGUF", "jina-embeddings-v5-omni-nano-classification-GGUF", "jina-embeddings-v5-omni-nano-classification-gguf" ], - "dimension": 1024, + "max_dimension": 1024, "dimensions": [ 32, 64, @@ -11876,12 +11822,11 @@ { "name": "jinaai/jina-embeddings-v5-omni-nano-retrieval-gguf", "alias": [ - "jinaai/jina-embeddings-v5-omni-nano-retrieval-gguf", "jinaai/jina-embeddings-v5-omni-nano-retrieval-GGUF", "jina-embeddings-v5-omni-nano-retrieval-GGUF", "jina-embeddings-v5-omni-nano-retrieval-gguf" ], - "dimension": 1024, + "max_dimension": 1024, "dimensions": [ 32, 64, @@ -11901,10 +11846,9 @@ { "name": "jinaai/jina-embeddings-v5-omni-small-text-matching-mlx", "alias": [ - "jinaai/jina-embeddings-v5-omni-small-text-matching-mlx", "jina-embeddings-v5-omni-small-text-matching-mlx" ], - "dimension": 1024, + "max_dimension": 1024, "dimensions": [ 32, 64, @@ -11924,10 +11868,9 @@ { "name": "jinaai/jina-embeddings-v5-omni-small-clustering-mlx", "alias": [ - "jinaai/jina-embeddings-v5-omni-small-clustering-mlx", "jina-embeddings-v5-omni-small-clustering-mlx" ], - "dimension": 1024, + "max_dimension": 1024, "dimensions": [ 32, 64, @@ -11947,10 +11890,9 @@ { "name": "jinaai/jina-embeddings-v5-omni-small-classification-mlx", "alias": [ - "jinaai/jina-embeddings-v5-omni-small-classification-mlx", "jina-embeddings-v5-omni-small-classification-mlx" ], - "dimension": 1024, + "max_dimension": 1024, "dimensions": [ 32, 64, @@ -11970,10 +11912,9 @@ { "name": "jinaai/jina-embeddings-v5-omni-small-retrieval-mlx", "alias": [ - "jinaai/jina-embeddings-v5-omni-small-retrieval-mlx", "jina-embeddings-v5-omni-small-retrieval-mlx" ], - "dimension": 1024, + "max_dimension": 1024, "dimensions": [ 32, 64, @@ -11993,10 +11934,9 @@ { "name": "jinaai/jina-embeddings-v5-omni-nano-text-matching-mlx", "alias": [ - "jinaai/jina-embeddings-v5-omni-nano-text-matching-mlx", "jina-embeddings-v5-omni-nano-text-matching-mlx" ], - "dimension": 1024, + "max_dimension": 1024, "dimensions": [ 32, 64, @@ -12016,10 +11956,9 @@ { "name": "jinaai/jina-embeddings-v5-omni-nano-clustering-mlx", "alias": [ - "jinaai/jina-embeddings-v5-omni-nano-clustering-mlx", "jina-embeddings-v5-omni-nano-clustering-mlx" ], - "dimension": 1024, + "max_dimension": 1024, "dimensions": [ 32, 64, @@ -12039,10 +11978,9 @@ { "name": "jinaai/jina-embeddings-v5-omni-nano-classification-mlx", "alias": [ - "jinaai/jina-embeddings-v5-omni-nano-classification-mlx", "jina-embeddings-v5-omni-nano-classification-mlx" ], - "dimension": 1024, + "max_dimension": 1024, "dimensions": [ 32, 64, @@ -12062,10 +12000,9 @@ { "name": "jinaai/jina-embeddings-v5-omni-nano-retrieval-mlx", "alias": [ - "jinaai/jina-embeddings-v5-omni-nano-retrieval-mlx", "jina-embeddings-v5-omni-nano-retrieval-mlx" ], - "dimension": 1024, + "max_dimension": 1024, "dimensions": [ 32, 64, @@ -12085,10 +12022,9 @@ { "name": "jinaai/jina-embeddings-v5-text-small-text-matching", "alias": [ - "jinaai/jina-embeddings-v5-text-small-text-matching", "jina-embeddings-v5-text-small-text-matching" ], - "dimension": 1024, + "max_dimension": 1024, "dimensions": [ 32, 64, @@ -12106,10 +12042,9 @@ { "name": "jinaai/jina-embeddings-v5-text-small-classification", "alias": [ - "jinaai/jina-embeddings-v5-text-small-classification", "jina-embeddings-v5-text-small-classification" ], - "dimension": 1024, + "max_dimension": 1024, "dimensions": [ 32, 64, @@ -12127,10 +12062,9 @@ { "name": "jinaai/jina-embeddings-v5-text-small-clustering", "alias": [ - "jinaai/jina-embeddings-v5-text-small-clustering", "jina-embeddings-v5-text-small-clustering" ], - "dimension": 1024, + "max_dimension": 1024, "dimensions": [ 32, 64, @@ -12148,10 +12082,9 @@ { "name": "jinaai/jina-embeddings-v5-text-small-retrieval", "alias": [ - "jinaai/jina-embeddings-v5-text-small-retrieval", "jina-embeddings-v5-text-small-retrieval" ], - "dimension": 1024, + "max_dimension": 1024, "dimensions": [ 32, 64, @@ -12169,10 +12102,9 @@ { "name": "jinaai/jina-embeddings-v5-text-nano-classification", "alias": [ - "jinaai/jina-embeddings-v5-text-nano-classification", "jina-embeddings-v5-text-nano-classification" ], - "dimension": 1024, + "max_dimension": 1024, "dimensions": [ 32, 64, @@ -12190,10 +12122,9 @@ { "name": "jinaai/jina-embeddings-v5-text-nano-clustering", "alias": [ - "jinaai/jina-embeddings-v5-text-nano-clustering", "jina-embeddings-v5-text-nano-clustering" ], - "dimension": 1024, + "max_dimension": 1024, "dimensions": [ 32, 64, @@ -12211,10 +12142,9 @@ { "name": "jinaai/jina-embeddings-v5-text-nano-text-matching", "alias": [ - "jinaai/jina-embeddings-v5-text-nano-text-matching", "jina-embeddings-v5-text-nano-text-matching" ], - "dimension": 1024, + "max_dimension": 1024, "dimensions": [ 32, 64, @@ -12232,10 +12162,9 @@ { "name": "jinaai/jina-embeddings-v5-text-nano-retrieval", "alias": [ - "jinaai/jina-embeddings-v5-text-nano-retrieval", "jina-embeddings-v5-text-nano-retrieval" ], - "dimension": 1024, + "max_dimension": 1024, "dimensions": [ 32, 64, @@ -12253,10 +12182,9 @@ { "name": "jinaai/jina-embeddings-v5-text-nano", "alias": [ - "jinaai/jina-embeddings-v5-text-nano", "jina-embeddings-v5-text-nano" ], - "dimension": 1024, + "max_dimension": 1024, "dimensions": [ 32, 64, @@ -12274,10 +12202,9 @@ { "name": "jinaai/jina-embeddings-v5-text-small", "alias": [ - "jinaai/jina-embeddings-v5-text-small", "jina-embeddings-v5-text-small" ], - "dimension": 1024, + "max_dimension": 1024, "dimensions": [ 32, 64, @@ -12295,7 +12222,6 @@ { "name": "jinaai/jina-reranker-m0", "alias": [ - "jinaai/jina-reranker-m0", "jina-reranker-m0" ], "model_types": [ @@ -12306,10 +12232,9 @@ { "name": "jinaai/jina-embeddings-v4", "alias": [ - "jinaai/jina-embeddings-v4", "jina-embeddings-v4" ], - "dimension": 2048, + "max_dimension": 2048, "dimensions": [ 128, 256, @@ -12326,10 +12251,9 @@ { "name": "jinaai/jina-embeddings-v3-hf", "alias": [ - "jinaai/jina-embeddings-v3-hf", "jina-embeddings-v3-hf" ], - "dimension": 1024, + "max_dimension": 1024, "dimensions": [ 32, 64, @@ -12347,10 +12271,9 @@ { "name": "jinaai/jina-embeddings-v3", "alias": [ - "jinaai/jina-embeddings-v3", "jina-embeddings-v3" ], - "dimension": 1024, + "max_dimension": 1024, "dimensions": [ 32, 64, @@ -12368,10 +12291,9 @@ { "name": "jinaai/jina-clip-v1", "alias": [ - "jinaai/jina-clip-v1", "jina-clip-v1" ], - "dimension": 768, + "max_dimension": 768, "dimensions": [ 64, 128, @@ -12388,10 +12310,9 @@ { "name": "jinaai/jina-clip-v2", "alias": [ - "jinaai/jina-clip-v2", "jina-clip-v2" ], - "dimension": 1024, + "max_dimension": 1024, "dimensions": [ 64, 128, @@ -12409,7 +12330,6 @@ { "name": "jinaai/jina-vlm", "alias": [ - "jinaai/jina-vlm", "jina-vlm" ], "max_tokens": 32768, @@ -12422,7 +12342,6 @@ { "name": "jinaai/jina-reranker-v3", "alias": [ - "jinaai/jina-reranker-v3", "jina-reranker-v3" ], "model_types": [ @@ -12433,10 +12352,9 @@ { "name": "jinaai/jina-embeddings-v4-mlx-8bit", "alias": [ - "jinaai/jina-embeddings-v4-mlx-8bit", "jina-embeddings-v4-mlx-8bit" ], - "dimension": 2048, + "max_dimension": 2048, "dimensions": [ 128, 256, @@ -12453,7 +12371,6 @@ { "name": "jinaai/xlm-roberta-flash-implementation", "alias": [ - "jinaai/xlm-roberta-flash-implementation", "xlm-roberta-flash-implementation" ], "model_types": [ @@ -12463,12 +12380,11 @@ { "name": "jinaai/jina-embeddings-v5-text-nano-classification-gguf", "alias": [ - "jinaai/jina-embeddings-v5-text-nano-classification-gguf", "jinaai/jina-embeddings-v5-text-nano-classification-GGUF", "jina-embeddings-v5-text-nano-classification-GGUF", "jina-embeddings-v5-text-nano-classification-gguf" ], - "dimension": 1024, + "max_dimension": 1024, "dimensions": [ 32, 64, @@ -12486,12 +12402,11 @@ { "name": "jinaai/jina-embeddings-v5-text-nano-clustering-gguf", "alias": [ - "jinaai/jina-embeddings-v5-text-nano-clustering-gguf", "jinaai/jina-embeddings-v5-text-nano-clustering-GGUF", "jina-embeddings-v5-text-nano-clustering-GGUF", "jina-embeddings-v5-text-nano-clustering-gguf" ], - "dimension": 1024, + "max_dimension": 1024, "dimensions": [ 32, 64, @@ -12509,12 +12424,11 @@ { "name": "jinaai/jina-embeddings-v5-text-nano-retrieval-gguf", "alias": [ - "jinaai/jina-embeddings-v5-text-nano-retrieval-gguf", "jinaai/jina-embeddings-v5-text-nano-retrieval-GGUF", "jina-embeddings-v5-text-nano-retrieval-GGUF", "jina-embeddings-v5-text-nano-retrieval-gguf" ], - "dimension": 1024, + "max_dimension": 1024, "dimensions": [ 32, 64, @@ -12532,12 +12446,11 @@ { "name": "jinaai/jina-embeddings-v5-text-nano-text-matching-gguf", "alias": [ - "jinaai/jina-embeddings-v5-text-nano-text-matching-gguf", "jinaai/jina-embeddings-v5-text-nano-text-matching-GGUF", "jina-embeddings-v5-text-nano-text-matching-GGUF", "jina-embeddings-v5-text-nano-text-matching-gguf" ], - "dimension": 1024, + "max_dimension": 1024, "dimensions": [ 32, 64, @@ -12555,10 +12468,9 @@ { "name": "jinaai/jina-embeddings-v5-text-nano-mlx", "alias": [ - "jinaai/jina-embeddings-v5-text-nano-mlx", "jina-embeddings-v5-text-nano-mlx" ], - "dimension": 1024, + "max_dimension": 1024, "dimensions": [ 32, 64, @@ -12576,10 +12488,9 @@ { "name": "jinaai/jina-embeddings-v5-text-small-mlx", "alias": [ - "jinaai/jina-embeddings-v5-text-small-mlx", "jina-embeddings-v5-text-small-mlx" ], - "dimension": 1024, + "max_dimension": 1024, "dimensions": [ 32, 64, @@ -12597,10 +12508,9 @@ { "name": "jinaai/jina-embeddings-v5-text-nano-classification-mlx", "alias": [ - "jinaai/jina-embeddings-v5-text-nano-classification-mlx", "jina-embeddings-v5-text-nano-classification-mlx" ], - "dimension": 1024, + "max_dimension": 1024, "dimensions": [ 32, 64, @@ -12618,10 +12528,9 @@ { "name": "jinaai/jina-embeddings-v5-text-nano-clustering-mlx", "alias": [ - "jinaai/jina-embeddings-v5-text-nano-clustering-mlx", "jina-embeddings-v5-text-nano-clustering-mlx" ], - "dimension": 1024, + "max_dimension": 1024, "dimensions": [ 32, 64, @@ -12639,10 +12548,9 @@ { "name": "jinaai/jina-embeddings-v5-text-nano-text-matching-mlx", "alias": [ - "jinaai/jina-embeddings-v5-text-nano-text-matching-mlx", "jina-embeddings-v5-text-nano-text-matching-mlx" ], - "dimension": 1024, + "max_dimension": 1024, "dimensions": [ 32, 64, @@ -12660,10 +12568,9 @@ { "name": "jinaai/jina-embeddings-v5-text-nano-retrieval-mlx", "alias": [ - "jinaai/jina-embeddings-v5-text-nano-retrieval-mlx", "jina-embeddings-v5-text-nano-retrieval-mlx" ], - "dimension": 1024, + "max_dimension": 1024, "dimensions": [ 32, 64, @@ -12681,10 +12588,9 @@ { "name": "jinaai/jina-embeddings-v5-text-small-classification-mlx", "alias": [ - "jinaai/jina-embeddings-v5-text-small-classification-mlx", "jina-embeddings-v5-text-small-classification-mlx" ], - "dimension": 1024, + "max_dimension": 1024, "dimensions": [ 32, 64, @@ -12702,10 +12608,9 @@ { "name": "jinaai/jina-embeddings-v5-text-small-clustering-mlx", "alias": [ - "jinaai/jina-embeddings-v5-text-small-clustering-mlx", "jina-embeddings-v5-text-small-clustering-mlx" ], - "dimension": 1024, + "max_dimension": 1024, "dimensions": [ 32, 64, @@ -12723,10 +12628,9 @@ { "name": "jinaai/jina-embeddings-v5-text-small-text-matching-mlx", "alias": [ - "jinaai/jina-embeddings-v5-text-small-text-matching-mlx", "jina-embeddings-v5-text-small-text-matching-mlx" ], - "dimension": 1024, + "max_dimension": 1024, "dimensions": [ 32, 64, @@ -12744,10 +12648,9 @@ { "name": "jinaai/jina-embeddings-v5-text-small-retrieval-mlx", "alias": [ - "jinaai/jina-embeddings-v5-text-small-retrieval-mlx", "jina-embeddings-v5-text-small-retrieval-mlx" ], - "dimension": 1024, + "max_dimension": 1024, "dimensions": [ 32, 64, @@ -12765,10 +12668,9 @@ { "name": "jinaai/jina-code-embeddings-1.5b-mlx", "alias": [ - "jinaai/jina-code-embeddings-1.5b-mlx", "jina-code-embeddings-1.5b-mlx" ], - "dimension": 1024, + "max_dimension": 1024, "dimensions": [ 256, 512, @@ -12783,10 +12685,9 @@ { "name": "jinaai/jina-code-embeddings-0.5b-mlx", "alias": [ - "jinaai/jina-code-embeddings-0.5b-mlx", "jina-code-embeddings-0.5b-mlx" ], - "dimension": 1024, + "max_dimension": 1024, "dimensions": [ 256, 512, @@ -12801,12 +12702,11 @@ { "name": "jinaai/jina-embeddings-v5-text-small-retrieval-gguf", "alias": [ - "jinaai/jina-embeddings-v5-text-small-retrieval-gguf", "jinaai/jina-embeddings-v5-text-small-retrieval-GGUF", "jina-embeddings-v5-text-small-retrieval-GGUF", "jina-embeddings-v5-text-small-retrieval-gguf" ], - "dimension": 1024, + "max_dimension": 1024, "dimensions": [ 32, 64, @@ -12824,12 +12724,11 @@ { "name": "jinaai/jina-embeddings-v5-text-small-classification-gguf", "alias": [ - "jinaai/jina-embeddings-v5-text-small-classification-gguf", "jinaai/jina-embeddings-v5-text-small-classification-GGUF", "jina-embeddings-v5-text-small-classification-GGUF", "jina-embeddings-v5-text-small-classification-gguf" ], - "dimension": 1024, + "max_dimension": 1024, "dimensions": [ 32, 64, @@ -12847,12 +12746,11 @@ { "name": "jinaai/jina-embeddings-v5-text-small-clustering-gguf", "alias": [ - "jinaai/jina-embeddings-v5-text-small-clustering-gguf", "jinaai/jina-embeddings-v5-text-small-clustering-GGUF", "jina-embeddings-v5-text-small-clustering-GGUF", "jina-embeddings-v5-text-small-clustering-gguf" ], - "dimension": 1024, + "max_dimension": 1024, "dimensions": [ 32, 64, @@ -12870,12 +12768,11 @@ { "name": "jinaai/jina-embeddings-v5-text-small-text-matching-gguf", "alias": [ - "jinaai/jina-embeddings-v5-text-small-text-matching-gguf", "jinaai/jina-embeddings-v5-text-small-text-matching-GGUF", "jina-embeddings-v5-text-small-text-matching-GGUF", "jina-embeddings-v5-text-small-text-matching-gguf" ], - "dimension": 1024, + "max_dimension": 1024, "dimensions": [ 32, 64, @@ -12893,7 +12790,6 @@ { "name": "jinaai/jina-vlm-mlx", "alias": [ - "jinaai/jina-vlm-mlx", "jina-vlm-mlx" ], "max_tokens": 32768, @@ -12906,7 +12802,6 @@ { "name": "jinaai/jina-reranker-v2-base-multilingual", "alias": [ - "jinaai/jina-reranker-v2-base-multilingual", "jina-reranker-v2-base-multilingual" ], "model_types": [ @@ -12917,7 +12812,6 @@ { "name": "jinaai/jina-reranker-v3-gguf", "alias": [ - "jinaai/jina-reranker-v3-gguf", "jinaai/jina-reranker-v3-GGUF", "jina-reranker-v3-GGUF", "jina-reranker-v3-gguf" @@ -12930,7 +12824,6 @@ { "name": "jinaai/jina-reranker-v3-mlx", "alias": [ - "jinaai/jina-reranker-v3-mlx", "jina-reranker-v3-mlx" ], "model_types": [ @@ -12941,10 +12834,9 @@ { "name": "jinaai/jina-code-embeddings-0.5b", "alias": [ - "jinaai/jina-code-embeddings-0.5b", "jina-code-embeddings-0.5b" ], - "dimension": 1024, + "max_dimension": 1024, "dimensions": [ 256, 512, @@ -12959,10 +12851,9 @@ { "name": "jinaai/jina-code-embeddings-1.5b", "alias": [ - "jinaai/jina-code-embeddings-1.5b", "jina-code-embeddings-1.5b" ], - "dimension": 1024, + "max_dimension": 1024, "dimensions": [ 256, 512, @@ -12977,12 +12868,11 @@ { "name": "jinaai/jina-embeddings-v4-text-matching-gguf", "alias": [ - "jinaai/jina-embeddings-v4-text-matching-gguf", "jinaai/jina-embeddings-v4-text-matching-GGUF", "jina-embeddings-v4-text-matching-GGUF", "jina-embeddings-v4-text-matching-gguf" ], - "dimension": 2048, + "max_dimension": 2048, "dimensions": [ 128, 256, @@ -12998,12 +12888,11 @@ { "name": "jinaai/jina-embeddings-v4-text-code-gguf", "alias": [ - "jinaai/jina-embeddings-v4-text-code-gguf", "jinaai/jina-embeddings-v4-text-code-GGUF", "jina-embeddings-v4-text-code-GGUF", "jina-embeddings-v4-text-code-gguf" ], - "dimension": 2048, + "max_dimension": 2048, "dimensions": [ 128, 256, @@ -13019,12 +12908,11 @@ { "name": "jinaai/jina-embeddings-v4-text-retrieval-gguf", "alias": [ - "jinaai/jina-embeddings-v4-text-retrieval-gguf", "jinaai/jina-embeddings-v4-text-retrieval-GGUF", "jina-embeddings-v4-text-retrieval-GGUF", "jina-embeddings-v4-text-retrieval-gguf" ], - "dimension": 2048, + "max_dimension": 2048, "dimensions": [ 128, 256, @@ -13040,10 +12928,9 @@ { "name": "jinaai/jina-embeddings-v4-vllm-retrieval", "alias": [ - "jinaai/jina-embeddings-v4-vllm-retrieval", "jina-embeddings-v4-vllm-retrieval" ], - "dimension": 2048, + "max_dimension": 2048, "dimensions": [ 128, 256, @@ -13060,7 +12947,6 @@ { "name": "jinaai/jina-reranker-v1-tiny-en", "alias": [ - "jinaai/jina-reranker-v1-tiny-en", "jina-reranker-v1-tiny-en" ], "model_types": [ @@ -13071,7 +12957,6 @@ { "name": "jinaai/jina-reranker-v1-turbo-en", "alias": [ - "jinaai/jina-reranker-v1-turbo-en", "jina-reranker-v1-turbo-en" ], "model_types": [ @@ -13082,12 +12967,11 @@ { "name": "jinaai/jina-code-embeddings-1.5b-gguf", "alias": [ - "jinaai/jina-code-embeddings-1.5b-gguf", "jinaai/jina-code-embeddings-1.5b-GGUF", "jina-code-embeddings-1.5b-GGUF", "jina-code-embeddings-1.5b-gguf" ], - "dimension": 1024, + "max_dimension": 1024, "dimensions": [ 256, 512, @@ -13102,12 +12986,11 @@ { "name": "jinaai/jina-code-embeddings-0.5b-gguf", "alias": [ - "jinaai/jina-code-embeddings-0.5b-gguf", "jinaai/jina-code-embeddings-0.5b-GGUF", "jina-code-embeddings-0.5b-GGUF", "jina-code-embeddings-0.5b-gguf" ], - "dimension": 1024, + "max_dimension": 1024, "dimensions": [ 256, 512, @@ -13122,10 +13005,9 @@ { "name": "jinaai/jina-embeddings-v4-vllm-code", "alias": [ - "jinaai/jina-embeddings-v4-vllm-code", "jina-embeddings-v4-vllm-code" ], - "dimension": 2048, + "max_dimension": 2048, "dimensions": [ 128, 256, @@ -13142,10 +13024,9 @@ { "name": "jinaai/jina-embeddings-v4-vllm-text-matching", "alias": [ - "jinaai/jina-embeddings-v4-vllm-text-matching", "jina-embeddings-v4-vllm-text-matching" ], - "dimension": 2048, + "max_dimension": 2048, "dimensions": [ 128, 256, @@ -13162,7 +13043,6 @@ { "name": "jinaai/jina-reranker-m0-gguf", "alias": [ - "jinaai/jina-reranker-m0-gguf", "jinaai/jina-reranker-m0-GGUF", "jina-reranker-m0-GGUF", "jina-reranker-m0-gguf" @@ -13175,7 +13055,6 @@ { "name": "jinaai/jina-clip-implementation", "alias": [ - "jinaai/jina-clip-implementation", "jina-clip-implementation" ], "model_types": [ @@ -13185,7 +13064,6 @@ { "name": "jinaai/jina-reranker-m0-debug", "alias": [ - "jinaai/jina-reranker-m0-debug", "jina-reranker-m0-debug" ], "model_types": [ @@ -13196,7 +13074,6 @@ { "name": "jinaai/readerlm-v2", "alias": [ - "jinaai/readerlm-v2", "jinaai/ReaderLM-v2", "ReaderLM-v2", "readerlm-v2" @@ -13209,10 +13086,9 @@ { "name": "jinaai/jina-colbert-v2", "alias": [ - "jinaai/jina-colbert-v2", "jina-colbert-v2" ], - "dimension": 128, + "max_dimension": 128, "dimensions": [ 128 ], @@ -13224,7 +13100,6 @@ { "name": "jinaai/reader-lm-1.5b", "alias": [ - "jinaai/reader-lm-1.5b", "reader-lm-1.5b" ], "max_tokens": 128000, @@ -13235,10 +13110,9 @@ { "name": "jinaai/jina-embedding-s-en-v1", "alias": [ - "jinaai/jina-embedding-s-en-v1", "jina-embedding-s-en-v1" ], - "dimension": 512, + "max_dimension": 512, "dimensions": [ 512 ], @@ -13250,10 +13124,9 @@ { "name": "jinaai/jina-embedding-b-en-v1", "alias": [ - "jinaai/jina-embedding-b-en-v1", "jina-embedding-b-en-v1" ], - "dimension": 768, + "max_dimension": 768, "dimensions": [ 768 ], @@ -13265,10 +13138,9 @@ { "name": "jinaai/jina-embedding-l-en-v1", "alias": [ - "jinaai/jina-embedding-l-en-v1", "jina-embedding-l-en-v1" ], - "dimension": 1024, + "max_dimension": 1024, "dimensions": [ 1024 ], @@ -13280,10 +13152,9 @@ { "name": "jinaai/jina-embeddings-v2-base-code", "alias": [ - "jinaai/jina-embeddings-v2-base-code", "jina-embeddings-v2-base-code" ], - "dimension": 768, + "max_dimension": 768, "dimensions": [ 768 ], @@ -13295,10 +13166,9 @@ { "name": "jinaai/jina-embeddings-v2-base-es", "alias": [ - "jinaai/jina-embeddings-v2-base-es", "jina-embeddings-v2-base-es" ], - "dimension": 768, + "max_dimension": 768, "dimensions": [ 768 ], @@ -13310,10 +13180,9 @@ { "name": "jinaai/jina-embeddings-v2-base-de", "alias": [ - "jinaai/jina-embeddings-v2-base-de", "jina-embeddings-v2-base-de" ], - "dimension": 768, + "max_dimension": 768, "dimensions": [ 768 ], @@ -13325,10 +13194,9 @@ { "name": "jinaai/jina-embeddings-v2-small-en", "alias": [ - "jinaai/jina-embeddings-v2-small-en", "jina-embeddings-v2-small-en" ], - "dimension": 512, + "max_dimension": 512, "dimensions": [ 512 ], @@ -13340,10 +13208,9 @@ { "name": "jinaai/jina-embeddings-v2-base-zh", "alias": [ - "jinaai/jina-embeddings-v2-base-zh", "jina-embeddings-v2-base-zh" ], - "dimension": 768, + "max_dimension": 768, "dimensions": [ 768 ], @@ -13355,10 +13222,9 @@ { "name": "jinaai/jina-embeddings-v2-base-en", "alias": [ - "jinaai/jina-embeddings-v2-base-en", "jina-embeddings-v2-base-en" ], - "dimension": 768, + "max_dimension": 768, "dimensions": [ 768 ], @@ -13370,10 +13236,9 @@ { "name": "jinaai/jina-colbert-v1-en", "alias": [ - "jinaai/jina-colbert-v1-en", "jina-colbert-v1-en" ], - "dimension": 128, + "max_dimension": 128, "dimensions": [ 128 ], @@ -13385,10 +13250,9 @@ { "name": "jinaai/jina-colbert-v2-64", "alias": [ - "jinaai/jina-colbert-v2-64", "jina-colbert-v2-64" ], - "dimension": 64, + "max_dimension": 64, "dimensions": [ 64 ], @@ -13400,7 +13264,6 @@ { "name": "jinaai/reader-lm-0.5b", "alias": [ - "jinaai/reader-lm-0.5b", "reader-lm-0.5b" ], "max_tokens": 128000, @@ -13411,7 +13274,6 @@ { "name": "jinaai/text-seg-lm-qwen2-0.5b", "alias": [ - "jinaai/text-seg-lm-qwen2-0.5b", "text-seg-lm-qwen2-0.5b" ], "max_tokens": 32768, @@ -13422,7 +13284,6 @@ { "name": "jinaai/text-seg-lm-qwen2-0.5b-summary-chunking", "alias": [ - "jinaai/text-seg-lm-qwen2-0.5b-summary-chunking", "text-seg-lm-qwen2-0.5b-summary-chunking" ], "max_tokens": 32768, @@ -13433,7 +13294,6 @@ { "name": "jinaai/text-seg-lm-qwen2-0.5b-cot-topic-chunking", "alias": [ - "jinaai/text-seg-lm-qwen2-0.5b-cot-topic-chunking", "text-seg-lm-qwen2-0.5b-cot-topic-chunking" ], "max_tokens": 32768, @@ -13444,7 +13304,6 @@ { "name": "jinaai/xlm-roberta-flash-implementation-onnx", "alias": [ - "jinaai/xlm-roberta-flash-implementation-onnx", "xlm-roberta-flash-implementation-onnx" ], "model_types": [ @@ -13454,10 +13313,9 @@ { "name": "jinaai/jina-embeddings-v3-small-ci", "alias": [ - "jinaai/jina-embeddings-v3-small-ci", "jina-embeddings-v3-small-ci" ], - "dimension": 1024, + "max_dimension": 1024, "dimensions": [ 32, 64, @@ -13475,7 +13333,6 @@ { "name": "jinaai/jina-bert-flash-implementation", "alias": [ - "jinaai/jina-bert-flash-implementation", "jina-bert-flash-implementation" ], "model_types": [ @@ -13485,7 +13342,6 @@ { "name": "jinaai/phi-3-tiny-untrained", "alias": [ - "jinaai/phi-3-tiny-untrained", "jinaai/Phi-3-tiny-untrained", "Phi-3-tiny-untrained", "phi-3-tiny-untrained" @@ -13497,7 +13353,6 @@ { "name": "jinaai/jina-bert-v2-qk-post-norm", "alias": [ - "jinaai/jina-bert-v2-qk-post-norm", "jina-bert-v2-qk-post-norm" ], "model_types": [ @@ -13507,7 +13362,6 @@ { "name": "jinaai/jina-bert-v2-qk-devlin-norm-1e-2", "alias": [ - "jinaai/jina-bert-v2-qk-devlin-norm-1e-2", "jina-bert-v2-qk-devlin-norm-1e-2" ], "model_types": [ @@ -13517,7 +13371,6 @@ { "name": "jinaai/jina-bert-implementation", "alias": [ - "jinaai/jina-bert-implementation", "jina-bert-implementation" ], "model_types": [ @@ -13527,7 +13380,6 @@ { "name": "jinaai/clip-models", "alias": [ - "jinaai/clip-models", "clip-models" ], "model_types": [ @@ -13537,10 +13389,9 @@ { "name": "jinaai/jina-embedding-t-en-v1", "alias": [ - "jinaai/jina-embedding-t-en-v1", "jina-embedding-t-en-v1" ], - "dimension": 312, + "max_dimension": 312, "dimensions": [ 312 ], @@ -13552,7 +13403,6 @@ { "name": "jinaai/starcoder-1b-textbook", "alias": [ - "jinaai/starcoder-1b-textbook", "starcoder-1b-textbook" ], "model_types": [ @@ -13562,7 +13412,6 @@ { "name": "jinaai/flat-2d-animerge", "alias": [ - "jinaai/flat-2d-animerge", "flat-2d-animerge" ], "model_types": [ @@ -13572,7 +13421,6 @@ { "name": "jinaai/falcon-7b-code-alpaca-lora", "alias": [ - "jinaai/falcon-7b-code-alpaca-lora", "falcon-7b-code-alpaca-lora" ], "model_types": [ @@ -13582,7 +13430,6 @@ { "name": "jinaai/falcon-40b-code-alpaca", "alias": [ - "jinaai/falcon-40b-code-alpaca", "falcon-40b-code-alpaca" ], "model_types": [ @@ -13592,7 +13439,6 @@ { "name": "jinaai/falcon-40b-code-alpaca-lora", "alias": [ - "jinaai/falcon-40b-code-alpaca-lora", "falcon-40b-code-alpaca-lora" ], "model_types": [ @@ -13602,7 +13448,6 @@ { "name": "jinaai/falcon-7b-code-alpaca", "alias": [ - "jinaai/falcon-7b-code-alpaca", "falcon-7b-code-alpaca" ], "model_types": [ @@ -13612,7 +13457,6 @@ { "name": "openai/privacy-filter", "alias": [ - "openai/privacy-filter", "privacy-filter" ], "max_tokens": 4096, @@ -13623,7 +13467,6 @@ { "name": "openai/gpt-oss-safeguard-20b", "alias": [ - "openai/gpt-oss-safeguard-20b", "gpt-oss-safeguard-20b" ], "max_tokens": 131072, @@ -13638,7 +13481,6 @@ { "name": "openai/circuit-sparsity", "alias": [ - "openai/circuit-sparsity", "circuit-sparsity" ], "model_types": [ @@ -13648,7 +13490,6 @@ { "name": "openai/gpt-oss-safeguard-120b", "alias": [ - "openai/gpt-oss-safeguard-120b", "gpt-oss-safeguard-120b" ], "max_tokens": 131072, @@ -13663,7 +13504,6 @@ { "name": "openai/gpt-oss-20b", "alias": [ - "openai/gpt-oss-20b", "gpt-oss-20b" ], "max_tokens": 131072, @@ -13678,7 +13518,6 @@ { "name": "openai/gpt-oss-120b", "alias": [ - "openai/gpt-oss-120b", "gpt-oss-120b" ], "max_tokens": 131072, @@ -13693,7 +13532,6 @@ { "name": "openai/whisper-large-v3-turbo", "alias": [ - "openai/whisper-large-v3-turbo", "whisper-large-v3-turbo" ], "model_types": [ @@ -13703,7 +13541,6 @@ { "name": "openai/whisper-large-v3", "alias": [ - "openai/whisper-large-v3", "whisper-large-v3" ], "model_types": [ @@ -13713,7 +13550,6 @@ { "name": "openai/whisper-large-v2", "alias": [ - "openai/whisper-large-v2", "whisper-large-v2" ], "model_types": [ @@ -13723,7 +13559,6 @@ { "name": "openai/whisper-large", "alias": [ - "openai/whisper-large", "whisper-large" ], "model_types": [ @@ -13733,7 +13568,6 @@ { "name": "openai/whisper-medium", "alias": [ - "openai/whisper-medium", "whisper-medium" ], "model_types": [ @@ -13743,7 +13577,6 @@ { "name": "openai/whisper-small", "alias": [ - "openai/whisper-small", "whisper-small" ], "model_types": [ @@ -13753,7 +13586,6 @@ { "name": "openai/whisper-tiny", "alias": [ - "openai/whisper-tiny", "whisper-tiny" ], "model_types": [ @@ -13763,7 +13595,6 @@ { "name": "openai/whisper-base", "alias": [ - "openai/whisper-base", "whisper-base" ], "model_types": [ @@ -13773,10 +13604,9 @@ { "name": "openai/clip-vit-base-patch32", "alias": [ - "openai/clip-vit-base-patch32", "clip-vit-base-patch32" ], - "dimension": 512, + "max_dimension": 512, "dimensions": [ 512 ], @@ -13788,7 +13618,6 @@ { "name": "openai/whisper-medium.en", "alias": [ - "openai/whisper-medium.en", "whisper-medium.en" ], "model_types": [ @@ -13798,7 +13627,6 @@ { "name": "openai/whisper-small.en", "alias": [ - "openai/whisper-small.en", "whisper-small.en" ], "model_types": [ @@ -13808,7 +13636,6 @@ { "name": "openai/whisper-tiny.en", "alias": [ - "openai/whisper-tiny.en", "whisper-tiny.en" ], "model_types": [ @@ -13818,7 +13645,6 @@ { "name": "openai/whisper-base.en", "alias": [ - "openai/whisper-base.en", "whisper-base.en" ], "model_types": [ @@ -13828,7 +13654,6 @@ { "name": "openai/shap-e", "alias": [ - "openai/shap-e", "shap-e" ], "model_types": [ @@ -13838,7 +13663,6 @@ { "name": "openai/consistency-decoder", "alias": [ - "openai/consistency-decoder", "consistency-decoder" ], "model_types": [ @@ -13848,7 +13672,6 @@ { "name": "openai/diffusers-ct_imagenet64", "alias": [ - "openai/diffusers-ct_imagenet64", "diffusers-ct_imagenet64" ], "model_types": [ @@ -13858,7 +13681,6 @@ { "name": "openai/diffusers-cd_imagenet64_lpips", "alias": [ - "openai/diffusers-cd_imagenet64_lpips", "diffusers-cd_imagenet64_lpips" ], "model_types": [ @@ -13868,7 +13690,6 @@ { "name": "openai/diffusers-cd_imagenet64_l2", "alias": [ - "openai/diffusers-cd_imagenet64_l2", "diffusers-cd_imagenet64_l2" ], "model_types": [ @@ -13878,10 +13699,9 @@ { "name": "openai/clip-vit-large-patch14", "alias": [ - "openai/clip-vit-large-patch14", "clip-vit-large-patch14" ], - "dimension": 768, + "max_dimension": 768, "dimensions": [ 768 ], @@ -13893,7 +13713,6 @@ { "name": "openai/shap-e-img2img", "alias": [ - "openai/shap-e-img2img", "shap-e-img2img" ], "model_types": [ @@ -13904,7 +13723,6 @@ { "name": "openai/diffusers-cd_cat256_lpips", "alias": [ - "openai/diffusers-cd_cat256_lpips", "diffusers-cd_cat256_lpips" ], "model_types": [ @@ -13914,7 +13732,6 @@ { "name": "openai/diffusers-cd_cat256_l2", "alias": [ - "openai/diffusers-cd_cat256_l2", "diffusers-cd_cat256_l2" ], "model_types": [ @@ -13924,7 +13741,6 @@ { "name": "openai/diffusers-cd_bedroom256_l2", "alias": [ - "openai/diffusers-cd_bedroom256_l2", "diffusers-cd_bedroom256_l2" ], "model_types": [ @@ -13934,7 +13750,6 @@ { "name": "openai/diffusers-ct_bedroom256", "alias": [ - "openai/diffusers-ct_bedroom256", "diffusers-ct_bedroom256" ], "model_types": [ @@ -13944,7 +13759,6 @@ { "name": "openai/diffusers-cd_bedroom256_lpips", "alias": [ - "openai/diffusers-cd_bedroom256_lpips", "diffusers-cd_bedroom256_lpips" ], "model_types": [ @@ -13954,7 +13768,6 @@ { "name": "openai/diffusers-ct_cat256", "alias": [ - "openai/diffusers-ct_cat256", "diffusers-ct_cat256" ], "model_types": [ @@ -13964,7 +13777,6 @@ { "name": "openai/imagegpt-small", "alias": [ - "openai/imagegpt-small", "imagegpt-small" ], "model_types": [ @@ -13974,7 +13786,6 @@ { "name": "openai/imagegpt-medium", "alias": [ - "openai/imagegpt-medium", "imagegpt-medium" ], "model_types": [ @@ -13984,7 +13795,6 @@ { "name": "openai/imagegpt-large", "alias": [ - "openai/imagegpt-large", "imagegpt-large" ], "model_types": [ @@ -13994,7 +13804,6 @@ { "name": "openai/jukebox-5b-lyrics", "alias": [ - "openai/jukebox-5b-lyrics", "jukebox-5b-lyrics" ], "model_types": [ @@ -14004,7 +13813,6 @@ { "name": "openai/jukebox-1b-lyrics", "alias": [ - "openai/jukebox-1b-lyrics", "jukebox-1b-lyrics" ], "model_types": [ @@ -14014,10 +13822,9 @@ { "name": "openai/clip-vit-base-patch16", "alias": [ - "openai/clip-vit-base-patch16", "clip-vit-base-patch16" ], - "dimension": 512, + "max_dimension": 512, "dimensions": [ 512 ], @@ -14029,10 +13836,9 @@ { "name": "openai/clip-vit-large-patch14-336", "alias": [ - "openai/clip-vit-large-patch14-336", "clip-vit-large-patch14-336" ], - "dimension": 768, + "max_dimension": 768, "dimensions": [ 768 ], @@ -14044,7 +13850,6 @@ { "name": "gpt-5.4", "alias": [ - "gpt-5.4" ], "max_tokens": 1050000, "model_types": [ @@ -14058,7 +13863,6 @@ { "name": "gpt-image-2", "alias": [ - "gpt-image-2" ], "model_types": [ "image", @@ -14068,7 +13872,6 @@ { "name": "gpt-5.1", "alias": [ - "gpt-5.1" ], "max_tokens": 400000, "model_types": [ @@ -14082,7 +13885,6 @@ { "name": "gpt-5.2", "alias": [ - "gpt-5.2" ], "max_tokens": 400000, "model_types": [ @@ -14096,7 +13898,6 @@ { "name": "gpt-5.4-mini", "alias": [ - "gpt-5.4-mini" ], "max_tokens": 400000, "model_types": [ @@ -14110,7 +13911,6 @@ { "name": "gpt-5", "alias": [ - "gpt-5" ], "max_tokens": 400000, "model_types": [ @@ -14124,7 +13924,6 @@ { "name": "gpt-5-codex", "alias": [ - "gpt-5-codex" ], "max_tokens": 400000, "model_types": [ @@ -14138,7 +13937,6 @@ { "name": "gpt-5.3-codex", "alias": [ - "gpt-5.3-codex" ], "max_tokens": 400000, "model_types": [ @@ -14152,7 +13950,6 @@ { "name": "gpt-5.1-codex", "alias": [ - "gpt-5.1-codex" ], "max_tokens": 400000, "model_types": [ @@ -14166,7 +13963,6 @@ { "name": "gpt-5.3-codex-spark", "alias": [ - "gpt-5.3-codex-spark" ], "model_types": [ "chat" @@ -14179,7 +13975,6 @@ { "name": "gpt-5-codex-mini", "alias": [ - "gpt-5-codex-mini" ], "model_types": [ "chat" @@ -14192,7 +13987,6 @@ { "name": "gpt-5.1-codex-max", "alias": [ - "gpt-5.1-codex-max" ], "max_tokens": 400000, "model_types": [ @@ -14206,7 +14000,6 @@ { "name": "gpt-5.5", "alias": [ - "gpt-5.5" ], "max_tokens": 1050000, "model_types": [ @@ -14220,7 +14013,6 @@ { "name": "gpt-5.1-codex-mini", "alias": [ - "gpt-5.1-codex-mini" ], "max_tokens": 400000, "model_types": [ @@ -14234,7 +14026,6 @@ { "name": "gpt-5.2-codex", "alias": [ - "gpt-5.2-codex" ], "max_tokens": 400000, "model_types": [ @@ -14248,7 +14039,6 @@ { "name": "claude-fable-5", "alias": [ - "claude-fable-5", "anthropic.claude-fable-5" ], "max_tokens": 1000000, @@ -14264,7 +14054,6 @@ { "name": "claude-mythos-5", "alias": [ - "claude-mythos-5" ], "max_tokens": 1000000, "model_types": [ @@ -14279,7 +14068,6 @@ { "name": "claude-opus-4-8", "alias": [ - "claude-opus-4-8", "anthropic.claude-opus-4-8" ], "max_tokens": 1000000, @@ -14295,7 +14083,6 @@ { "name": "claude-sonnet-4-7", "alias": [ - "claude-sonnet-4-7", "anthropic.claude-sonnet-4-7" ], "max_tokens": 1000000, @@ -14311,7 +14098,6 @@ { "name": "claude-sonnet-4-6", "alias": [ - "claude-sonnet-4-6", "anthropic.claude-sonnet-4-6" ], "max_tokens": 1000000, @@ -14327,7 +14113,6 @@ { "name": "claude-sonnet-4-5", "alias": [ - "claude-sonnet-4-5", "anthropic.claude-sonnet-4-5" ], "max_tokens": 1000000, @@ -14343,7 +14128,6 @@ { "name": "claude-haiku-4-5-20251001", "alias": [ - "claude-haiku-4-5-20251001", "claude-haiku-4-5", "anthropic.claude-haiku-4-5-20251001-v1:0" ], @@ -14356,6 +14140,6845 @@ "default_value": true, "clear_thinking": true } + }, + { + "name": "moonshotai/kimi-k2.6", + "alias": [ + "moonshotai/Kimi-K2.6", + "kimi-k2.6" + ], + "model_types": [ + "chat", + "vision", + "image2text" + ], + "max_tokens": 262144, + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "moonshotai/kimi-k2.5", + "alias": [ + "moonshotai/Kimi-K2.5", + "kimi-k2.5" + ], + "model_types": [ + "chat", + "vision", + "image2text" + ], + "max_tokens": 262144, + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "moonshotai/kimi-k2-instruct", + "alias": [ + "moonshotai/Kimi-K2-Instruct", + "kimi-k2-instruct" + ], + "model_types": [ + "chat" + ], + "max_tokens": 262144, + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "moonshotai/kimi-vl-a3b-thinking-2506", + "alias": [ + "moonshotai/Kimi-VL-A3B-Thinking-2506", + "kimi-vl-a3b-thinking-2506" + ], + "model_types": [ + "chat", + "vision", + "image2text" + ], + "max_tokens": 262144, + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "moonshotai/kimi-vl-a3b-thinking", + "alias": [ + "moonshotai/Kimi-VL-A3B-Thinking", + "kimi-vl-a3b-thinking" + ], + "model_types": [ + "chat", + "vision", + "image2text" + ], + "max_tokens": 262144, + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "moonshotai/moonlight-16b-a3b-instruct", + "alias": [ + "moonshotai/Moonlight-16B-A3B-Instruct", + "moonlight-16b-a3b-instruct" + ], + "model_types": [ + "chat" + ], + "max_tokens": 262144, + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "moonshotai/kimi-k2-base", + "alias": [ + "moonshotai/Kimi-K2-Base", + "kimi-k2-base" + ], + "model_types": [ + "chat" + ], + "max_tokens": 262144 + }, + { + "name": "moonshotai/moonlight-16b-a3b", + "alias": [ + "moonshotai/Moonlight-16B-A3B", + "moonlight-16b-a3b" + ], + "model_types": [ + "chat" + ], + "max_tokens": 262144 + }, + { + "name": "moonshotai/kimi-vl-a3b-instruct", + "alias": [ + "moonshotai/Kimi-VL-A3B-Instruct", + "kimi-vl-a3b-instruct" + ], + "model_types": [ + "chat", + "vision", + "image2text" + ], + "max_tokens": 262144 + }, + { + "name": "moonshotai/kimi-linear-48b-a3b-base", + "alias": [ + "moonshotai/Kimi-Linear-48B-A3B-Base", + "kimi-linear-48b-a3b-base" + ], + "model_types": [ + "chat" + ], + "max_tokens": 262144 + }, + { + "name": "moonshotai/kimi-k2-instruct-0905", + "alias": [ + "moonshotai/Kimi-K2-Instruct-0905", + "kimi-k2-instruct-0905" + ], + "model_types": [ + "chat" + ], + "max_tokens": 262144, + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "moonshotai/kimi-linear-48b-a3b-instruct", + "alias": [ + "moonshotai/Kimi-Linear-48B-A3B-Instruct", + "kimi-linear-48b-a3b-instruct" + ], + "model_types": [ + "chat" + ], + "max_tokens": 262144, + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "moonshotai/kimi-dev-72b", + "alias": [ + "moonshotai/Kimi-Dev-72B", + "kimi-dev-72b" + ], + "model_types": [ + "chat" + ], + "max_tokens": 262144, + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "moonshotai/kimi-audio-7b-instruct", + "alias": [ + "moonshotai/Kimi-Audio-7B-Instruct", + "kimi-audio-7b-instruct" + ], + "model_types": [ + "audio", + "tts" + ], + "max_tokens": 0 + }, + { + "name": "moonshotai/kimi-audio-7b", + "alias": [ + "moonshotai/Kimi-Audio-7B", + "kimi-audio-7b" + ], + "model_types": [ + "audio", + "tts" + ], + "max_tokens": 0 + }, + { + "name": "moonshotai/moonvit-so-400m", + "alias": [ + "moonshotai/MoonViT-SO-400M", + "moonvit-so-400m" + ], + "model_types": [ + "vision" + ], + "max_tokens": 0 + }, + { + "name": "minimaxai/minimax-m2.7", + "alias": [ + "minimaxai/MiniMax-M2.7", + "minimax-m2.7", + "minimax/minimax-m2.7" + ], + "model_types": [ + "chat" + ], + "max_tokens": 1000000, + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "minimaxai/minimax-m2.5", + "alias": [ + "minimaxai/MiniMax-M2.5", + "minimax-m2.5", + "minimax/minimax-m2.5" + ], + "model_types": [ + "chat" + ], + "max_tokens": 1000000, + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "minimaxai/minimax-m2.1", + "alias": [ + "minimaxai/MiniMax-M2.1", + "minimax-m2.1", + "minimax/minimax-m2.1" + ], + "model_types": [ + "chat" + ], + "max_tokens": 1000000, + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "minimaxai/minimax-m2", + "alias": [ + "minimaxai/MiniMax-M2", + "minimax-m2", + "minimax/minimax-m2" + ], + "model_types": [ + "chat" + ], + "max_tokens": 1000000, + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "minimaxai/vtp-large-f16d64", + "alias": [ + "minimaxai/VTP-Large-f16d64", + "vtp-large-f16d64" + ], + "model_types": [ + "embedding", + "vision" + ], + "max_dimension": 512, + "dimensions": [ + 512 + ], + "max_tokens": 0 + }, + { + "name": "minimaxai/vtp-base-f16d64", + "alias": [ + "minimaxai/VTP-Base-f16d64", + "vtp-base-f16d64" + ], + "model_types": [ + "embedding", + "vision" + ], + "max_dimension": 512, + "dimensions": [ + 512 + ], + "max_tokens": 0 + }, + { + "name": "minimaxai/vtp-small-f16d64", + "alias": [ + "minimaxai/VTP-Small-f16d64", + "vtp-small-f16d64" + ], + "model_types": [ + "embedding", + "vision" + ], + "max_dimension": 512, + "dimensions": [ + 512 + ], + "max_tokens": 0 + }, + { + "name": "minimaxai/minimax-m1-40k-hf", + "alias": [ + "minimaxai/MiniMax-M1-40k-hf", + "minimax-m1-40k-hf" + ], + "model_types": [ + "chat" + ], + "max_tokens": 40000, + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "minimaxai/minimax-text-01-hf", + "alias": [ + "minimaxai/MiniMax-Text-01-hf", + "minimax-text-01-hf" + ], + "model_types": [ + "chat" + ], + "max_tokens": 1000000, + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "minimaxai/minimax-m1-80k-hf", + "alias": [ + "minimaxai/MiniMax-M1-80k-hf", + "minimax-m1-80k-hf" + ], + "model_types": [ + "chat" + ], + "max_tokens": 80000, + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "minimaxai/minimax-m1-80k", + "alias": [ + "minimaxai/MiniMax-M1-80k", + "minimax-m1-80k" + ], + "model_types": [ + "chat" + ], + "max_tokens": 80000, + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "minimaxai/minimax-m1-40k", + "alias": [ + "minimaxai/MiniMax-M1-40k", + "minimax-m1-40k" + ], + "model_types": [ + "chat" + ], + "max_tokens": 40000, + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "minimaxai/minimax-text-01", + "alias": [ + "minimaxai/MiniMax-Text-01", + "minimax-text-01" + ], + "model_types": [ + "chat" + ], + "max_tokens": 1000000, + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "minimaxai/minimax-vl-01", + "alias": [ + "minimaxai/MiniMax-VL-01", + "minimax-vl-01" + ], + "model_types": [ + "chat", + "vision", + "image2text" + ], + "max_tokens": 1000000, + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "minimaxai/synlogic-32b", + "alias": [ + "minimaxai/SynLogic-32B", + "synlogic-32b" + ], + "model_types": [ + "chat" + ], + "max_tokens": 1000000, + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "minimaxai/synlogic-7b", + "alias": [ + "minimaxai/SynLogic-7B", + "synlogic-7b" + ], + "model_types": [ + "chat" + ], + "max_tokens": 1000000, + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "minimaxai/synlogic-mix-3-32b", + "alias": [ + "minimaxai/SynLogic-Mix-3-32B", + "synlogic-mix-3-32b" + ], + "model_types": [ + "chat" + ], + "max_tokens": 1000000, + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "stepfun-ai/Step-3.7-Flash-GGUF", + "alias": [ + "Step-3.7-Flash-GGUF" + ], + "model_types": [ + "chat", + "vision", + "image2text" + ], + "max_tokens": 262144, + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "stepfun-ai/Step-3.7-Flash", + "alias": [ + "Step-3.7-Flash" + ], + "model_types": [ + "chat", + "vision", + "image2text" + ], + "max_tokens": 262144, + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "stepfun-ai/Step-3.7-Flash-NVFP4", + "alias": [ + "Step-3.7-Flash-NVFP4" + ], + "model_types": [ + "chat", + "vision", + "image2text" + ], + "max_tokens": 262144, + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "stepfun-ai/Step-3.7-Flash-FP8", + "alias": [ + "Step-3.7-Flash-FP8" + ], + "model_types": [ + "chat", + "vision", + "image2text" + ], + "max_tokens": 262144, + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "stepfun-ai/Step-3.5-Flash", + "alias": [ + "Step-3.5-Flash" + ], + "model_types": [ + "chat" + ], + "max_tokens": 262144, + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "stepfun-ai/Step-3.5-Flash-Base-Midtrain", + "alias": [ + "Step-3.5-Flash-Base-Midtrain" + ], + "model_types": [ + "chat" + ], + "max_tokens": 262144, + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "stepfun-ai/Step-3.5-Flash-Base", + "alias": [ + "Step-3.5-Flash-Base" + ], + "model_types": [ + "chat" + ], + "max_tokens": 262144, + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "stepfun-ai/Step-3.5-Flash-FP8", + "alias": [ + "Step-3.5-Flash-FP8" + ], + "model_types": [ + "chat" + ], + "max_tokens": 262144, + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "stepfun-ai/NextStep-1.1-Pretrain-256px", + "alias": [ + "NextStep-1.1-Pretrain-256px" + ], + "model_types": [ + "image" + ], + "max_tokens": 0 + }, + { + "name": "stepfun-ai/Step-Audio-R1.1", + "alias": [ + "Step-Audio-R1.1" + ], + "model_types": [ + "audio", + "speech" + ], + "max_tokens": 0 + }, + { + "name": "stepfun-ai/Step-Audio-EditX", + "alias": [ + "Step-Audio-EditX" + ], + "model_types": [ + "audio", + "speech_edit" + ], + "max_tokens": 0 + }, + { + "name": "stepfun-ai/Step-Audio-2-mini", + "alias": [ + "Step-Audio-2-mini" + ], + "model_types": [ + "audio", + "speech" + ], + "max_tokens": 0 + }, + { + "name": "stepfun-ai/Step-3.5-Flash-GGUF-Q8_0", + "alias": [ + "Step-3.5-Flash-GGUF-Q8_0" + ], + "model_types": [ + "chat" + ], + "max_tokens": 262144 + }, + { + "name": "stepfun-ai/Step-3.5-Flash-GGUF-Q4_K_S", + "alias": [ + "Step-3.5-Flash-GGUF-Q4_K_S" + ], + "model_types": [ + "chat" + ], + "max_tokens": 262144 + }, + { + "name": "stepfun-ai/Step3-VL-10B-FP8", + "alias": [ + "Step3-VL-10B-FP8" + ], + "model_types": [ + "vision", + "image2text" + ], + "max_tokens": 65536 + }, + { + "name": "stepfun-ai/Step3-VL-10B", + "alias": [ + "Step3-VL-10B" + ], + "model_types": [ + "vision", + "image2text" + ], + "max_tokens": 65536 + }, + { + "name": "stepfun-ai/Step3-VL-10B-Base", + "alias": [ + "Step3-VL-10B-Base" + ], + "model_types": [ + "vision", + "image2text" + ], + "max_tokens": 65536 + }, + { + "name": "stepfun-ai/PaCoRe-8B", + "alias": [ + "PaCoRe-8B" + ], + "model_types": [ + "chat" + ], + "max_tokens": 262144 + }, + { + "name": "stepfun-ai/RLVR-8B-0926", + "alias": [ + "RLVR-8B-0926" + ], + "model_types": [ + "chat" + ], + "max_tokens": 262144 + }, + { + "name": "stepfun-ai/Step1X-Edit-v1p2", + "alias": [ + "Step1X-Edit-v1p2" + ], + "model_types": [ + "image" + ], + "max_tokens": 0 + }, + { + "name": "stepfun-ai/NextStep-1.1", + "alias": [ + "NextStep-1.1" + ], + "model_types": [ + "image" + ], + "max_tokens": 0 + }, + { + "name": "stepfun-ai/NextStep-1.1-Pretrain", + "alias": [ + "NextStep-1.1-Pretrain" + ], + "model_types": [ + "image" + ], + "max_tokens": 0 + }, + { + "name": "stepfun-ai/GELab-Zero-4B-preview", + "alias": [ + "GELab-Zero-4B-preview" + ], + "model_types": [ + "vision", + "image2text" + ], + "max_tokens": 65536 + }, + { + "name": "stepfun-ai/Step-Audio-R1", + "alias": [ + "Step-Audio-R1" + ], + "model_types": [ + "audio" + ], + "max_tokens": 0 + }, + { + "name": "stepfun-ai/StepFun-Formalizer-32B", + "alias": [ + "StepFun-Formalizer-32B" + ], + "model_types": [ + "chat" + ], + "max_tokens": 262144, + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "stepfun-ai/StepFun-Formalizer-7B", + "alias": [ + "StepFun-Formalizer-7B" + ], + "model_types": [ + "chat" + ], + "max_tokens": 262144, + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "stepfun-ai/StepFun-Prover-Preview-32B", + "alias": [ + "StepFun-Prover-Preview-32B" + ], + "model_types": [ + "chat" + ], + "max_tokens": 262144, + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "stepfun-ai/StepFun-Prover-Preview-7B", + "alias": [ + "StepFun-Prover-Preview-7B" + ], + "model_types": [ + "chat" + ], + "max_tokens": 262144, + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "stepfun-ai/Step-Audio-EditX-AWQ-4bit", + "alias": [ + "Step-Audio-EditX-AWQ-4bit" + ], + "model_types": [ + "audio" + ], + "max_tokens": 0 + }, + { + "name": "stepfun-ai/Step-Audio-2-mini-Think", + "alias": [ + "Step-Audio-2-mini-Think" + ], + "model_types": [ + "audio" + ], + "max_tokens": 0 + }, + { + "name": "stepfun-ai/Step-Audio-2-mini-Base", + "alias": [ + "Step-Audio-2-mini-Base" + ], + "model_types": [ + "audio" + ], + "max_tokens": 0 + }, + { + "name": "stepfun-ai/NextStep-1-f8ch16-Tokenizer", + "alias": [ + "NextStep-1-f8ch16-Tokenizer" + ], + "model_types": [ + "other" + ], + "max_tokens": 0 + }, + { + "name": "stepfun-ai/step3-fp8", + "alias": [ + "step3-fp8" + ], + "model_types": [ + "chat", + "vision", + "image2text" + ], + "max_tokens": 65536 + }, + { + "name": "stepfun-ai/step3", + "alias": [ + "step3" + ], + "model_types": [ + "chat", + "vision", + "image2text" + ], + "max_tokens": 65536 + }, + { + "name": "tencent/hy-mt2-1.8b-1.25bit-gguf", + "alias": [ + "tencent/Hy-MT2-1.8B-1.25Bit-GGUF", + "Hy-MT2-1.8B-1.25Bit-GGUF", + "hy-mt2-1.8b-1.25bit-gguf" + ], + "max_tokens": 262144, + "model_types": [ + "chat", + "translation" + ] + }, + { + "name": "tencent/hy-mt1.5-1.8b-1.25bit-gguf", + "alias": [ + "tencent/Hy-MT1.5-1.8B-1.25bit-GGUF", + "Hy-MT1.5-1.8B-1.25bit-GGUF", + "hy-mt1.5-1.8b-1.25bit-gguf" + ], + "max_tokens": 262144, + "model_types": [ + "chat", + "translation" + ] + }, + { + "name": "tencent/universal_audio_tokenizer", + "alias": [ + "tencent/Universal_Audio_Tokenizer", + "Universal_Audio_Tokenizer", + "universal_audio_tokenizer" + ], + "model_types": [ + "audio_codec" + ] + }, + { + "name": "tencent/hy-mt1.5-7b", + "alias": [ + "tencent/HY-MT1.5-7B", + "HY-MT1.5-7B", + "hy-mt1.5-7b" + ], + "max_tokens": 262144, + "model_types": [ + "chat", + "translation" + ] + }, + { + "name": "tencent/hy-mt1.5-1.8b-1.25bit", + "alias": [ + "tencent/Hy-MT1.5-1.8B-1.25bit", + "Hy-MT1.5-1.8B-1.25bit", + "hy-mt1.5-1.8b-1.25bit" + ], + "max_tokens": 262144, + "model_types": [ + "chat", + "translation" + ] + }, + { + "name": "tencent/hy-mt2-1.8b-2bit-gguf", + "alias": [ + "tencent/Hy-MT2-1.8B-2Bit-GGUF", + "Hy-MT2-1.8B-2Bit-GGUF", + "hy-mt2-1.8b-2bit-gguf" + ], + "max_tokens": 262144, + "model_types": [ + "chat", + "translation" + ] + }, + { + "name": "tencent/hy-mt2-7b-gguf", + "alias": [ + "tencent/Hy-MT2-7B-GGUF", + "Hy-MT2-7B-GGUF", + "hy-mt2-7b-gguf" + ], + "max_tokens": 262144, + "model_types": [ + "chat", + "translation" + ] + }, + { + "name": "tencent/hy-mt2-1.8b-gguf", + "alias": [ + "tencent/Hy-MT2-1.8B-GGUF", + "Hy-MT2-1.8B-GGUF", + "hy-mt2-1.8b-gguf" + ], + "max_tokens": 262144, + "model_types": [ + "chat", + "translation" + ] + }, + { + "name": "tencent/hy-mt2-30b-a3b-fp8", + "alias": [ + "tencent/Hy-MT2-30B-A3B-FP8", + "Hy-MT2-30B-A3B-FP8", + "hy-mt2-30b-a3b-fp8" + ], + "max_tokens": 262144, + "model_types": [ + "chat", + "translation" + ] + }, + { + "name": "tencent/hy-mt2-7b-fp8", + "alias": [ + "tencent/Hy-MT2-7B-FP8", + "Hy-MT2-7B-FP8", + "hy-mt2-7b-fp8" + ], + "max_tokens": 262144, + "model_types": [ + "chat", + "translation" + ] + }, + { + "name": "tencent/hy-mt2-1.8b-fp8", + "alias": [ + "tencent/Hy-MT2-1.8B-FP8", + "Hy-MT2-1.8B-FP8", + "hy-mt2-1.8b-fp8" + ], + "max_tokens": 262144, + "model_types": [ + "chat", + "translation" + ] + }, + { + "name": "tencent/hy-mt2-1.8b", + "alias": [ + "tencent/Hy-MT2-1.8B", + "Hy-MT2-1.8B", + "hy-mt2-1.8b" + ], + "max_tokens": 262144, + "model_types": [ + "chat", + "translation" + ] + }, + { + "name": "tencent/hy-mt2-7b", + "alias": [ + "tencent/Hy-MT2-7B", + "Hy-MT2-7B", + "hy-mt2-7b" + ], + "max_tokens": 262144, + "model_types": [ + "chat", + "translation" + ] + }, + { + "name": "tencent/hy-mt2-30b-a3b", + "alias": [ + "tencent/Hy-MT2-30B-A3B", + "Hy-MT2-30B-A3B", + "hy-mt2-30b-a3b" + ], + "max_tokens": 262144, + "model_types": [ + "chat", + "translation" + ] + }, + { + "name": "tencent/hy-world-2.0", + "alias": [ + "tencent/HY-World-2.0", + "HY-World-2.0", + "hy-world-2.0" + ], + "model_types": [ + "3d_generation" + ] + }, + { + "name": "tencent/hy-omniweaving", + "alias": [ + "tencent/HY-OmniWeaving", + "HY-OmniWeaving", + "hy-omniweaving" + ], + "model_types": [ + "video_generation" + ] + }, + { + "name": "tencent/hy-mt1.5-1.8b-2bit", + "alias": [ + "tencent/Hy-MT1.5-1.8B-2bit", + "Hy-MT1.5-1.8B-2bit", + "hy-mt1.5-1.8b-2bit" + ], + "max_tokens": 262144, + "model_types": [ + "chat", + "translation" + ] + }, + { + "name": "tencent/hy-mt1.5-1.8b-2bit-gguf", + "alias": [ + "tencent/Hy-MT1.5-1.8B-2bit-GGUF", + "Hy-MT1.5-1.8B-2bit-GGUF", + "hy-mt1.5-1.8b-2bit-gguf" + ], + "max_tokens": 262144, + "model_types": [ + "chat", + "translation" + ] + }, + { + "name": "tencent/points-seeker", + "alias": [ + "tencent/POINTS-Seeker", + "POINTS-Seeker", + "points-seeker" + ], + "max_tokens": 262144, + "model_types": [ + "chat", + "vision", + "image2text" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "tencent/hy-embodied-0.5-x", + "alias": [ + "tencent/HY-Embodied-0.5-X", + "HY-Embodied-0.5-X", + "hy-embodied-0.5-x" + ], + "max_tokens": 262144, + "model_types": [ + "chat", + "vision", + "image2text" + ] + }, + { + "name": "tencent/hy3-preview-base", + "alias": [ + "tencent/Hy3-preview-Base", + "Hy3-preview-Base", + "hy3-preview-base" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "tencent/hy3-preview", + "alias": [ + "tencent/Hy3-preview", + "Hy3-preview", + "hy3-preview" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "tencent/unified_audio_schema", + "alias": [ + "tencent/Unified_Audio_Schema", + "Unified_Audio_Schema", + "unified_audio_schema" + ], + "max_tokens": 262144, + "model_types": [ + "chat", + "audio", + "asr" + ] + }, + { + "name": "tencent/disca", + "alias": [ + "tencent/DisCa", + "DisCa", + "disca" + ], + "model_types": [ + "other" + ] + }, + { + "name": "tencent/hy-embodied-0.5", + "alias": [ + "tencent/HY-Embodied-0.5", + "HY-Embodied-0.5", + "hy-embodied-0.5" + ], + "max_tokens": 262144, + "model_types": [ + "chat", + "vision", + "image2text" + ] + }, + { + "name": "tencent/unicom-unified-multimodal-modeling-via-compressed-continuous-semantic-representations", + "alias": [ + "tencent/Unicom-Unified-Multimodal-Modeling-via-Compressed-Continuous-Semantic-Representations", + "Unicom-Unified-Multimodal-Modeling-via-Compressed-Continuous-Semantic-Representations", + "unicom-unified-multimodal-modeling-via-compressed-continuous-semantic-representations" + ], + "model_types": [ + "image" + ] + }, + { + "name": "tencent/sequential-hidden-decoding-8b-n8-instruct", + "alias": [ + "tencent/Sequential-Hidden-Decoding-8B-n8-Instruct", + "Sequential-Hidden-Decoding-8B-n8-Instruct", + "sequential-hidden-decoding-8b-n8-instruct" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "tencent/versavit", + "alias": [ + "tencent/VersaViT", + "VersaViT", + "versavit" + ], + "model_types": [ + "vision" + ] + }, + { + "name": "tencent/covo-audio-chat", + "alias": [ + "tencent/Covo-Audio-Chat", + "Covo-Audio-Chat", + "covo-audio-chat" + ], + "max_tokens": 262144, + "model_types": [ + "chat", + "audio", + "asr", + "tts" + ] + }, + { + "name": "tencent/sequential-hidden-decoding-8b-n8", + "alias": [ + "tencent/Sequential-Hidden-Decoding-8B-n8", + "Sequential-Hidden-Decoding-8B-n8", + "sequential-hidden-decoding-8b-n8" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "tencent/penguin-vl-2b", + "alias": [ + "tencent/Penguin-VL-2B", + "Penguin-VL-2B", + "penguin-vl-2b" + ], + "max_tokens": 262144, + "model_types": [ + "chat", + "vision", + "image2text" + ] + }, + { + "name": "tencent/penguin-vl-8b", + "alias": [ + "tencent/Penguin-VL-8B", + "Penguin-VL-8B", + "penguin-vl-8b" + ], + "max_tokens": 262144, + "model_types": [ + "chat", + "vision", + "image2text" + ] + }, + { + "name": "tencent/points-gui-g", + "alias": [ + "tencent/POINTS-GUI-G", + "POINTS-GUI-G", + "points-gui-g" + ], + "max_tokens": 262144, + "model_types": [ + "chat", + "vision", + "image2text" + ] + }, + { + "name": "tencent/sequential-hidden-decoding-8b-n2", + "alias": [ + "tencent/Sequential-Hidden-Decoding-8B-n2", + "Sequential-Hidden-Decoding-8B-n2", + "sequential-hidden-decoding-8b-n2" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "tencent/sequential-hidden-decoding-8b-n4", + "alias": [ + "tencent/Sequential-Hidden-Decoding-8B-n4", + "Sequential-Hidden-Decoding-8B-n4", + "sequential-hidden-decoding-8b-n4" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "tencent/penguin-encoder", + "alias": [ + "tencent/Penguin-Encoder", + "Penguin-Encoder", + "penguin-encoder" + ], + "model_types": [ + "embedding", + "vision" + ] + }, + { + "name": "tencent/hy-worldplay", + "alias": [ + "tencent/HY-WorldPlay", + "HY-WorldPlay", + "hy-worldplay" + ], + "model_types": [ + "video_generation" + ] + }, + { + "name": "tencent/hy-wu", + "alias": [ + "tencent/HY-WU", + "HY-WU", + "hy-wu" + ], + "model_types": [ + "image" + ] + }, + { + "name": "tencent/songgeneration", + "alias": [ + "tencent/SongGeneration", + "SongGeneration", + "songgeneration" + ], + "model_types": [ + "audio_generation" + ] + }, + { + "name": "tencent/stabletoken", + "alias": [ + "tencent/StableToken", + "StableToken", + "stabletoken" + ], + "model_types": [ + "audio_codec" + ] + }, + { + "name": "tencent/youtu-llm-2b", + "alias": [ + "tencent/Youtu-LLM-2B", + "Youtu-LLM-2B", + "youtu-llm-2b" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "tencent/youtu-llm-2b-base", + "alias": [ + "tencent/Youtu-LLM-2B-Base", + "Youtu-LLM-2B-Base", + "youtu-llm-2b-base" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "tencent/youtu-vl-4b-instruct-gguf", + "alias": [ + "tencent/Youtu-VL-4B-Instruct-GGUF", + "Youtu-VL-4B-Instruct-GGUF", + "youtu-vl-4b-instruct-gguf" + ], + "max_tokens": 262144, + "model_types": [ + "chat", + "vision", + "image2text" + ] + }, + { + "name": "tencent/youtu-vl-4b-instruct", + "alias": [ + "tencent/Youtu-VL-4B-Instruct", + "Youtu-VL-4B-Instruct", + "youtu-vl-4b-instruct" + ], + "max_tokens": 262144, + "model_types": [ + "chat", + "vision", + "image2text" + ] + }, + { + "name": "tencent/kalm-embedding-gemma3-12b-2511", + "alias": [ + "tencent/KaLM-Embedding-Gemma3-12B-2511", + "KaLM-Embedding-Gemma3-12B-2511", + "kalm-embedding-gemma3-12b-2511" + ], + "model_types": [ + "embedding" + ] + }, + { + "name": "tencent/hy3d-bench", + "alias": [ + "tencent/HY3D-Bench", + "HY3D-Bench", + "hy3d-bench" + ], + "model_types": [ + "3d_generation" + ] + }, + { + "name": "tencent/youtu-hichunk", + "alias": [ + "tencent/Youtu-HiChunk", + "Youtu-HiChunk", + "youtu-hichunk" + ], + "model_types": [ + "embedding", + "vision" + ] + }, + { + "name": "tencent/hunyuanimage-3.0-instruct-distil", + "alias": [ + "tencent/HunyuanImage-3.0-Instruct-Distil", + "HunyuanImage-3.0-Instruct-Distil", + "hunyuanimage-3.0-instruct-distil" + ], + "model_types": [ + "image_edit" + ] + }, + { + "name": "tencent/hunyuanimage-3.0-instruct", + "alias": [ + "tencent/HunyuanImage-3.0-Instruct", + "HunyuanImage-3.0-Instruct", + "hunyuanimage-3.0-instruct" + ], + "model_types": [ + "image_edit" + ] + }, + { + "name": "tencent/youtu-parsing", + "alias": [ + "tencent/Youtu-Parsing", + "Youtu-Parsing", + "youtu-parsing" + ], + "max_tokens": 262144, + "model_types": [ + "vision", + "image2text" + ] + }, + { + "name": "tencent/hunyuanimage-3.0", + "alias": [ + "tencent/HunyuanImage-3.0", + "HunyuanImage-3.0", + "hunyuanimage-3.0" + ], + "model_types": [ + "image" + ] + }, + { + "name": "tencent/hy-video-prfl", + "alias": [ + "tencent/HY-Video-PRFL", + "HY-Video-PRFL", + "hy-video-prfl" + ], + "model_types": [ + "video_generation" + ] + }, + { + "name": "tencent/hunyuanocr", + "alias": [ + "tencent/HunyuanOCR", + "HunyuanOCR", + "hunyuanocr" + ], + "model_types": [ + "ocr", + "vision", + "image2text" + ] + }, + { + "name": "tencent/tcandon-router", + "alias": [ + "tencent/TCAndon-Router", + "TCAndon-Router", + "tcandon-router" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "tencent/hy-mt1.5-7b-gguf", + "alias": [ + "tencent/HY-MT1.5-7B-GGUF", + "HY-MT1.5-7B-GGUF", + "hy-mt1.5-7b-gguf" + ], + "max_tokens": 262144, + "model_types": [ + "chat", + "translation" + ] + }, + { + "name": "tencent/hy-mt1.5-1.8b-gguf", + "alias": [ + "tencent/HY-MT1.5-1.8B-GGUF", + "HY-MT1.5-1.8B-GGUF", + "hy-mt1.5-1.8b-gguf" + ], + "max_tokens": 262144, + "model_types": [ + "chat", + "translation" + ] + }, + { + "name": "tencent/youtu-llm-2b-gguf", + "alias": [ + "tencent/Youtu-LLM-2B-GGUF", + "Youtu-LLM-2B-GGUF", + "youtu-llm-2b-gguf" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "tencent/hy-mt1.5-7b-gptq-int4", + "alias": [ + "tencent/HY-MT1.5-7B-GPTQ-Int4", + "HY-MT1.5-7B-GPTQ-Int4", + "hy-mt1.5-7b-gptq-int4" + ], + "max_tokens": 262144, + "model_types": [ + "chat", + "translation" + ] + }, + { + "name": "tencent/hy-mt1.5-7b-fp8", + "alias": [ + "tencent/HY-MT1.5-7B-FP8", + "HY-MT1.5-7B-FP8", + "hy-mt1.5-7b-fp8" + ], + "max_tokens": 262144, + "model_types": [ + "chat", + "translation" + ] + }, + { + "name": "tencent/hy-mt1.5-1.8b-gptq-int4", + "alias": [ + "tencent/HY-MT1.5-1.8B-GPTQ-Int4", + "HY-MT1.5-1.8B-GPTQ-Int4", + "hy-mt1.5-1.8b-gptq-int4" + ], + "max_tokens": 262144, + "model_types": [ + "chat", + "translation" + ] + }, + { + "name": "tencent/hy-mt1.5-1.8b-fp8", + "alias": [ + "tencent/HY-MT1.5-1.8B-FP8", + "HY-MT1.5-1.8B-FP8", + "hy-mt1.5-1.8b-fp8" + ], + "max_tokens": 262144, + "model_types": [ + "chat", + "translation" + ] + }, + { + "name": "tencent/hy-mt1.5-1.8b", + "alias": [ + "tencent/HY-MT1.5-1.8B", + "HY-MT1.5-1.8B", + "hy-mt1.5-1.8b" + ], + "max_tokens": 262144, + "model_types": [ + "chat", + "translation" + ] + }, + { + "name": "tencent/wedlm-8b-instruct", + "alias": [ + "tencent/WeDLM-8B-Instruct", + "WeDLM-8B-Instruct", + "wedlm-8b-instruct" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "tencent/hy-motion-1.0", + "alias": [ + "tencent/HY-Motion-1.0", + "HY-Motion-1.0", + "hy-motion-1.0" + ], + "model_types": [ + "3d_generation" + ] + }, + { + "name": "tencent/hunyuan-mt-7b", + "alias": [ + "tencent/Hunyuan-MT-7B", + "Hunyuan-MT-7B", + "hunyuan-mt-7b" + ], + "max_tokens": 262144, + "model_types": [ + "chat", + "translation" + ] + }, + { + "name": "tencent/wedlm-7b-instruct", + "alias": [ + "tencent/WeDLM-7B-Instruct", + "WeDLM-7B-Instruct", + "wedlm-7b-instruct" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "tencent/wedlm-7b-base", + "alias": [ + "tencent/WeDLM-7B-Base", + "WeDLM-7B-Base", + "wedlm-7b-base" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "tencent/wedlm-8b-base", + "alias": [ + "tencent/WeDLM-8B-Base", + "WeDLM-8B-Base", + "wedlm-8b-base" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "tencent/hunyuanvideo-1.5", + "alias": [ + "tencent/HunyuanVideo-1.5", + "HunyuanVideo-1.5", + "hunyuanvideo-1.5" + ], + "model_types": [ + "video_generation" + ] + }, + { + "name": "tencent/youtu-embedding", + "alias": [ + "tencent/Youtu-Embedding", + "Youtu-Embedding", + "youtu-embedding" + ], + "model_types": [ + "embedding" + ] + }, + { + "name": "tencent/drive-rl", + "alias": [ + "tencent/DRIVE-RL", + "DRIVE-RL", + "drive-rl" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "tencent/drive-sft", + "alias": [ + "tencent/DRIVE-SFT", + "DRIVE-SFT", + "drive-sft" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "tencent/deepseek-v3.1-terminus-w4afp8", + "alias": [ + "tencent/DeepSeek-V3.1-Terminus-W4AFP8", + "DeepSeek-V3.1-Terminus-W4AFP8", + "deepseek-v3.1-terminus-w4afp8" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "tencent/hunyuan-4b-instruct", + "alias": [ + "tencent/Hunyuan-4B-Instruct", + "Hunyuan-4B-Instruct", + "hunyuan-4b-instruct" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "tencent/hunyuanworld-mirror", + "alias": [ + "tencent/HunyuanWorld-Mirror", + "HunyuanWorld-Mirror", + "hunyuanworld-mirror" + ], + "model_types": [ + "3d_generation" + ] + }, + { + "name": "tencent/songprep-7b", + "alias": [ + "tencent/SongPrep-7B", + "SongPrep-7B", + "songprep-7b" + ], + "model_types": [ + "asr" + ] + }, + { + "name": "tencent/hunyuanworld-1", + "alias": [ + "tencent/HunyuanWorld-1", + "HunyuanWorld-1", + "hunyuanworld-1" + ], + "model_types": [ + "3d_generation" + ] + }, + { + "name": "tencent/hunyuan3d-part", + "alias": [ + "tencent/Hunyuan3D-Part", + "Hunyuan3D-Part", + "hunyuan3d-part" + ], + "model_types": [ + "3d_generation" + ] + }, + { + "name": "tencent/hunyuanworld-voyager", + "alias": [ + "tencent/HunyuanWorld-Voyager", + "HunyuanWorld-Voyager", + "hunyuanworld-voyager" + ], + "model_types": [ + "video_generation" + ] + }, + { + "name": "tencent/hunyuan3d-2mv", + "alias": [ + "tencent/Hunyuan3D-2mv", + "Hunyuan3D-2mv", + "hunyuan3d-2mv" + ], + "model_types": [ + "3d_generation" + ] + }, + { + "name": "tencent/hunyuan3d-omni", + "alias": [ + "tencent/Hunyuan3D-Omni", + "Hunyuan3D-Omni", + "hunyuan3d-omni" + ], + "model_types": [ + "3d_generation" + ] + }, + { + "name": "tencent/hunyuan3d-2mini", + "alias": [ + "tencent/Hunyuan3D-2mini", + "Hunyuan3D-2mini", + "hunyuan3d-2mini" + ], + "model_types": [ + "3d_generation" + ] + }, + { + "name": "tencent/hunyuan3d-2.1", + "alias": [ + "tencent/Hunyuan3D-2.1", + "Hunyuan3D-2.1", + "hunyuan3d-2.1" + ], + "model_types": [ + "3d_generation" + ] + }, + { + "name": "tencent/hunyuan3d-2", + "alias": [ + "tencent/Hunyuan3D-2", + "Hunyuan3D-2", + "hunyuan3d-2" + ], + "model_types": [ + "3d_generation" + ] + }, + { + "name": "tencent/hunyuan3d-1", + "alias": [ + "tencent/Hunyuan3D-1", + "Hunyuan3D-1", + "hunyuan3d-1" + ], + "model_types": [ + "3d_generation" + ] + }, + { + "name": "tencent/hunyuanimage-2.1", + "alias": [ + "tencent/HunyuanImage-2.1", + "HunyuanImage-2.1", + "hunyuanimage-2.1" + ], + "model_types": [ + "image" + ] + }, + { + "name": "tencent/hunyuanvideo-foley", + "alias": [ + "tencent/HunyuanVideo-Foley", + "HunyuanVideo-Foley", + "hunyuanvideo-foley" + ], + "model_types": [ + "audio_generation" + ] + }, + { + "name": "tencent/srpo", + "alias": [ + "tencent/SRPO", + "SRPO", + "srpo" + ], + "model_types": [ + "image" + ] + }, + { + "name": "tencent/points-reader", + "alias": [ + "tencent/POINTS-Reader", + "POINTS-Reader", + "points-reader" + ], + "max_tokens": 262144, + "model_types": [ + "vision", + "image2text" + ] + }, + { + "name": "tencent/hunyuan-mt-chimera-7b", + "alias": [ + "tencent/Hunyuan-MT-Chimera-7B", + "Hunyuan-MT-Chimera-7B", + "hunyuan-mt-chimera-7b" + ], + "max_tokens": 262144, + "model_types": [ + "chat", + "translation" + ] + }, + { + "name": "tencent/hunyuan-mt-chimera-7b-fp8", + "alias": [ + "tencent/Hunyuan-MT-Chimera-7B-fp8", + "Hunyuan-MT-Chimera-7B-fp8", + "hunyuan-mt-chimera-7b-fp8" + ], + "max_tokens": 262144, + "model_types": [ + "chat", + "translation" + ] + }, + { + "name": "tencent/hunyuan-mt-7b-fp8", + "alias": [ + "tencent/Hunyuan-MT-7B-fp8", + "Hunyuan-MT-7B-fp8", + "hunyuan-mt-7b-fp8" + ], + "max_tokens": 262144, + "model_types": [ + "chat", + "translation" + ] + }, + { + "name": "tencent/hunyuan-0.5b-instruct-gptq-int4", + "alias": [ + "tencent/Hunyuan-0.5B-Instruct-GPTQ-Int4", + "Hunyuan-0.5B-Instruct-GPTQ-Int4", + "hunyuan-0.5b-instruct-gptq-int4" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "tencent/hunyuan-7b-instruct-fp8", + "alias": [ + "tencent/Hunyuan-7B-Instruct-FP8", + "Hunyuan-7B-Instruct-FP8", + "hunyuan-7b-instruct-fp8" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "tencent/hunyuan-7b-instruct-gptq-int4", + "alias": [ + "tencent/Hunyuan-7B-Instruct-GPTQ-Int4", + "Hunyuan-7B-Instruct-GPTQ-Int4", + "hunyuan-7b-instruct-gptq-int4" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "tencent/hunyuan-7b-instruct", + "alias": [ + "tencent/Hunyuan-7B-Instruct", + "Hunyuan-7B-Instruct", + "hunyuan-7b-instruct" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "tencent/hunyuan-7b-instruct-awq-int4", + "alias": [ + "tencent/Hunyuan-7B-Instruct-AWQ-Int4", + "Hunyuan-7B-Instruct-AWQ-Int4", + "hunyuan-7b-instruct-awq-int4" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "tencent/hunyuan-7b-pretrain", + "alias": [ + "tencent/Hunyuan-7B-Pretrain", + "Hunyuan-7B-Pretrain", + "hunyuan-7b-pretrain" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "tencent/hunyuan-4b-instruct-gptq-int4", + "alias": [ + "tencent/Hunyuan-4B-Instruct-GPTQ-Int4", + "Hunyuan-4B-Instruct-GPTQ-Int4", + "hunyuan-4b-instruct-gptq-int4" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "tencent/hunyuan-4b-instruct-awq-int4", + "alias": [ + "tencent/Hunyuan-4B-Instruct-AWQ-Int4", + "Hunyuan-4B-Instruct-AWQ-Int4", + "hunyuan-4b-instruct-awq-int4" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "tencent/hunyuan-1.8b-instruct-gptq-int4", + "alias": [ + "tencent/Hunyuan-1.8B-Instruct-GPTQ-Int4", + "Hunyuan-1.8B-Instruct-GPTQ-Int4", + "hunyuan-1.8b-instruct-gptq-int4" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "tencent/hunyuan-1.8b-instruct-awq-int4", + "alias": [ + "tencent/Hunyuan-1.8B-Instruct-AWQ-Int4", + "Hunyuan-1.8B-Instruct-AWQ-Int4", + "hunyuan-1.8b-instruct-awq-int4" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "tencent/hunyuan-0.5b-instruct-fp8", + "alias": [ + "tencent/Hunyuan-0.5B-Instruct-FP8", + "Hunyuan-0.5B-Instruct-FP8", + "hunyuan-0.5b-instruct-fp8" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "tencent/hunyuan-1.8b-instruct-fp8", + "alias": [ + "tencent/Hunyuan-1.8B-Instruct-FP8", + "Hunyuan-1.8B-Instruct-FP8", + "hunyuan-1.8b-instruct-fp8" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "tencent/hunyuan-0.5b-instruct-awq-int4", + "alias": [ + "tencent/Hunyuan-0.5B-Instruct-AWQ-Int4", + "Hunyuan-0.5B-Instruct-AWQ-Int4", + "hunyuan-0.5b-instruct-awq-int4" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "tencent/hunyuan-4b-instruct-fp8", + "alias": [ + "tencent/Hunyuan-4B-Instruct-FP8", + "Hunyuan-4B-Instruct-FP8", + "hunyuan-4b-instruct-fp8" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "tencent/hunyuan-a13b-instruct", + "alias": [ + "tencent/Hunyuan-A13B-Instruct", + "Hunyuan-A13B-Instruct", + "hunyuan-a13b-instruct" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "tencent/hunyuan-gamecraft-1.0", + "alias": [ + "tencent/Hunyuan-GameCraft-1.0", + "Hunyuan-GameCraft-1.0", + "hunyuan-gamecraft-1.0" + ], + "model_types": [ + "video_generation" + ] + }, + { + "name": "tencent/dogr", + "alias": [ + "tencent/DOGR", + "DOGR", + "dogr" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "tencent/hunyuan-4b-pretrain", + "alias": [ + "tencent/Hunyuan-4B-Pretrain", + "Hunyuan-4B-Pretrain", + "hunyuan-4b-pretrain" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "tencent/hunyuan-1.8b-pretrain", + "alias": [ + "tencent/Hunyuan-1.8B-Pretrain", + "Hunyuan-1.8B-Pretrain", + "hunyuan-1.8b-pretrain" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "tencent/hunyuan-1.8b-instruct", + "alias": [ + "tencent/Hunyuan-1.8B-Instruct", + "Hunyuan-1.8B-Instruct", + "hunyuan-1.8b-instruct" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "tencent/hunyuan-0.5b-pretrain", + "alias": [ + "tencent/Hunyuan-0.5B-Pretrain", + "Hunyuan-0.5B-Pretrain", + "hunyuan-0.5b-pretrain" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "tencent/hunyuan-0.5b-instruct", + "alias": [ + "tencent/Hunyuan-0.5B-Instruct", + "Hunyuan-0.5B-Instruct", + "hunyuan-0.5b-instruct" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "tencent/depthcrafter", + "alias": [ + "tencent/DepthCrafter", + "DepthCrafter", + "depthcrafter" + ], + "model_types": [ + "depth_estimation" + ] + }, + { + "name": "tencent/hunyuan-7b-instruct-0124", + "alias": [ + "tencent/Hunyuan-7B-Instruct-0124", + "Hunyuan-7B-Instruct-0124", + "hunyuan-7b-instruct-0124" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "tencent/mimicmotion", + "alias": [ + "tencent/MimicMotion", + "MimicMotion", + "mimicmotion" + ], + "model_types": [ + "video_generation" + ] + }, + { + "name": "tencent/hunyuan-a13b-instruct-gguf", + "alias": [ + "tencent/Hunyuan-A13B-Instruct-GGUF", + "Hunyuan-A13B-Instruct-GGUF", + "hunyuan-a13b-instruct-gguf" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "tencent/hunyuan-a13b-instruct-gptq-int4", + "alias": [ + "tencent/Hunyuan-A13B-Instruct-GPTQ-Int4", + "Hunyuan-A13B-Instruct-GPTQ-Int4", + "hunyuan-a13b-instruct-gptq-int4" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "tencent/hunyuan-a13b-pretrain", + "alias": [ + "tencent/Hunyuan-A13B-Pretrain", + "Hunyuan-A13B-Pretrain", + "hunyuan-a13b-pretrain" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "tencent/hunyuan-a13b-instruct-fp8", + "alias": [ + "tencent/Hunyuan-A13B-Instruct-FP8", + "Hunyuan-A13B-Instruct-FP8", + "hunyuan-a13b-instruct-fp8" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "tencent/hunyuan-7b-pretrain-0124", + "alias": [ + "tencent/Hunyuan-7B-Pretrain-0124", + "Hunyuan-7B-Pretrain-0124", + "hunyuan-7b-pretrain-0124" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "tencent/hunyuancustom", + "alias": [ + "tencent/HunyuanCustom", + "HunyuanCustom", + "hunyuancustom" + ], + "model_types": [ + "video_generation" + ] + }, + { + "name": "tencent/hunyuanvideo-avatar", + "alias": [ + "tencent/HunyuanVideo-Avatar", + "HunyuanVideo-Avatar", + "hunyuanvideo-avatar" + ], + "model_types": [ + "video_generation" + ] + }, + { + "name": "tencent/hunyuanportrait", + "alias": [ + "tencent/HunyuanPortrait", + "HunyuanPortrait", + "hunyuanportrait" + ], + "model_types": [ + "video_generation" + ] + }, + { + "name": "tencent/instantcharacter", + "alias": [ + "tencent/InstantCharacter", + "InstantCharacter", + "instantcharacter" + ], + "model_types": [ + "image" + ] + }, + { + "name": "tencent/hunyuanvideo-i2v", + "alias": [ + "tencent/HunyuanVideo-I2V", + "HunyuanVideo-I2V", + "hunyuanvideo-i2v" + ], + "model_types": [ + "video_generation" + ] + }, + { + "name": "tencent/hunyuanvideo", + "alias": [ + "tencent/HunyuanVideo", + "HunyuanVideo", + "hunyuanvideo" + ], + "model_types": [ + "video_generation" + ] + }, + { + "name": "tencent/tencent-hunyuan-large", + "alias": [ + "tencent/Tencent-Hunyuan-Large", + "Tencent-Hunyuan-Large", + "tencent-hunyuan-large" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "tencent/hunyuanvideo-promptrewrite", + "alias": [ + "tencent/HunyuanVideo-PromptRewrite", + "HunyuanVideo-PromptRewrite", + "hunyuanvideo-promptrewrite" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "us.amazon.nova-pro-v1:0", + "alias": [ + "amazon.nova-pro-v1:0" + ], + "max_tokens": 300000, + "model_types": [ + "chat" + ] + }, + { + "name": "us.amazon.nova-lite-v1:0", + "alias": [ + "amazon.nova-lite-v1:0", + "apac.amazon.nova-lite-v1:0" + ], + "max_tokens": 300000, + "model_types": [ + "chat" + ] + }, + { + "name": "us.amazon.nova-micro-v1:0", + "alias": [ + "amazon.nova-micro-v1:0" + ], + "max_tokens": 300000, + "model_types": [ + "chat" + ] + }, + { + "name": "us.anthropic.claude-3-5-sonnet-20241022-v2:0", + "alias": [ + "anthropic.claude-3-5-sonnet-20241022-v2:0", + "apac.anthropic.claude-3-5-sonnet-20241022-v2:0" + ], + "max_tokens": 200000, + "model_types": [ + "chat" + ] + }, + { + "name": "us.anthropic.claude-3-5-haiku-20241022-v1:0", + "alias": [ + "anthropic.claude-3-5-haiku-20241022-v1:0" + ], + "max_tokens": 200000, + "model_types": [ + "chat" + ] + }, + { + "name": "amazon.titan-embed-text-v1", + "alias": [ + ], + "max_tokens": 8192, + "model_types": [ + "embedding" + ] + }, + { + "name": "stability.stable-diffusion-xl-v1", + "alias": [ + "1024-x-1024/50-steps/stability.stable-diffusion-xl-v1" + ], + "max_tokens": 77, + "model_types": [ + "image_generation" + ] + }, + { + "name": "azure/gpt-4o", + "alias": [ + "azure/global-standard/gpt-4o-2024-08-06", + "azure/eu/gpt-4o" + ], + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "azure/gpt-4o-mini", + "alias": [ + "azure/global-standard/gpt-4o-mini" + ], + "max_tokens": 128000, + "model_types": [ + "chat" + ] + }, + { + "name": "azure/o1-preview", + "alias": [ + "azure/eu/o1-preview" + ], + "max_tokens": 128000, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "azure/o3-mini", + "alias": [ + "azure/eu/o3-mini" + ], + "max_tokens": 200000, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "xai/grok-2-1212", + "alias": [ + "grok-2-1212", + "grok-2" + ], + "max_tokens": 131072, + "model_types": [ + "chat" + ] + }, + { + "name": "xai/grok-2-vision-1212", + "alias": [ + "grok-2-vision" + ], + "max_tokens": 131072, + "model_types": [ + "chat" + ] + }, + { + "name": "xai/grok-beta", + "alias": [ + "grok-beta" + ], + "max_tokens": 131072, + "model_types": [ + "chat" + ] + }, + { + "name": "meta-llama/prompt-guard-86m", + "alias": [ + "meta-llama/Prompt-Guard-86M", + "Prompt-Guard-86M", + "prompt-guard-86m" + ], + "model_types": [ + "moderation" + ] + }, + { + "name": "meta-llama/meta-llama-3-8b-instruct", + "alias": [ + "meta-llama/Meta-Llama-3-8B-Instruct", + "Meta-Llama-3-8B-Instruct", + "meta-llama-3-8b-instruct" + ], + "max_tokens": 8192, + "model_types": [ + "chat" + ] + }, + { + "name": "meta-llama/meta-llama-3-70b-instruct", + "alias": [ + "meta-llama/Meta-Llama-3-70B-Instruct", + "Meta-Llama-3-70B-Instruct", + "meta-llama-3-70b-instruct" + ], + "max_tokens": 8192, + "model_types": [ + "chat" + ] + }, + { + "name": "meta-llama/llama-4-maverick-17b-128e-instruct", + "alias": [ + "meta-llama/Llama-4-Maverick-17B-128E-Instruct", + "Llama-4-Maverick-17B-128E-Instruct", + "llama-4-maverick-17b-128e-instruct" + ], + "max_tokens": 1048576, + "model_types": [ + "chat", + "vision", + "image2text" + ] + }, + { + "name": "meta-llama/llama-4-maverick-17b-128e-instruct-fp8", + "alias": [ + "meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8", + "Llama-4-Maverick-17B-128E-Instruct-FP8", + "llama-4-maverick-17b-128e-instruct-fp8" + ], + "max_tokens": 1048576, + "model_types": [ + "chat", + "vision", + "image2text" + ] + }, + { + "name": "meta-llama/llama-4-scout-17b-16e-instruct", + "alias": [ + "meta-llama/Llama-4-Scout-17B-16E-Instruct", + "Llama-4-Scout-17B-16E-Instruct", + "llama-4-scout-17b-16e-instruct" + ], + "max_tokens": 10485760, + "model_types": [ + "chat", + "vision", + "image2text" + ] + }, + { + "name": "meta-llama/llama-4-maverick-17b-128e-instruct-original", + "alias": [ + "meta-llama/Llama-4-Maverick-17B-128E-Instruct-Original", + "Llama-4-Maverick-17B-128E-Instruct-Original", + "llama-4-maverick-17b-128e-instruct-original" + ], + "max_tokens": 1048576, + "model_types": [ + "chat", + "vision", + "image2text" + ] + }, + { + "name": "meta-llama/llama-guard-4-12b", + "alias": [ + "meta-llama/Llama-Guard-4-12B", + "Llama-Guard-4-12B", + "llama-guard-4-12b" + ], + "max_tokens": 131072, + "model_types": [ + "moderation", + "vision", + "image2text" + ] + }, + { + "name": "meta-llama/llama-prompt-guard-2-86m", + "alias": [ + "meta-llama/Llama-Prompt-Guard-2-86M", + "Llama-Prompt-Guard-2-86M", + "llama-prompt-guard-2-86m" + ], + "model_types": [ + "moderation" + ] + }, + { + "name": "meta-llama/llama-prompt-guard-2-22m", + "alias": [ + "meta-llama/Llama-Prompt-Guard-2-22M", + "Llama-Prompt-Guard-2-22M", + "llama-prompt-guard-2-22m" + ], + "model_types": [ + "moderation" + ] + }, + { + "name": "meta-llama/llama-4-maverick-17b-128e", + "alias": [ + "meta-llama/Llama-4-Maverick-17B-128E", + "Llama-4-Maverick-17B-128E", + "llama-4-maverick-17b-128e" + ], + "max_tokens": 1048576, + "model_types": [ + "chat", + "vision", + "image2text" + ] + }, + { + "name": "meta-llama/llama-4-scout-17b-16e", + "alias": [ + "meta-llama/Llama-4-Scout-17B-16E", + "Llama-4-Scout-17B-16E", + "llama-4-scout-17b-16e" + ], + "max_tokens": 10485760, + "model_types": [ + "chat", + "vision", + "image2text" + ] + }, + { + "name": "meta-llama/llama-4-maverick-17b-128e-original", + "alias": [ + "meta-llama/Llama-4-Maverick-17B-128E-Original", + "Llama-4-Maverick-17B-128E-Original", + "llama-4-maverick-17b-128e-original" + ], + "max_tokens": 1048576, + "model_types": [ + "chat", + "vision", + "image2text" + ] + }, + { + "name": "meta-llama/llama-4-scout-17b-16e-original", + "alias": [ + "meta-llama/Llama-4-Scout-17B-16E-Original", + "Llama-4-Scout-17B-16E-Original", + "llama-4-scout-17b-16e-original" + ], + "max_tokens": 10485760, + "model_types": [ + "chat", + "vision", + "image2text" + ] + }, + { + "name": "meta-llama/llama-4-maverick-17b-128e-instruct-fp8-original", + "alias": [ + "meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8-Original", + "Llama-4-Maverick-17B-128E-Instruct-FP8-Original", + "llama-4-maverick-17b-128e-instruct-fp8-original" + ], + "max_tokens": 1048576, + "model_types": [ + "chat", + "vision", + "image2text" + ] + }, + { + "name": "meta-llama/llama-4-scout-17b-16e-instruct-original", + "alias": [ + "meta-llama/Llama-4-Scout-17B-16E-Instruct-Original", + "Llama-4-Scout-17B-16E-Instruct-Original", + "llama-4-scout-17b-16e-instruct-original" + ], + "max_tokens": 10485760, + "model_types": [ + "chat", + "vision", + "image2text" + ] + }, + { + "name": "meta-llama/llama-3.2-90b-vision-instruct", + "alias": [ + "meta-llama/Llama-3.2-90B-Vision-Instruct", + "Llama-3.2-90B-Vision-Instruct", + "llama-3.2-90b-vision-instruct" + ], + "max_tokens": 131072, + "model_types": [ + "chat", + "vision", + "image2text" + ] + }, + { + "name": "meta-llama/llama-3.3-70b-instruct", + "alias": [ + "meta-llama/Llama-3.3-70B-Instruct", + "Llama-3.3-70B-Instruct", + "llama-3.3-70b-instruct" + ], + "max_tokens": 131072, + "model_types": [ + "chat" + ] + }, + { + "name": "meta-llama/llama-3.1-70b-instruct", + "alias": [ + "meta-llama/Llama-3.1-70B-Instruct", + "Llama-3.1-70B-Instruct", + "llama-3.1-70b-instruct" + ], + "max_tokens": 131072, + "model_types": [ + "chat" + ] + }, + { + "name": "meta-llama/llama-3.1-405b-fp8", + "alias": [ + "meta-llama/Llama-3.1-405B-FP8", + "Llama-3.1-405B-FP8", + "llama-3.1-405b-fp8" + ], + "max_tokens": 131072, + "model_types": [ + "chat" + ] + }, + { + "name": "meta-llama/llama-3.2-11b-vision-instruct", + "alias": [ + "meta-llama/Llama-3.2-11B-Vision-Instruct", + "Llama-3.2-11B-Vision-Instruct", + "llama-3.2-11b-vision-instruct" + ], + "max_tokens": 131072, + "model_types": [ + "chat", + "vision", + "image2text" + ] + }, + { + "name": "meta-llama/llama-3.2-3b-instruct-qlora_int4_eo8", + "alias": [ + "meta-llama/Llama-3.2-3B-Instruct-QLORA_INT4_EO8", + "Llama-3.2-3B-Instruct-QLORA_INT4_EO8", + "llama-3.2-3b-instruct-qlora_int4_eo8" + ], + "max_tokens": 131072, + "model_types": [ + "chat" + ] + }, + { + "name": "meta-llama/llama-3.2-3b-instruct-spinquant_int4_eo8", + "alias": [ + "meta-llama/Llama-3.2-3B-Instruct-SpinQuant_INT4_EO8", + "Llama-3.2-3B-Instruct-SpinQuant_INT4_EO8", + "llama-3.2-3b-instruct-spinquant_int4_eo8" + ], + "max_tokens": 131072, + "model_types": [ + "chat" + ] + }, + { + "name": "meta-llama/llama-3.2-1b-instruct-spinquant_int4_eo8", + "alias": [ + "meta-llama/Llama-3.2-1B-Instruct-SpinQuant_INT4_EO8", + "Llama-3.2-1B-Instruct-SpinQuant_INT4_EO8", + "llama-3.2-1b-instruct-spinquant_int4_eo8" + ], + "max_tokens": 131072, + "model_types": [ + "chat" + ] + }, + { + "name": "meta-llama/llama-3.2-1b-instruct-qlora_int4_eo8", + "alias": [ + "meta-llama/Llama-3.2-1B-Instruct-QLORA_INT4_EO8", + "Llama-3.2-1B-Instruct-QLORA_INT4_EO8", + "llama-3.2-1b-instruct-qlora_int4_eo8" + ], + "max_tokens": 131072, + "model_types": [ + "chat" + ] + }, + { + "name": "meta-llama/llama-guard-3-11b-vision", + "alias": [ + "meta-llama/Llama-Guard-3-11B-Vision", + "Llama-Guard-3-11B-Vision", + "llama-guard-3-11b-vision" + ], + "max_tokens": 131072, + "model_types": [ + "moderation", + "vision", + "image2text" + ] + }, + { + "name": "meta-llama/llama-3.2-1b", + "alias": [ + "meta-llama/Llama-3.2-1B", + "Llama-3.2-1B", + "llama-3.2-1b" + ], + "max_tokens": 131072, + "model_types": [ + "chat" + ] + }, + { + "name": "meta-llama/llama-3.2-1b-instruct", + "alias": [ + "meta-llama/Llama-3.2-1B-Instruct", + "Llama-3.2-1B-Instruct", + "llama-3.2-1b-instruct" + ], + "max_tokens": 131072, + "model_types": [ + "chat" + ] + }, + { + "name": "meta-llama/llama-3.2-3b", + "alias": [ + "meta-llama/Llama-3.2-3B", + "Llama-3.2-3B", + "llama-3.2-3b" + ], + "max_tokens": 131072, + "model_types": [ + "chat" + ] + }, + { + "name": "meta-llama/llama-3.2-3b-instruct", + "alias": [ + "meta-llama/Llama-3.2-3B-Instruct", + "Llama-3.2-3B-Instruct", + "llama-3.2-3b-instruct" + ], + "max_tokens": 131072, + "model_types": [ + "chat" + ] + }, + { + "name": "meta-llama/llama-3.1-8b", + "alias": [ + "meta-llama/Llama-3.1-8B", + "Llama-3.1-8B", + "llama-3.1-8b" + ], + "max_tokens": 131072, + "model_types": [ + "chat" + ] + }, + { + "name": "meta-llama/llama-guard-3-8b", + "alias": [ + "meta-llama/Llama-Guard-3-8B", + "Llama-Guard-3-8B", + "llama-guard-3-8b" + ], + "max_tokens": 131072, + "model_types": [ + "moderation" + ] + }, + { + "name": "meta-llama/meta-llama-3-70b", + "alias": [ + "meta-llama/Meta-Llama-3-70B", + "Meta-Llama-3-70B", + "meta-llama-3-70b" + ], + "max_tokens": 8192, + "model_types": [ + "chat" + ] + }, + { + "name": "meta-llama/meta-llama-3-8b", + "alias": [ + "meta-llama/Meta-Llama-3-8B", + "Meta-Llama-3-8B", + "meta-llama-3-8b" + ], + "max_tokens": 8192, + "model_types": [ + "chat" + ] + }, + { + "name": "meta-llama/llama-3.2-90b-vision", + "alias": [ + "meta-llama/Llama-3.2-90B-Vision", + "Llama-3.2-90B-Vision", + "llama-3.2-90b-vision" + ], + "max_tokens": 131072, + "model_types": [ + "chat", + "vision", + "image2text" + ] + }, + { + "name": "meta-llama/llama-3.2-11b-vision", + "alias": [ + "meta-llama/Llama-3.2-11B-Vision", + "Llama-3.2-11B-Vision", + "llama-3.2-11b-vision" + ], + "max_tokens": 131072, + "model_types": [ + "chat", + "vision", + "image2text" + ] + }, + { + "name": "meta-llama/llama-guard-3-1b", + "alias": [ + "meta-llama/Llama-Guard-3-1B", + "Llama-Guard-3-1B", + "llama-guard-3-1b" + ], + "max_tokens": 131072, + "model_types": [ + "moderation" + ] + }, + { + "name": "meta-llama/llama-guard-3-1b-int4", + "alias": [ + "meta-llama/Llama-Guard-3-1B-INT4", + "Llama-Guard-3-1B-INT4", + "llama-guard-3-1b-int4" + ], + "max_tokens": 131072, + "model_types": [ + "moderation" + ] + }, + { + "name": "meta-llama/llama-3.1-405b-instruct-fp8", + "alias": [ + "meta-llama/Llama-3.1-405B-Instruct-FP8", + "Llama-3.1-405B-Instruct-FP8", + "llama-3.1-405b-instruct-fp8" + ], + "max_tokens": 131072, + "model_types": [ + "chat" + ] + }, + { + "name": "meta-llama/llama-3.1-405b-instruct", + "alias": [ + "meta-llama/Llama-3.1-405B-Instruct", + "Llama-3.1-405B-Instruct", + "llama-3.1-405b-instruct" + ], + "max_tokens": 131072, + "model_types": [ + "chat" + ] + }, + { + "name": "meta-llama/llama-3.1-405b", + "alias": [ + "meta-llama/Llama-3.1-405B", + "Llama-3.1-405B", + "llama-3.1-405b" + ], + "max_tokens": 131072, + "model_types": [ + "chat" + ] + }, + { + "name": "meta-llama/llama-3.1-70b", + "alias": [ + "meta-llama/Llama-3.1-70B", + "Llama-3.1-70B", + "llama-3.1-70b" + ], + "max_tokens": 131072, + "model_types": [ + "chat" + ] + }, + { + "name": "meta-llama/llama-3.1-8b-instruct", + "alias": [ + "meta-llama/Llama-3.1-8B-Instruct", + "Llama-3.1-8B-Instruct", + "llama-3.1-8b-instruct" + ], + "max_tokens": 131072, + "model_types": [ + "chat" + ] + }, + { + "name": "meta-llama/llama-guard-3-8b-int8", + "alias": [ + "meta-llama/Llama-Guard-3-8B-INT8", + "Llama-Guard-3-8B-INT8", + "llama-guard-3-8b-int8" + ], + "max_tokens": 131072, + "model_types": [ + "moderation" + ] + }, + { + "name": "meta-llama/meta-llama-guard-2-8b", + "alias": [ + "meta-llama/Meta-Llama-Guard-2-8B", + "Meta-Llama-Guard-2-8B", + "meta-llama-guard-2-8b" + ], + "max_tokens": 4096, + "model_types": [ + "moderation" + ] + }, + { + "name": "meta-llama/llamaguard-7b", + "alias": [ + "meta-llama/LlamaGuard-7b", + "LlamaGuard-7b", + "llamaguard-7b" + ], + "max_tokens": 4096, + "model_types": [ + "moderation" + ] + }, + { + "name": "meta-llama/llama-2-70b-chat-hf", + "alias": [ + "meta-llama/Llama-2-70b-chat-hf", + "Llama-2-70b-chat-hf", + "llama-2-70b-chat-hf" + ], + "max_tokens": 4096, + "model_types": [ + "chat" + ] + }, + { + "name": "meta-llama/llama-2-13b-chat-hf", + "alias": [ + "meta-llama/Llama-2-13b-chat-hf", + "Llama-2-13b-chat-hf", + "llama-2-13b-chat-hf" + ], + "max_tokens": 4096, + "model_types": [ + "chat" + ] + }, + { + "name": "meta-llama/llama-2-7b-chat-hf", + "alias": [ + "meta-llama/Llama-2-7b-chat-hf", + "Llama-2-7b-chat-hf", + "llama-2-7b-chat-hf" + ], + "max_tokens": 4096, + "model_types": [ + "chat" + ] + }, + { + "name": "meta-llama/llama-2-70b-hf", + "alias": [ + "meta-llama/Llama-2-70b-hf", + "Llama-2-70b-hf", + "llama-2-70b-hf" + ], + "max_tokens": 4096, + "model_types": [ + "chat" + ] + }, + { + "name": "meta-llama/llama-2-13b-hf", + "alias": [ + "meta-llama/Llama-2-13b-hf", + "Llama-2-13b-hf", + "llama-2-13b-hf" + ], + "max_tokens": 4096, + "model_types": [ + "chat" + ] + }, + { + "name": "meta-llama/llama-2-7b-hf", + "alias": [ + "meta-llama/Llama-2-7b-hf", + "Llama-2-7b-hf", + "llama-2-7b-hf" + ], + "max_tokens": 4096, + "model_types": [ + "chat" + ] + }, + { + "name": "meta-llama/llama-2-70b-chat", + "alias": [ + "meta-llama/Llama-2-70b-chat", + "Llama-2-70b-chat", + "llama-2-70b-chat" + ], + "max_tokens": 4096, + "model_types": [ + "chat" + ] + }, + { + "name": "meta-llama/llama-2-13b-chat", + "alias": [ + "meta-llama/Llama-2-13b-chat", + "Llama-2-13b-chat", + "llama-2-13b-chat" + ], + "max_tokens": 4096, + "model_types": [ + "chat" + ] + }, + { + "name": "meta-llama/llama-2-7b-chat", + "alias": [ + "meta-llama/Llama-2-7b-chat", + "Llama-2-7b-chat", + "llama-2-7b-chat" + ], + "max_tokens": 4096, + "model_types": [ + "chat" + ] + }, + { + "name": "meta-llama/llama-2-70b", + "alias": [ + "meta-llama/Llama-2-70b", + "Llama-2-70b", + "llama-2-70b" + ], + "max_tokens": 4096, + "model_types": [ + "chat" + ] + }, + { + "name": "meta-llama/llama-2-13b", + "alias": [ + "meta-llama/Llama-2-13b", + "Llama-2-13b", + "llama-2-13b" + ], + "max_tokens": 4096, + "model_types": [ + "chat" + ] + }, + { + "name": "meta-llama/llama-2-7b", + "alias": [ + "meta-llama/Llama-2-7b", + "Llama-2-7b", + "llama-2-7b" + ], + "max_tokens": 4096, + "model_types": [ + "chat" + ] + }, + { + "name": "meta-llama/codellama-70b-instruct-hf", + "alias": [ + "meta-llama/CodeLlama-70b-Instruct-hf", + "CodeLlama-70b-Instruct-hf", + "codellama-70b-instruct-hf" + ], + "max_tokens": 16384, + "model_types": [ + "chat" + ] + }, + { + "name": "meta-llama/codellama-70b-python-hf", + "alias": [ + "meta-llama/CodeLlama-70b-Python-hf", + "CodeLlama-70b-Python-hf", + "codellama-70b-python-hf" + ], + "max_tokens": 16384, + "model_types": [ + "chat" + ] + }, + { + "name": "meta-llama/codellama-70b-hf", + "alias": [ + "meta-llama/CodeLlama-70b-hf", + "CodeLlama-70b-hf", + "codellama-70b-hf" + ], + "max_tokens": 16384, + "model_types": [ + "chat" + ] + }, + { + "name": "meta-llama/codellama-34b-instruct-hf", + "alias": [ + "meta-llama/CodeLlama-34b-Instruct-hf", + "CodeLlama-34b-Instruct-hf", + "codellama-34b-instruct-hf" + ], + "max_tokens": 16384, + "model_types": [ + "chat" + ] + }, + { + "name": "meta-llama/codellama-34b-python-hf", + "alias": [ + "meta-llama/CodeLlama-34b-Python-hf", + "CodeLlama-34b-Python-hf", + "codellama-34b-python-hf" + ], + "max_tokens": 16384, + "model_types": [ + "chat" + ] + }, + { + "name": "meta-llama/codellama-34b-hf", + "alias": [ + "meta-llama/CodeLlama-34b-hf", + "CodeLlama-34b-hf", + "codellama-34b-hf" + ], + "max_tokens": 16384, + "model_types": [ + "chat" + ] + }, + { + "name": "meta-llama/codellama-13b-instruct-hf", + "alias": [ + "meta-llama/CodeLlama-13b-Instruct-hf", + "CodeLlama-13b-Instruct-hf", + "codellama-13b-instruct-hf" + ], + "max_tokens": 16384, + "model_types": [ + "chat" + ] + }, + { + "name": "meta-llama/codellama-13b-python-hf", + "alias": [ + "meta-llama/CodeLlama-13b-Python-hf", + "CodeLlama-13b-Python-hf", + "codellama-13b-python-hf" + ], + "max_tokens": 16384, + "model_types": [ + "chat" + ] + }, + { + "name": "meta-llama/codellama-13b-hf", + "alias": [ + "meta-llama/CodeLlama-13b-hf", + "CodeLlama-13b-hf", + "codellama-13b-hf" + ], + "max_tokens": 16384, + "model_types": [ + "chat" + ] + }, + { + "name": "meta-llama/codellama-7b-instruct-hf", + "alias": [ + "meta-llama/CodeLlama-7b-Instruct-hf", + "CodeLlama-7b-Instruct-hf", + "codellama-7b-instruct-hf" + ], + "max_tokens": 16384, + "model_types": [ + "chat" + ] + }, + { + "name": "meta-llama/codellama-7b-python-hf", + "alias": [ + "meta-llama/CodeLlama-7b-Python-hf", + "CodeLlama-7b-Python-hf", + "codellama-7b-python-hf" + ], + "max_tokens": 16384, + "model_types": [ + "chat" + ] + }, + { + "name": "meta-llama/codellama-7b-hf", + "alias": [ + "meta-llama/CodeLlama-7b-hf", + "CodeLlama-7b-hf", + "codellama-7b-hf" + ], + "max_tokens": 16384, + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/nemotron-3-content-safety", + "alias": [ + "nvidia/Nemotron-3-Content-Safety", + "Nemotron-3-Content-Safety", + "nemotron-3-content-safety" + ], + "model_types": [ + "moderation", + "vision" + ] + }, + { + "name": "nvidia/llama-nemotron-embed-vl-1b-v2-fp8", + "alias": [ + "llama-nemotron-embed-vl-1b-v2-fp8" + ], + "model_types": [ + "embedding", + "vision" + ] + }, + { + "name": "nvidia/kimi-k2.6-eagle3", + "alias": [ + "nvidia/Kimi-K2.6-Eagle3", + "Kimi-K2.6-Eagle3", + "kimi-k2.6-eagle3" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/kimi-k2.5-thinking-eagle3", + "alias": [ + "nvidia/Kimi-K2.5-Thinking-Eagle3", + "Kimi-K2.5-Thinking-Eagle3", + "kimi-k2.5-thinking-eagle3" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "nvidia/diffusiongemma-26b-a4b-it-nvfp4", + "alias": [ + "nvidia/diffusiongemma-26B-A4B-it-NVFP4", + "diffusiongemma-26B-A4B-it-NVFP4", + "diffusiongemma-26b-a4b-it-nvfp4" + ], + "max_tokens": 131072, + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/deepseek-v4-flash-nvfp4", + "alias": [ + "nvidia/DeepSeek-V4-Flash-NVFP4", + "DeepSeek-V4-Flash-NVFP4", + "deepseek-v4-flash-nvfp4" + ], + "max_tokens": 1048576, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "nvidia/nv-kermt-70m-v2", + "alias": [ + "nvidia/NV-KERMT-70M-v2", + "NV-KERMT-70M-v2", + "nv-kermt-70m-v2" + ], + "model_types": [ + "other" + ] + }, + { + "name": "nvidia/nvidia-nemotron-3-ultra-550b-a55b-nvfp4", + "alias": [ + "nvidia/NVIDIA-Nemotron-3-Ultra-550B-A55B-NVFP4", + "NVIDIA-Nemotron-3-Ultra-550B-A55B-NVFP4", + "nvidia-nemotron-3-ultra-550b-a55b-nvfp4" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/nvidia-nemotron-3-ultra-550b-a55b-bf16", + "alias": [ + "nvidia/NVIDIA-Nemotron-3-Ultra-550B-A55B-BF16", + "NVIDIA-Nemotron-3-Ultra-550B-A55B-BF16", + "nvidia-nemotron-3-ultra-550b-a55b-bf16" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/nemotron-speech-streaming-en-0.6b", + "alias": [ + "nemotron-speech-streaming-en-0.6b" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/parakeet-unified-en-0.6b", + "alias": [ + "parakeet-unified-en-0.6b" + ], + "model_types": [ + "asr" + ] + }, + { + "name": "nvidia/geotransolver_drivaerml", + "alias": [ + "geotransolver_drivaerml" + ], + "model_types": [ + "other" + ] + }, + { + "name": "nvidia/locateanything-3b", + "alias": [ + "nvidia/LocateAnything-3B", + "LocateAnything-3B", + "locateanything-3b" + ], + "model_types": [ + "chat", + "vision", + "image2text" + ] + }, + { + "name": "nvidia/cosmos3-super", + "alias": [ + "nvidia/Cosmos3-Super", + "Cosmos3-Super", + "cosmos3-super" + ], + "model_types": [ + "other" + ] + }, + { + "name": "nvidia/nemotron-3.5-asr-streaming-0.6b", + "alias": [ + "nemotron-3.5-asr-streaming-0.6b" + ], + "model_types": [ + "asr" + ] + }, + { + "name": "nvidia/omni-dreams-models", + "alias": [ + "omni-dreams-models" + ], + "model_types": [ + "video_generation" + ] + }, + { + "name": "nvidia/deepseek-v4-pro-nvfp4", + "alias": [ + "nvidia/DeepSeek-V4-Pro-NVFP4", + "DeepSeek-V4-Pro-NVFP4", + "deepseek-v4-pro-nvfp4" + ], + "max_tokens": 1048576, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "nvidia/nvidia-nemotron-3-ultra-550b-a55b-genrm", + "alias": [ + "nvidia/NVIDIA-Nemotron-3-Ultra-550B-A55B-GenRM", + "NVIDIA-Nemotron-3-Ultra-550B-A55B-GenRM", + "nvidia-nemotron-3-ultra-550b-a55b-genrm" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "nvidia/nvidia-nemotron-3-ultra-550b-a55b-base-bf16", + "alias": [ + "nvidia/NVIDIA-Nemotron-3-Ultra-550B-A55B-Base-BF16", + "NVIDIA-Nemotron-3-Ultra-550B-A55B-Base-BF16", + "nvidia-nemotron-3-ultra-550b-a55b-base-bf16" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/artifixer", + "alias": [ + "nvidia/ArtiFixer", + "ArtiFixer", + "artifixer" + ], + "model_types": [ + "other" + ] + }, + { + "name": "nvidia/nemotron-3.5-content-safety", + "alias": [ + "nvidia/Nemotron-3.5-Content-Safety", + "Nemotron-3.5-Content-Safety", + "nemotron-3.5-content-safety" + ], + "model_types": [ + "moderation", + "vision" + ] + }, + { + "name": "nvidia/nemotron-labs-diffusion-vlm-8b", + "alias": [ + "nvidia/Nemotron-Labs-Diffusion-VLM-8B", + "Nemotron-Labs-Diffusion-VLM-8B", + "nemotron-labs-diffusion-vlm-8b" + ], + "max_tokens": 262144, + "model_types": [ + "chat", + "vision", + "image2text" + ] + }, + { + "name": "nvidia/nemotron-labs-diffusion-3b-base", + "alias": [ + "nvidia/Nemotron-Labs-Diffusion-3B-Base", + "Nemotron-Labs-Diffusion-3B-Base", + "nemotron-labs-diffusion-3b-base" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/nemotron-labs-diffusion-8b-base", + "alias": [ + "nvidia/Nemotron-Labs-Diffusion-8B-Base", + "Nemotron-Labs-Diffusion-8B-Base", + "nemotron-labs-diffusion-8b-base" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/nemotron-labs-diffusion-14b-base", + "alias": [ + "nvidia/Nemotron-Labs-Diffusion-14B-Base", + "Nemotron-Labs-Diffusion-14B-Base", + "nemotron-labs-diffusion-14b-base" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/nemotron-labs-diffusion-14b", + "alias": [ + "nvidia/Nemotron-Labs-Diffusion-14B", + "Nemotron-Labs-Diffusion-14B", + "nemotron-labs-diffusion-14b" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/nemotron-labs-diffusion-3b", + "alias": [ + "nvidia/Nemotron-Labs-Diffusion-3B", + "Nemotron-Labs-Diffusion-3B", + "nemotron-labs-diffusion-3b" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/nemotron-labs-diffusion-8b", + "alias": [ + "nvidia/Nemotron-Labs-Diffusion-8B", + "Nemotron-Labs-Diffusion-8B", + "nemotron-labs-diffusion-8b" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/llama-nemotron-embed-vl-1b-v2", + "alias": [ + "llama-nemotron-embed-vl-1b-v2" + ], + "model_types": [ + "embedding", + "vision" + ] + }, + { + "name": "nvidia/qwen3.5-122b-a10b-nvfp4", + "alias": [ + "nvidia/Qwen3.5-122B-A10B-NVFP4", + "Qwen3.5-122B-A10B-NVFP4", + "qwen3.5-122b-a10b-nvfp4" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/nemotron-climb-proxy-models", + "alias": [ + "nemotron-climb-proxy-models" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/gr00t-h", + "alias": [ + "nvidia/GR00T-H", + "GR00T-H", + "gr00t-h" + ], + "model_types": [ + "other" + ] + }, + { + "name": "nvidia/parakeet-tdt-0.6b-v3", + "alias": [ + "parakeet-tdt-0.6b-v3" + ], + "model_types": [ + "asr" + ] + }, + { + "name": "nvidia/llama-nemotron-embed-1b-v2", + "alias": [ + "llama-nemotron-embed-1b-v2" + ], + "model_types": [ + "embedding" + ] + }, + { + "name": "nvidia/llama-nemotron-rerank-1b-v2", + "alias": [ + "llama-nemotron-rerank-1b-v2" + ], + "model_types": [ + "rerank" + ] + }, + { + "name": "nvidia/llama-nemotron-rerank-vl-1b-v2", + "alias": [ + "llama-nemotron-rerank-vl-1b-v2" + ], + "model_types": [ + "rerank" + ] + }, + { + "name": "nvidia/llama-nv-embed-reasoning-3b", + "alias": [ + "llama-nv-embed-reasoning-3b" + ], + "model_types": [ + "embedding" + ] + }, + { + "name": "nvidia/llama-nemotron-colembed-vl-3b-v2", + "alias": [ + "llama-nemotron-colembed-vl-3b-v2" + ], + "model_types": [ + "embedding", + "vision" + ] + }, + { + "name": "nvidia/wan2.2-t2v-a14b-diffusers-fp8", + "alias": [ + "nvidia/Wan2.2-T2V-A14B-Diffusers-FP8", + "Wan2.2-T2V-A14B-Diffusers-FP8", + "wan2.2-t2v-a14b-diffusers-fp8" + ], + "model_types": [ + "other" + ] + }, + { + "name": "nvidia/wan2.2-t2v-a14b-diffusers-nvfp4", + "alias": [ + "nvidia/Wan2.2-T2V-A14B-Diffusers-NVFP4", + "Wan2.2-T2V-A14B-Diffusers-NVFP4", + "wan2.2-t2v-a14b-diffusers-nvfp4" + ], + "model_types": [ + "other" + ] + }, + { + "name": "nvidia/cosmos-embed1-448p-anomaly-detection", + "alias": [ + "nvidia/Cosmos-Embed1-448p-anomaly-detection", + "Cosmos-Embed1-448p-anomaly-detection", + "cosmos-embed1-448p-anomaly-detection" + ], + "model_types": [ + "embedding", + "vision" + ] + }, + { + "name": "nvidia/kimi-k2.6-nvfp4", + "alias": [ + "nvidia/Kimi-K2.6-NVFP4", + "Kimi-K2.6-NVFP4", + "kimi-k2.6-nvfp4" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/re-use", + "alias": [ + "nvidia/RE-USE", + "RE-USE", + "re-use" + ], + "model_types": [ + "audio", + "asr", + "tts" + ] + }, + { + "name": "nvidia/kimi-k2.5-nvfp4", + "alias": [ + "nvidia/Kimi-K2.5-NVFP4", + "Kimi-K2.5-NVFP4", + "kimi-k2.5-nvfp4" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/audio-flamingo-next-hf", + "alias": [ + "audio-flamingo-next-hf" + ], + "model_types": [ + "chat", + "audio", + "asr" + ] + }, + { + "name": "nvidia/audio-flamingo-next-think-hf", + "alias": [ + "audio-flamingo-next-think-hf" + ], + "model_types": [ + "chat", + "audio", + "asr" + ] + }, + { + "name": "nvidia/audio-flamingo-next-captioner-hf", + "alias": [ + "audio-flamingo-next-captioner-hf" + ], + "model_types": [ + "chat", + "audio", + "asr" + ] + }, + { + "name": "nvidia/nemotron-climb-fasttext-classifiers", + "alias": [ + "nemotron-climb-fasttext-classifiers" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/lyra-2.0", + "alias": [ + "nvidia/Lyra-2.0", + "Lyra-2.0", + "lyra-2.0" + ], + "model_types": [ + "3d_generation" + ] + }, + { + "name": "nvidia/gemma-4-26b-a4b-nvfp4", + "alias": [ + "nvidia/Gemma-4-26B-A4B-NVFP4", + "Gemma-4-26B-A4B-NVFP4", + "gemma-4-26b-a4b-nvfp4" + ], + "max_tokens": 131072, + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/pointworld_models", + "alias": [ + "nvidia/PointWorld_models", + "PointWorld_models", + "pointworld_models" + ], + "model_types": [ + "other" + ] + }, + { + "name": "nvidia/nemotron-elastic-12b", + "alias": [ + "nvidia/Nemotron-Elastic-12B", + "Nemotron-Elastic-12B", + "nemotron-elastic-12b" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/nemotron-3-nano-omni-30b-a3b-reasoning-bf16", + "alias": [ + "nvidia/Nemotron-3-Nano-Omni-30B-A3B-Reasoning-BF16", + "Nemotron-3-Nano-Omni-30B-A3B-Reasoning-BF16", + "nemotron-3-nano-omni-30b-a3b-reasoning-bf16" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "nvidia/gpt-oss-120b-eagle3-v3", + "alias": [ + "nvidia/gpt-oss-120b-Eagle3-v3", + "gpt-oss-120b-Eagle3-v3", + "gpt-oss-120b-eagle3-v3" + ], + "max_tokens": 131072, + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/nvidia-nemotron-labs-3-elastic-30b-a3b-nvfp4", + "alias": [ + "nvidia/NVIDIA-Nemotron-Labs-3-Elastic-30B-A3B-NVFP4", + "NVIDIA-Nemotron-Labs-3-Elastic-30B-A3B-NVFP4", + "nvidia-nemotron-labs-3-elastic-30b-a3b-nvfp4" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/nvidia-nemotron-labs-3-elastic-30b-a3b-fp8", + "alias": [ + "nvidia/NVIDIA-Nemotron-Labs-3-Elastic-30B-A3B-FP8", + "NVIDIA-Nemotron-Labs-3-Elastic-30B-A3B-FP8", + "nvidia-nemotron-labs-3-elastic-30b-a3b-fp8" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/nvidia-nemotron-labs-3-elastic-30b-a3b-bf16", + "alias": [ + "nvidia/NVIDIA-Nemotron-Labs-3-Elastic-30B-A3B-BF16", + "NVIDIA-Nemotron-Labs-3-Elastic-30B-A3B-BF16", + "nvidia-nemotron-labs-3-elastic-30b-a3b-bf16" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/gemma-4-31b-it-nvfp4", + "alias": [ + "nvidia/Gemma-4-31B-IT-NVFP4", + "Gemma-4-31B-IT-NVFP4", + "gemma-4-31b-it-nvfp4" + ], + "max_tokens": 131072, + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/asset-harvester", + "alias": [ + "asset-harvester" + ], + "model_types": [ + "3d_generation" + ] + }, + { + "name": "nvidia/corrdiff-cmip6-era5", + "alias": [ + "corrdiff-cmip6-era5" + ], + "model_types": [ + "other" + ] + }, + { + "name": "nvidia/g1_locomanip_finetune", + "alias": [ + "g1_locomanip_finetune" + ], + "model_types": [ + "other" + ] + }, + { + "name": "nvidia/nv-raw2insights-mri", + "alias": [ + "nvidia/NV-Raw2insights-MRI", + "NV-Raw2insights-MRI", + "nv-raw2insights-mri" + ], + "model_types": [ + "other" + ] + }, + { + "name": "nvidia/canary-qwen-2.5b", + "alias": [ + "canary-qwen-2.5b" + ], + "model_types": [ + "asr" + ] + }, + { + "name": "nvidia/nvidia-nemotron-nano-9b-v2-japanese", + "alias": [ + "nvidia/NVIDIA-Nemotron-Nano-9B-v2-Japanese", + "NVIDIA-Nemotron-Nano-9B-v2-Japanese", + "nvidia-nemotron-nano-9b-v2-japanese" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/gr00t-n1.7-libero", + "alias": [ + "nvidia/GR00T-N1.7-LIBERO", + "GR00T-N1.7-LIBERO", + "gr00t-n1.7-libero" + ], + "model_types": [ + "other" + ] + }, + { + "name": "nvidia/gr00t-n1.7-droid", + "alias": [ + "nvidia/GR00T-N1.7-DROID", + "GR00T-N1.7-DROID", + "gr00t-n1.7-droid" + ], + "model_types": [ + "other" + ] + }, + { + "name": "nvidia/gr00t-n1.7-simplerenv-fractal", + "alias": [ + "nvidia/GR00T-N1.7-SimplerEnv-Fractal", + "GR00T-N1.7-SimplerEnv-Fractal", + "gr00t-n1.7-simplerenv-fractal" + ], + "model_types": [ + "other" + ] + }, + { + "name": "nvidia/gr00t-n1.7-simplerenv-bridge", + "alias": [ + "nvidia/GR00T-N1.7-SimplerEnv-Bridge", + "GR00T-N1.7-SimplerEnv-Bridge", + "gr00t-n1.7-simplerenv-bridge" + ], + "model_types": [ + "other" + ] + }, + { + "name": "nvidia/gn1x-tuned-arena-g1-loco-manipulation", + "alias": [ + "nvidia/GN1x-Tuned-Arena-G1-Loco-Manipulation", + "GN1x-Tuned-Arena-G1-Loco-Manipulation", + "gn1x-tuned-arena-g1-loco-manipulation" + ], + "model_types": [ + "robotics" + ] + }, + { + "name": "nvidia/minimax-m2.5-nvfp4", + "alias": [ + "nvidia/MiniMax-M2.5-NVFP4", + "MiniMax-M2.5-NVFP4", + "minimax-m2.5-nvfp4" + ], + "max_tokens": 1000000, + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/cosmos-h-surgical-simulator", + "alias": [ + "nvidia/Cosmos-H-Surgical-Simulator", + "Cosmos-H-Surgical-Simulator", + "cosmos-h-surgical-simulator" + ], + "model_types": [ + "other" + ] + }, + { + "name": "nvidia/pixeldit-imagenet", + "alias": [ + "nvidia/PixelDiT-ImageNet", + "PixelDiT-ImageNet", + "pixeldit-imagenet" + ], + "model_types": [ + "image" + ] + }, + { + "name": "nvidia/pixeldit-1300m-1024px", + "alias": [ + "nvidia/PixelDiT-1300M-1024px", + "PixelDiT-1300M-1024px", + "pixeldit-1300m-1024px" + ], + "model_types": [ + "image" + ] + }, + { + "name": "nvidia/ising-calibration-1-35b-a3b", + "alias": [ + "nvidia/Ising-Calibration-1-35B-A3B", + "Ising-Calibration-1-35B-A3B", + "ising-calibration-1-35b-a3b" + ], + "model_types": [ + "other" + ] + }, + { + "name": "nvidia/cosmos-h-surgical", + "alias": [ + "nvidia/Cosmos-H-Surgical", + "Cosmos-H-Surgical", + "cosmos-h-surgical" + ], + "model_types": [ + "other" + ] + }, + { + "name": "nvidia/nvidia-nemotron-parse-v1.1-tc", + "alias": [ + "nvidia/NVIDIA-Nemotron-Parse-v1.1-TC", + "NVIDIA-Nemotron-Parse-v1.1-TC", + "nvidia-nemotron-parse-v1.1-tc" + ], + "max_tokens": 262144, + "model_types": [ + "chat", + "vision", + "image2text" + ] + }, + { + "name": "nvidia/gn1x-tuned-arena-gr1-manipulation", + "alias": [ + "nvidia/GN1x-Tuned-Arena-GR1-Manipulation", + "GN1x-Tuned-Arena-GR1-Manipulation", + "gn1x-tuned-arena-gr1-manipulation" + ], + "model_types": [ + "robotics" + ] + }, + { + "name": "nvidia/gn1.6-tuned-arena-gr1-placeitemclosedoor-task", + "alias": [ + "nvidia/GN1.6-Tuned-Arena-GR1-PlaceItemCloseDoor-Task", + "GN1.6-Tuned-Arena-GR1-PlaceItemCloseDoor-Task", + "gn1.6-tuned-arena-gr1-placeitemclosedoor-task" + ], + "model_types": [ + "robotics" + ] + }, + { + "name": "nvidia/parakeet-tdt-0.6b-v2", + "alias": [ + "parakeet-tdt-0.6b-v2" + ], + "model_types": [ + "asr" + ] + }, + { + "name": "nvidia/audio-flamingo-3-hf", + "alias": [ + "audio-flamingo-3-hf" + ], + "model_types": [ + "chat", + "audio", + "asr" + ] + }, + { + "name": "nvidia/gear-sonic", + "alias": [ + "nvidia/GEAR-SONIC", + "GEAR-SONIC", + "gear-sonic" + ], + "model_types": [ + "robotics" + ] + }, + { + "name": "nvidia/glm-5-nvfp4", + "alias": [ + "nvidia/GLM-5-NVFP4", + "GLM-5-NVFP4", + "glm-5-nvfp4" + ], + "max_tokens": 131072, + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/kimodo-soma-seed-v1.1", + "alias": [ + "nvidia/Kimodo-SOMA-SEED-v1.1", + "Kimodo-SOMA-SEED-v1.1", + "kimodo-soma-seed-v1.1" + ], + "model_types": [ + "robotics" + ] + }, + { + "name": "nvidia/kimodo-soma-rp-v1.1", + "alias": [ + "nvidia/Kimodo-SOMA-RP-v1.1", + "Kimodo-SOMA-RP-v1.1", + "kimodo-soma-rp-v1.1" + ], + "model_types": [ + "robotics" + ] + }, + { + "name": "nvidia/tmr-soma-rp-v1", + "alias": [ + "nvidia/TMR-SOMA-RP-v1", + "TMR-SOMA-RP-v1", + "tmr-soma-rp-v1" + ], + "model_types": [ + "robotics" + ] + }, + { + "name": "nvidia/egm-8b-sft", + "alias": [ + "nvidia/EGM-8B-SFT", + "EGM-8B-SFT", + "egm-8b-sft" + ], + "model_types": [ + "chat", + "vision", + "image2text" + ] + }, + { + "name": "nvidia/egm-4b-sft", + "alias": [ + "nvidia/EGM-4B-SFT", + "EGM-4B-SFT", + "egm-4b-sft" + ], + "model_types": [ + "chat", + "vision", + "image2text" + ] + }, + { + "name": "nvidia/egm-8b", + "alias": [ + "nvidia/EGM-8B", + "EGM-8B", + "egm-8b" + ], + "model_types": [ + "chat", + "vision", + "image2text" + ] + }, + { + "name": "nvidia/egm-4b", + "alias": [ + "nvidia/EGM-4B", + "EGM-4B", + "egm-4b" + ], + "model_types": [ + "chat", + "vision", + "image2text" + ] + }, + { + "name": "nvidia/music-flamingo-2601-hf", + "alias": [ + "music-flamingo-2601-hf" + ], + "model_types": [ + "chat", + "audio", + "asr" + ] + }, + { + "name": "nvidia/esm2_t48_15b_ur50d", + "alias": [ + "nvidia/esm2_t48_15B_UR50D", + "esm2_t48_15B_UR50D", + "esm2_t48_15b_ur50d" + ], + "model_types": [ + "other" + ] + }, + { + "name": "nvidia/esm2_t36_3b_ur50d", + "alias": [ + "nvidia/esm2_t36_3B_UR50D", + "esm2_t36_3B_UR50D", + "esm2_t36_3b_ur50d" + ], + "model_types": [ + "other" + ] + }, + { + "name": "nvidia/esm2_t33_650m_ur50d", + "alias": [ + "nvidia/esm2_t33_650M_UR50D", + "esm2_t33_650M_UR50D", + "esm2_t33_650m_ur50d" + ], + "model_types": [ + "other" + ] + }, + { + "name": "nvidia/1_install_trocar_1gpu_64bs_50k_steps_53_data", + "alias": [ + "1_install_trocar_1gpu_64bs_50k_steps_53_data" + ], + "model_types": [ + "other" + ] + }, + { + "name": "nvidia/nvidia-nemotron-3-nano-4b-fp8", + "alias": [ + "nvidia/NVIDIA-Nemotron-3-Nano-4B-FP8", + "NVIDIA-Nemotron-3-Nano-4B-FP8", + "nvidia-nemotron-3-nano-4b-fp8" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/nvidia-nemotron-3-nano-4b-bf16", + "alias": [ + "nvidia/NVIDIA-Nemotron-3-Nano-4B-BF16", + "NVIDIA-Nemotron-3-Nano-4B-BF16", + "nvidia-nemotron-3-nano-4b-bf16" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/nvila-8b-hd-video", + "alias": [ + "nvidia/NVILA-8B-HD-Video", + "NVILA-8B-HD-Video", + "nvila-8b-hd-video" + ], + "model_types": [ + "video_generation" + ] + }, + { + "name": "nvidia/autogaze", + "alias": [ + "nvidia/AutoGaze", + "AutoGaze", + "autogaze" + ], + "model_types": [ + "vision" + ] + }, + { + "name": "nvidia/cosmos-tokenizer-surg", + "alias": [ + "nvidia/Cosmos-Tokenizer-Surg", + "Cosmos-Tokenizer-Surg", + "cosmos-tokenizer-surg" + ], + "model_types": [ + "other" + ] + }, + { + "name": "nvidia/nvidia-nemotron-3-nano-4b-gguf", + "alias": [ + "nvidia/NVIDIA-Nemotron-3-Nano-4B-GGUF", + "NVIDIA-Nemotron-3-Nano-4B-GGUF", + "nvidia-nemotron-3-nano-4b-gguf" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/soma-x", + "alias": [ + "nvidia/SOMA-X", + "SOMA-X", + "soma-x" + ], + "model_types": [ + "robotics" + ] + }, + { + "name": "nvidia/kimodo-smplx-rp-v1", + "alias": [ + "nvidia/Kimodo-SMPLX-RP-v1", + "Kimodo-SMPLX-RP-v1", + "kimodo-smplx-rp-v1" + ], + "model_types": [ + "robotics" + ] + }, + { + "name": "nvidia/kimodo-soma-rp-v1", + "alias": [ + "nvidia/Kimodo-SOMA-RP-v1", + "Kimodo-SOMA-RP-v1", + "kimodo-soma-rp-v1" + ], + "model_types": [ + "robotics" + ] + }, + { + "name": "nvidia/kimodo-soma-seed-v1", + "alias": [ + "nvidia/Kimodo-SOMA-SEED-v1", + "Kimodo-SOMA-SEED-v1", + "kimodo-soma-seed-v1" + ], + "model_types": [ + "robotics" + ] + }, + { + "name": "nvidia/kimodo-g1-seed-v1", + "alias": [ + "nvidia/Kimodo-G1-SEED-v1", + "Kimodo-G1-SEED-v1", + "kimodo-g1-seed-v1" + ], + "model_types": [ + "robotics" + ] + }, + { + "name": "nvidia/kimodo-g1-rp-v1", + "alias": [ + "nvidia/Kimodo-G1-RP-v1", + "Kimodo-G1-RP-v1", + "kimodo-g1-rp-v1" + ], + "model_types": [ + "robotics" + ] + }, + { + "name": "nvidia/finite-difference-flow-optimization", + "alias": [ + "finite-difference-flow-optimization" + ], + "model_types": [ + "image" + ] + }, + { + "name": "nvidia/nv-proteina-complexa-ame-160m-v1", + "alias": [ + "nvidia/NV-Proteina-Complexa-AME-160M-v1", + "NV-Proteina-Complexa-AME-160M-v1", + "nv-proteina-complexa-ame-160m-v1" + ], + "model_types": [ + "other" + ] + }, + { + "name": "nvidia/nv-proteina-complexa-protein-target-160m-v1", + "alias": [ + "nvidia/NV-Proteina-Complexa-Protein-Target-160M-v1", + "NV-Proteina-Complexa-Protein-Target-160M-v1", + "nv-proteina-complexa-protein-target-160m-v1" + ], + "model_types": [ + "other" + ] + }, + { + "name": "nvidia/nv-proteina-complexa-ligand-target-160m-v1", + "alias": [ + "nvidia/NV-Proteina-Complexa-Ligand-Target-160M-v1", + "NV-Proteina-Complexa-Ligand-Target-160M-v1", + "nv-proteina-complexa-ligand-target-160m-v1" + ], + "model_types": [ + "other" + ] + }, + { + "name": "nvidia/nvidia-nemotron-3-nano-30b-a3b-base-bf16", + "alias": [ + "nvidia/NVIDIA-Nemotron-3-Nano-30B-A3B-Base-BF16", + "NVIDIA-Nemotron-3-Nano-30B-A3B-Base-BF16", + "nvidia-nemotron-3-nano-30b-a3b-base-bf16" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/nvidia-nemotron-3-nano-30b-a3b-nvfp4", + "alias": [ + "nvidia/NVIDIA-Nemotron-3-Nano-30B-A3B-NVFP4", + "NVIDIA-Nemotron-3-Nano-30B-A3B-NVFP4", + "nvidia-nemotron-3-nano-30b-a3b-nvfp4" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/nvidia-nemotron-3-nano-30b-a3b-bf16", + "alias": [ + "nvidia/NVIDIA-Nemotron-3-Nano-30B-A3B-BF16", + "NVIDIA-Nemotron-3-Nano-30B-A3B-BF16", + "nvidia-nemotron-3-nano-30b-a3b-bf16" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/nvidia-nemotron-3-nano-30b-a3b-fp8", + "alias": [ + "nvidia/NVIDIA-Nemotron-3-Nano-30B-A3B-FP8", + "NVIDIA-Nemotron-3-Nano-30B-A3B-FP8", + "nvidia-nemotron-3-nano-30b-a3b-fp8" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/nvidia-nemotron-3-super-120b-a12b-base-bf16", + "alias": [ + "nvidia/NVIDIA-Nemotron-3-Super-120B-A12B-Base-BF16", + "NVIDIA-Nemotron-3-Super-120B-A12B-Base-BF16", + "nvidia-nemotron-3-super-120b-a12b-base-bf16" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/cosmos-embed1-448p", + "alias": [ + "nvidia/Cosmos-Embed1-448p", + "Cosmos-Embed1-448p", + "cosmos-embed1-448p" + ], + "model_types": [ + "embedding", + "vision" + ] + }, + { + "name": "nvidia/cosmos-embed1-336p", + "alias": [ + "nvidia/Cosmos-Embed1-336p", + "Cosmos-Embed1-336p", + "cosmos-embed1-336p" + ], + "model_types": [ + "embedding", + "vision" + ] + }, + { + "name": "nvidia/gr00t-n1.5-rl-rheo-assembletrocar", + "alias": [ + "nvidia/GR00T-N1.5-RL-Rheo-AssembleTrocar", + "GR00T-N1.5-RL-Rheo-AssembleTrocar", + "gr00t-n1.5-rl-rheo-assembletrocar" + ], + "model_types": [ + "other" + ] + }, + { + "name": "nvidia/gr00t-n1.6-rheo-sim-pushcart", + "alias": [ + "nvidia/GR00T-N1.6-Rheo-Sim-PushCart", + "GR00T-N1.6-Rheo-Sim-PushCart", + "gr00t-n1.6-rheo-sim-pushcart" + ], + "model_types": [ + "other" + ] + }, + { + "name": "nvidia/gr00t-n1.6-rheo-picknplacetray", + "alias": [ + "nvidia/GR00T-N1.6-Rheo-PickNPlaceTray", + "GR00T-N1.6-Rheo-PickNPlaceTray", + "gr00t-n1.6-rheo-picknplacetray" + ], + "model_types": [ + "other" + ] + }, + { + "name": "nvidia/cosmos-embed1-224p", + "alias": [ + "nvidia/Cosmos-Embed1-224p", + "Cosmos-Embed1-224p", + "cosmos-embed1-224p" + ], + "model_types": [ + "embedding", + "vision" + ] + }, + { + "name": "nvidia/kimi-k2-thinking-eagle3", + "alias": [ + "nvidia/Kimi-K2-Thinking-Eagle3", + "Kimi-K2-Thinking-Eagle3", + "kimi-k2-thinking-eagle3" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "nvidia/nemotron-graphic-elements-v1", + "alias": [ + "nemotron-graphic-elements-v1" + ], + "model_types": [ + "vision" + ] + }, + { + "name": "nvidia/nemotron-table-structure-v1", + "alias": [ + "nemotron-table-structure-v1" + ], + "model_types": [ + "vision" + ] + }, + { + "name": "nvidia/nemotron-page-elements-v3", + "alias": [ + "nemotron-page-elements-v3" + ], + "model_types": [ + "vision" + ] + }, + { + "name": "nvidia/qwen3-30b-a3b-thinking-2507-eagle3", + "alias": [ + "nvidia/Qwen3-30B-A3B-Thinking-2507-Eagle3", + "Qwen3-30B-A3B-Thinking-2507-Eagle3", + "qwen3-30b-a3b-thinking-2507-eagle3" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "nvidia/qwen3-235b-a22b-thinking-2507-fp4-eagle3", + "alias": [ + "nvidia/Qwen3-235B-A22B-Thinking-2507-FP4-Eagle3", + "Qwen3-235B-A22B-Thinking-2507-FP4-Eagle3", + "qwen3-235b-a22b-thinking-2507-fp4-eagle3" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "nvidia/qwen3-235b-a22b-thinking-2507-eagle3", + "alias": [ + "nvidia/Qwen3-235B-A22B-Thinking-2507-Eagle3", + "Qwen3-235B-A22B-Thinking-2507-Eagle3", + "qwen3-235b-a22b-thinking-2507-eagle3" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "nvidia/qwen3-nemotron-235b-a22b-genrm-2603", + "alias": [ + "nvidia/Qwen3-Nemotron-235B-A22B-GenRM-2603", + "Qwen3-Nemotron-235B-A22B-GenRM-2603", + "qwen3-nemotron-235b-a22b-genrm-2603" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "nvidia/audio2emotion-v2.2", + "alias": [ + "nvidia/Audio2Emotion-v2.2", + "Audio2Emotion-v2.2", + "audio2emotion-v2.2" + ], + "model_types": [ + "audio" + ] + }, + { + "name": "nvidia/audio2emotion-v3.0", + "alias": [ + "nvidia/Audio2Emotion-v3.0", + "Audio2Emotion-v3.0", + "audio2emotion-v3.0" + ], + "model_types": [ + "audio" + ] + }, + { + "name": "nvidia/diffit", + "alias": [ + "nvidia/DiffiT", + "DiffiT", + "diffit" + ], + "model_types": [ + "image" + ] + }, + { + "name": "nvidia/fourcastnet3", + "alias": [ + "fourcastnet3" + ], + "model_types": [ + "other" + ] + }, + { + "name": "nvidia/fourcastnet1", + "alias": [ + "fourcastnet1" + ], + "model_types": [ + "other" + ] + }, + { + "name": "nvidia/stormscope-goes-mrms", + "alias": [ + "stormscope-goes-mrms" + ], + "model_types": [ + "other" + ] + }, + { + "name": "nvidia/dlesym-v1-era5", + "alias": [ + "dlesym-v1-era5" + ], + "model_types": [ + "other" + ] + }, + { + "name": "nvidia/stormcast-v1-era5-hrrr", + "alias": [ + "stormcast-v1-era5-hrrr" + ], + "model_types": [ + "other" + ] + }, + { + "name": "nvidia/nvidia-nemotron-nano-9b-v2", + "alias": [ + "nvidia/NVIDIA-Nemotron-Nano-9B-v2", + "NVIDIA-Nemotron-Nano-9B-v2", + "nvidia-nemotron-nano-9b-v2" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/cbottle", + "alias": [ + "cbottle" + ], + "model_types": [ + "other" + ] + }, + { + "name": "nvidia/atlas-era5", + "alias": [ + "atlas-era5" + ], + "model_types": [ + "other" + ] + }, + { + "name": "nvidia/qwen3-vl-235b-a22b-instruct-nvfp4", + "alias": [ + "nvidia/Qwen3-VL-235B-A22B-Instruct-NVFP4", + "Qwen3-VL-235B-A22B-Instruct-NVFP4", + "qwen3-vl-235b-a22b-instruct-nvfp4" + ], + "max_tokens": 262144, + "model_types": [ + "chat", + "vision", + "image2text" + ] + }, + { + "name": "nvidia/cosmos-predict2.5-2b", + "alias": [ + "nvidia/Cosmos-Predict2.5-2B", + "Cosmos-Predict2.5-2B", + "cosmos-predict2.5-2b" + ], + "model_types": [ + "video_generation" + ] + }, + { + "name": "nvidia/personaplex-7b-v1", + "alias": [ + "personaplex-7b-v1" + ], + "model_types": [ + "audio", + "asr", + "tts" + ] + }, + { + "name": "nvidia/nemotron-research-goosereason-4b-instruct", + "alias": [ + "nvidia/Nemotron-Research-GooseReason-4B-Instruct", + "Nemotron-Research-GooseReason-4B-Instruct", + "nemotron-research-goosereason-4b-instruct" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "nvidia/nemotron-terminal-32b", + "alias": [ + "nvidia/Nemotron-Terminal-32B", + "Nemotron-Terminal-32B", + "nemotron-terminal-32b" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "nvidia/nemotron-terminal-14b", + "alias": [ + "nvidia/Nemotron-Terminal-14B", + "Nemotron-Terminal-14B", + "nemotron-terminal-14b" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "nvidia/nemotron-terminal-8b", + "alias": [ + "nvidia/Nemotron-Terminal-8B", + "Nemotron-Terminal-8B", + "nemotron-terminal-8b" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "nvidia/dreamdojo", + "alias": [ + "nvidia/DreamDojo", + "DreamDojo", + "dreamdojo" + ], + "model_types": [ + "video_generation" + ] + }, + { + "name": "nvidia/omnivinci", + "alias": [ + "omnivinci" + ], + "model_types": [ + "other" + ] + }, + { + "name": "nvidia/nemotron-colembed-vl-4b-v2", + "alias": [ + "nemotron-colembed-vl-4b-v2" + ], + "model_types": [ + "embedding", + "vision" + ] + }, + { + "name": "nvidia/nemotron-colembed-vl-8b-v2", + "alias": [ + "nemotron-colembed-vl-8b-v2" + ], + "model_types": [ + "embedding", + "vision" + ] + }, + { + "name": "nvidia/physicalai-simulation-vomp-model", + "alias": [ + "nvidia/PhysicalAI-Simulation-VoMP-Model", + "PhysicalAI-Simulation-VoMP-Model", + "physicalai-simulation-vomp-model" + ], + "model_types": [ + "other" + ] + }, + { + "name": "nvidia/cosmos-transfer2.5-2b", + "alias": [ + "nvidia/Cosmos-Transfer2.5-2B", + "Cosmos-Transfer2.5-2B", + "cosmos-transfer2.5-2b" + ], + "model_types": [ + "video_generation" + ] + }, + { + "name": "nvidia/llama-3.3-70b-instruct-eagle3", + "alias": [ + "nvidia/Llama-3.3-70B-Instruct-Eagle3", + "Llama-3.3-70B-Instruct-Eagle3", + "llama-3.3-70b-instruct-eagle3" + ], + "model_types": [ + "other" + ] + }, + { + "name": "nvidia/kimi-k2-thinking-nvfp4", + "alias": [ + "nvidia/Kimi-K2-Thinking-NVFP4", + "Kimi-K2-Thinking-NVFP4", + "kimi-k2-thinking-nvfp4" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "nvidia/qwen3-next-80b-a3b-thinking-nvfp4", + "alias": [ + "nvidia/Qwen3-Next-80B-A3B-Thinking-NVFP4", + "Qwen3-Next-80B-A3B-Thinking-NVFP4", + "qwen3-next-80b-a3b-thinking-nvfp4" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "nvidia/qwen3-next-80b-a3b-instruct-nvfp4", + "alias": [ + "nvidia/Qwen3-Next-80B-A3B-Instruct-NVFP4", + "Qwen3-Next-80B-A3B-Instruct-NVFP4", + "qwen3-next-80b-a3b-instruct-nvfp4" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/parakeet-ctc-0.6b-vietnamese", + "alias": [ + "nvidia/parakeet-ctc-0.6b-Vietnamese", + "parakeet-ctc-0.6b-Vietnamese", + "parakeet-ctc-0.6b-vietnamese" + ], + "model_types": [ + "asr" + ] + }, + { + "name": "nvidia/nitrogen", + "alias": [ + "nvidia/NitroGen", + "NitroGen", + "nitrogen" + ], + "model_types": [ + "robotics" + ] + }, + { + "name": "nvidia/qwen3-coder-480b-a35b-instruct-nvfp4", + "alias": [ + "nvidia/Qwen3-Coder-480B-A35B-Instruct-NVFP4", + "Qwen3-Coder-480B-A35B-Instruct-NVFP4", + "qwen3-coder-480b-a35b-instruct-nvfp4" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/llama-nemoretriever-colembed-3b-v1", + "alias": [ + "llama-nemoretriever-colembed-3b-v1" + ], + "model_types": [ + "embedding" + ] + }, + { + "name": "nvidia/llama-nemoretriever-colembed-1b-v1", + "alias": [ + "llama-nemoretriever-colembed-1b-v1" + ], + "model_types": [ + "embedding" + ] + }, + { + "name": "nvidia/qwen3-vl-235b-a22b-instruct-nvfp4-mlperf-inference-closed-v6.0", + "alias": [ + "nvidia/Qwen3-VL-235B-A22B-Instruct-NVFP4-MLPerf-Inference-Closed-V6.0", + "Qwen3-VL-235B-A22B-Instruct-NVFP4-MLPerf-Inference-Closed-V6.0", + "qwen3-vl-235b-a22b-instruct-nvfp4-mlperf-inference-closed-v6.0" + ], + "max_tokens": 262144, + "model_types": [ + "chat", + "vision", + "image2text" + ] + }, + { + "name": "nvidia/cosmos-policy-aloha-planning-model-predict2-2b", + "alias": [ + "nvidia/Cosmos-Policy-ALOHA-Planning-Model-Predict2-2B", + "Cosmos-Policy-ALOHA-Planning-Model-Predict2-2B", + "cosmos-policy-aloha-planning-model-predict2-2b" + ], + "model_types": [ + "robotics" + ] + }, + { + "name": "nvidia/cosmos-policy-aloha-predict2-2b", + "alias": [ + "nvidia/Cosmos-Policy-ALOHA-Predict2-2B", + "Cosmos-Policy-ALOHA-Predict2-2B", + "cosmos-policy-aloha-predict2-2b" + ], + "model_types": [ + "robotics" + ] + }, + { + "name": "nvidia/cosmos-policy-robocasa-predict2-2b", + "alias": [ + "nvidia/Cosmos-Policy-RoboCasa-Predict2-2B", + "Cosmos-Policy-RoboCasa-Predict2-2B", + "cosmos-policy-robocasa-predict2-2b" + ], + "model_types": [ + "robotics" + ] + }, + { + "name": "nvidia/cosmos-policy-libero-predict2-2b", + "alias": [ + "nvidia/Cosmos-Policy-LIBERO-Predict2-2B", + "Cosmos-Policy-LIBERO-Predict2-2B", + "cosmos-policy-libero-predict2-2b" + ], + "model_types": [ + "robotics" + ] + }, + { + "name": "nvidia/gr00t-n1.6-droid", + "alias": [ + "nvidia/GR00T-N1.6-DROID", + "GR00T-N1.6-DROID", + "gr00t-n1.6-droid" + ], + "model_types": [ + "other" + ] + }, + { + "name": "nvidia/qwen3-235b-a22b-thinking-2507-nvfp4", + "alias": [ + "nvidia/Qwen3-235B-A22B-Thinking-2507-NVFP4", + "Qwen3-235B-A22B-Thinking-2507-NVFP4", + "qwen3-235b-a22b-thinking-2507-nvfp4" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "nvidia/qwen3-235b-a22b-instruct-2507-nvfp4", + "alias": [ + "nvidia/Qwen3-235B-A22B-Instruct-2507-NVFP4", + "Qwen3-235B-A22B-Instruct-2507-NVFP4", + "qwen3-235b-a22b-instruct-2507-nvfp4" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/c-radiov2-h", + "alias": [ + "nvidia/C-RADIOv2-H", + "C-RADIOv2-H", + "c-radiov2-h" + ], + "model_types": [ + "embedding", + "vision" + ] + }, + { + "name": "nvidia/c-radiov2-l", + "alias": [ + "nvidia/C-RADIOv2-L", + "C-RADIOv2-L", + "c-radiov2-l" + ], + "model_types": [ + "embedding", + "vision" + ] + }, + { + "name": "nvidia/c-radiov3-g", + "alias": [ + "nvidia/C-RADIOv3-g", + "C-RADIOv3-g", + "c-radiov3-g" + ], + "model_types": [ + "embedding", + "vision" + ] + }, + { + "name": "nvidia/c-radiov3-h", + "alias": [ + "nvidia/C-RADIOv3-H", + "C-RADIOv3-H", + "c-radiov3-h" + ], + "model_types": [ + "embedding", + "vision" + ] + }, + { + "name": "nvidia/c-radiov3-l", + "alias": [ + "nvidia/C-RADIOv3-L", + "C-RADIOv3-L", + "c-radiov3-l" + ], + "model_types": [ + "embedding", + "vision" + ] + }, + { + "name": "nvidia/c-radiov3-b", + "alias": [ + "nvidia/C-RADIOv3-B", + "C-RADIOv3-B", + "c-radiov3-b" + ], + "model_types": [ + "embedding", + "vision" + ] + }, + { + "name": "nvidia/c-radiov4-h", + "alias": [ + "nvidia/C-RADIOv4-H", + "C-RADIOv4-H", + "c-radiov4-h" + ], + "model_types": [ + "embedding", + "vision" + ] + }, + { + "name": "nvidia/c-radiov4-so400m", + "alias": [ + "nvidia/C-RADIOv4-SO400M", + "C-RADIOv4-SO400M", + "c-radiov4-so400m" + ], + "model_types": [ + "embedding", + "vision" + ] + }, + { + "name": "nvidia/c-radiov2-b", + "alias": [ + "nvidia/C-RADIOv2-B", + "C-RADIOv2-B", + "c-radiov2-b" + ], + "model_types": [ + "embedding", + "vision" + ] + }, + { + "name": "nvidia/multitalker-parakeet-streaming-0.6b-v1", + "alias": [ + "multitalker-parakeet-streaming-0.6b-v1" + ], + "model_types": [ + "asr" + ] + }, + { + "name": "nvidia/gpt-oss-120b-eagle3-short-context", + "alias": [ + "nvidia/gpt-oss-120b-Eagle3-short-context", + "gpt-oss-120b-Eagle3-short-context", + "gpt-oss-120b-eagle3-short-context" + ], + "max_tokens": 131072, + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/gpt-oss-120b-eagle3-throughput", + "alias": [ + "nvidia/gpt-oss-120b-Eagle3-throughput", + "gpt-oss-120b-Eagle3-throughput", + "gpt-oss-120b-eagle3-throughput" + ], + "max_tokens": 131072, + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/qwen3-235b-a22b-eagle3", + "alias": [ + "nvidia/Qwen3-235B-A22B-Eagle3", + "Qwen3-235B-A22B-Eagle3", + "qwen3-235b-a22b-eagle3" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/gpt-oss-120b-eagle3-long-context", + "alias": [ + "nvidia/gpt-oss-120b-Eagle3-long-context", + "gpt-oss-120b-Eagle3-long-context", + "gpt-oss-120b-eagle3-long-context" + ], + "max_tokens": 131072, + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/gn16-tuned-arena-gr1-manipulation", + "alias": [ + "nvidia/GN16-Tuned-Arena-GR1-Manipulation", + "GN16-Tuned-Arena-GR1-Manipulation", + "gn16-tuned-arena-gr1-manipulation" + ], + "model_types": [ + "robotics" + ] + }, + { + "name": "nvidia/qwen3-8b-dms-8x", + "alias": [ + "nvidia/Qwen3-8B-DMS-8x", + "Qwen3-8B-DMS-8x", + "qwen3-8b-dms-8x" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/kvzap-mlp-llama-3.1-8b-instruct", + "alias": [ + "nvidia/KVzap-mlp-Llama-3.1-8B-Instruct", + "KVzap-mlp-Llama-3.1-8B-Instruct", + "kvzap-mlp-llama-3.1-8b-instruct" + ], + "model_types": [ + "other" + ] + }, + { + "name": "nvidia/kvzap-mlp-qwen3-32b", + "alias": [ + "nvidia/KVzap-mlp-Qwen3-32B", + "KVzap-mlp-Qwen3-32B", + "kvzap-mlp-qwen3-32b" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/kvzap-mlp-qwen3-8b", + "alias": [ + "nvidia/KVzap-mlp-Qwen3-8B", + "KVzap-mlp-Qwen3-8B", + "kvzap-mlp-qwen3-8b" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/kvzap-linear-llama-3.1-8b-instruct", + "alias": [ + "nvidia/KVzap-linear-Llama-3.1-8B-Instruct", + "KVzap-linear-Llama-3.1-8B-Instruct", + "kvzap-linear-llama-3.1-8b-instruct" + ], + "model_types": [ + "other" + ] + }, + { + "name": "nvidia/kvzap-linear-qwen3-32b", + "alias": [ + "nvidia/KVzap-linear-Qwen3-32B", + "KVzap-linear-Qwen3-32B", + "kvzap-linear-qwen3-32b" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/kvzap-linear-qwen3-8b", + "alias": [ + "nvidia/KVzap-linear-Qwen3-8B", + "KVzap-linear-Qwen3-8B", + "kvzap-linear-qwen3-8b" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/deepseek-v3.2-nvfp4", + "alias": [ + "nvidia/DeepSeek-V3.2-NVFP4", + "DeepSeek-V3.2-NVFP4", + "deepseek-v3.2-nvfp4" + ], + "max_tokens": 163840, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "nvidia/riva-translate-4b-instruct-v1.1", + "alias": [ + "nvidia/Riva-Translate-4B-Instruct-v1.1", + "Riva-Translate-4B-Instruct-v1.1", + "riva-translate-4b-instruct-v1.1" + ], + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/nemotron-4-mini-hindi-4b-base", + "alias": [ + "nvidia/Nemotron-4-Mini-Hindi-4B-Base", + "Nemotron-4-Mini-Hindi-4B-Base", + "nemotron-4-mini-hindi-4b-base" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/deepseek-v3.1-nvfp4", + "alias": [ + "nvidia/DeepSeek-V3.1-NVFP4", + "DeepSeek-V3.1-NVFP4", + "deepseek-v3.1-nvfp4" + ], + "max_tokens": 163840, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "nvidia/qwen2.5-vl-7b-surg-cholect50", + "alias": [ + "nvidia/Qwen2.5-VL-7B-Surg-CholecT50", + "Qwen2.5-VL-7B-Surg-CholecT50", + "qwen2.5-vl-7b-surg-cholect50" + ], + "max_tokens": 131072, + "model_types": [ + "chat", + "vision", + "image2text" + ] + }, + { + "name": "nvidia/rnapro-private-best-500m", + "alias": [ + "nvidia/RNAPro-Private-Best-500M", + "RNAPro-Private-Best-500M", + "rnapro-private-best-500m" + ], + "model_types": [ + "other" + ] + }, + { + "name": "nvidia/rnapro-public-best-500m", + "alias": [ + "nvidia/RNAPro-Public-Best-500M", + "RNAPro-Public-Best-500M", + "rnapro-public-best-500m" + ], + "model_types": [ + "other" + ] + }, + { + "name": "nvidia/nemotron-flash-3b-instruct", + "alias": [ + "nvidia/Nemotron-Flash-3B-Instruct", + "Nemotron-Flash-3B-Instruct", + "nemotron-flash-3b-instruct" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/nemotron-flash-3b", + "alias": [ + "nvidia/Nemotron-Flash-3B", + "Nemotron-Flash-3B", + "nemotron-flash-3b" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/nemotron-flash-1b", + "alias": [ + "nvidia/Nemotron-Flash-1B", + "Nemotron-Flash-1B", + "nemotron-flash-1b" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/nv-reasyn-eb-174m-v2", + "alias": [ + "nvidia/NV-ReaSyn-EB-174M-v2", + "NV-ReaSyn-EB-174M-v2", + "nv-reasyn-eb-174m-v2" + ], + "model_types": [ + "other" + ] + }, + { + "name": "nvidia/nv-reasyn-ar-166m-v2", + "alias": [ + "nvidia/NV-ReaSyn-AR-166M-v2", + "NV-ReaSyn-AR-166M-v2", + "nv-reasyn-ar-166m-v2" + ], + "model_types": [ + "other" + ] + }, + { + "name": "nvidia/nv-reasyn-ar-166m-v1", + "alias": [ + "nvidia/NV-ReaSyn-AR-166M-v1", + "NV-ReaSyn-AR-166M-v1", + "nv-reasyn-ar-166m-v1" + ], + "model_types": [ + "other" + ] + }, + { + "name": "nvidia/nvidia-nemotron-nano-9b-v2-nvfp4", + "alias": [ + "nvidia/NVIDIA-Nemotron-Nano-9B-v2-NVFP4", + "NVIDIA-Nemotron-Nano-9B-v2-NVFP4", + "nvidia-nemotron-nano-9b-v2-nvfp4" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/nvidia-nemotron-nano-9b-v2-fp8", + "alias": [ + "nvidia/NVIDIA-Nemotron-Nano-9B-v2-FP8", + "NVIDIA-Nemotron-Nano-9B-v2-FP8", + "nvidia-nemotron-nano-9b-v2-fp8" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/isaaclab-arena-envs", + "alias": [ + "isaaclab-arena-envs" + ], + "model_types": [ + "robotics" + ] + }, + { + "name": "nvidia/qwen2.5-cascaderl-rm-72b", + "alias": [ + "nvidia/Qwen2.5-CascadeRL-RM-72B", + "Qwen2.5-CascadeRL-RM-72B", + "qwen2.5-cascaderl-rm-72b" + ], + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/nemotron-cascade-8b-thinking", + "alias": [ + "nvidia/Nemotron-Cascade-8B-Thinking", + "Nemotron-Cascade-8B-Thinking", + "nemotron-cascade-8b-thinking" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "nvidia/nemotron-cascade-8b", + "alias": [ + "nvidia/Nemotron-Cascade-8B", + "Nemotron-Cascade-8B", + "nemotron-cascade-8b" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "nvidia/nemotron-cascade-14b-thinking", + "alias": [ + "nvidia/Nemotron-Cascade-14B-Thinking", + "Nemotron-Cascade-14B-Thinking", + "nemotron-cascade-14b-thinking" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "nvidia/diar_streaming_sortformer_4spk-v2", + "alias": [ + "diar_streaming_sortformer_4spk-v2" + ], + "model_types": [ + "asr" + ] + }, + { + "name": "nvidia/diar_streaming_sortformer_4spk-v2.1", + "alias": [ + "diar_streaming_sortformer_4spk-v2.1" + ], + "model_types": [ + "asr" + ] + }, + { + "name": "nvidia/nemotron-cascade-8b-intermediate-ckpts", + "alias": [ + "nvidia/Nemotron-Cascade-8B-Intermediate-ckpts", + "Nemotron-Cascade-8B-Intermediate-ckpts", + "nemotron-cascade-8b-intermediate-ckpts" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "nvidia/qwen3-nemotron-14b-brrm", + "alias": [ + "nvidia/Qwen3-Nemotron-14B-BRRM", + "Qwen3-Nemotron-14B-BRRM", + "qwen3-nemotron-14b-brrm" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/qwen3-nemotron-8b-brrm", + "alias": [ + "nvidia/Qwen3-Nemotron-8B-BRRM", + "Qwen3-Nemotron-8B-BRRM", + "qwen3-nemotron-8b-brrm" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/pi05-arena-gr1-microwave", + "alias": [ + "pi05-arena-gr1-microwave" + ], + "model_types": [ + "robotics" + ] + }, + { + "name": "nvidia/smolvla-arena-gr1-microwave", + "alias": [ + "smolvla-arena-gr1-microwave" + ], + "model_types": [ + "robotics" + ] + }, + { + "name": "nvidia/gr00t-n1.6-3b", + "alias": [ + "nvidia/GR00T-N1.6-3B", + "GR00T-N1.6-3B", + "gr00t-n1.6-3b" + ], + "model_types": [ + "other" + ] + }, + { + "name": "nvidia/groot-n1.6-behavior1k", + "alias": [ + "groot-n1.6-behavior1k" + ], + "model_types": [ + "robotics" + ] + }, + { + "name": "nvidia/groot-n1.6-bridge", + "alias": [ + "groot-n1.6-bridge" + ], + "model_types": [ + "robotics" + ] + }, + { + "name": "nvidia/groot-n1.6-g1-pnpappletoplate", + "alias": [ + "groot-n1.6-g1-pnpappletoplate" + ], + "model_types": [ + "robotics" + ] + }, + { + "name": "nvidia/groot-n1.6-fractal", + "alias": [ + "groot-n1.6-fractal" + ], + "model_types": [ + "robotics" + ] + }, + { + "name": "nvidia/geneformer_v2_316m", + "alias": [ + "geneformer_v2_316m" + ], + "model_types": [ + "other" + ] + }, + { + "name": "nvidia/geneformer_v2_104m_clcancer", + "alias": [ + "geneformer_v2_104m_clcancer" + ], + "model_types": [ + "other" + ] + }, + { + "name": "nvidia/geneformer_v2_104m", + "alias": [ + "geneformer_v2_104m" + ], + "model_types": [ + "other" + ] + }, + { + "name": "nvidia/diar_sortformer_4spk-v1", + "alias": [ + "diar_sortformer_4spk-v1" + ], + "model_types": [ + "asr" + ] + }, + { + "name": "nvidia/qwen3-nemotron-235b-a22b-genrm", + "alias": [ + "qwen3-nemotron-235b-a22b-genrm" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "nvidia/nvpanoptix-3d", + "alias": [ + "nvpanoptix-3d" + ], + "model_types": [ + "other" + ] + }, + { + "name": "nvidia/geneformer_v1_10m", + "alias": [ + "geneformer_v1_10m" + ], + "model_types": [ + "other" + ] + }, + { + "name": "nvidia/llama-4-scout-17b-16e-instruct-nvfp4", + "alias": [ + "llama-4-scout-17b-16e-instruct-nvfp4" + ], + "max_tokens": 10485760, + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/llama-4-scout-17b-16e-instruct-fp8", + "alias": [ + "llama-4-scout-17b-16e-instruct-fp8" + ], + "max_tokens": 10485760, + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/qwen2.5-vl-7b-instruct-fp8", + "alias": [ + "qwen2.5-vl-7b-instruct-fp8" + ], + "max_tokens": 131072, + "model_types": [ + "chat", + "vision", + "image2text" + ] + }, + { + "name": "nvidia/riva-translate-4b-instruct", + "alias": [ + "riva-translate-4b-instruct" + ], + "max_tokens": 32768, + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/cosmos-reason1-7b", + "alias": [ + "cosmos-reason1-7b" + ], + "model_types": [ + "chat", + "vision", + "image2text" + ] + }, + { + "name": "nvidia/nv-dualbind-1m-v1", + "alias": [ + "nv-dualbind-1m-v1" + ], + "model_types": [ + "embedding", + "vision" + ] + }, + { + "name": "nvidia/nv-megalodon-qm9-v1", + "alias": [ + "nv-megalodon-qm9-v1" + ], + "model_types": [ + "other" + ] + }, + { + "name": "nvidia/nv-megalodon-geom-drugs-v1", + "alias": [ + "nv-megalodon-geom-drugs-v1" + ], + "model_types": [ + "other" + ] + }, + { + "name": "nvidia/nv-genmol-89m-v1", + "alias": [ + "nv-genmol-89m-v1" + ], + "model_types": [ + "other" + ] + }, + { + "name": "nvidia/nv-genmol-89m-v2", + "alias": [ + "nv-genmol-89m-v2" + ], + "model_types": [ + "other" + ] + }, + { + "name": "nvidia/nv-proteina-60m-v1", + "alias": [ + "nv-proteina-60m-v1" + ], + "model_types": [ + "other" + ] + }, + { + "name": "nvidia/nv-proteina-200m-v1", + "alias": [ + "nv-proteina-200m-v1" + ], + "model_types": [ + "other" + ] + }, + { + "name": "nvidia/nv-proteina-400m-v1", + "alias": [ + "nv-proteina-400m-v1" + ], + "model_types": [ + "other" + ] + }, + { + "name": "nvidia/nv-la-proteina-motif-v1", + "alias": [ + "nv-la-proteina-motif-v1" + ], + "model_types": [ + "other" + ] + }, + { + "name": "nvidia/nv-la-proteina-ucond-v1", + "alias": [ + "nv-la-proteina-ucond-v1" + ], + "model_types": [ + "other" + ] + }, + { + "name": "nvidia/gliner-pii", + "alias": [ + "gliner-pii" + ], + "model_types": [ + "moderation" + ] + }, + { + "name": "nvidia/nemotron-content-safety-reasoning-4b", + "alias": [ + "nemotron-content-safety-reasoning-4b" + ], + "model_types": [ + "moderation" + ] + }, + { + "name": "nvidia/qwen2.5-vl-7b-instruct-nvfp4", + "alias": [ + "qwen2.5-vl-7b-instruct-nvfp4" + ], + "max_tokens": 131072, + "model_types": [ + "chat", + "vision", + "image2text" + ] + }, + { + "name": "nvidia/cosmos-predict2.5-14b", + "alias": [ + "cosmos-predict2.5-14b" + ], + "model_types": [ + "video_generation" + ] + }, + { + "name": "nvidia/llama-3.1-nemotron-nano-vl-8b-v1", + "alias": [ + "llama-3.1-nemotron-nano-vl-8b-v1" + ], + "max_tokens": 262144, + "model_types": [ + "chat", + "vision", + "image2text" + ] + }, + { + "name": "nvidia/fixer", + "alias": [ + "fixer" + ], + "model_types": [ + "image_edit" + ] + }, + { + "name": "nvidia/parakeet_realtime_eou_120m-v1", + "alias": [ + "parakeet_realtime_eou_120m-v1" + ], + "model_types": [ + "asr" + ] + }, + { + "name": "nvidia/parakeet-tdt-1.1b", + "alias": [ + "parakeet-tdt-1.1b" + ], + "model_types": [ + "asr" + ] + }, + { + "name": "nvidia/parakeet-rnnt-0.6b", + "alias": [ + "parakeet-rnnt-0.6b" + ], + "model_types": [ + "asr" + ] + }, + { + "name": "nvidia/canary-1b-v2", + "alias": [ + "canary-1b-v2" + ], + "model_types": [ + "asr" + ] + }, + { + "name": "nvidia/canary-1b", + "alias": [ + "canary-1b" + ], + "model_types": [ + "asr" + ] + }, + { + "name": "nvidia/canary-1b-flash", + "alias": [ + "canary-1b-flash" + ], + "model_types": [ + "asr" + ] + }, + { + "name": "nvidia/compass", + "alias": [ + "compass" + ], + "model_types": [ + "other" + ] + }, + { + "name": "nvidia/difix", + "alias": [ + "difix" + ], + "model_types": [ + "image_edit" + ] + }, + { + "name": "nvidia/nvidia-nemotron-nano-12b-v2-vl-bf16", + "alias": [ + "nvidia-nemotron-nano-12b-v2-vl-bf16" + ], + "max_tokens": 262144, + "model_types": [ + "chat", + "vision", + "image2text" + ] + }, + { + "name": "nvidia/nemotron-orchestrator-8b", + "alias": [ + "nemotron-orchestrator-8b" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "nvidia/eagle2.5-8b", + "alias": [ + "eagle2.5-8b" + ], + "model_types": [ + "chat", + "vision", + "image2text" + ] + }, + { + "name": "nvidia/audio-flamingo-3", + "alias": [ + "audio-flamingo-3" + ], + "model_types": [ + "chat", + "audio", + "asr" + ] + }, + { + "name": "nvidia/parakeet-rnnt-1.1b", + "alias": [ + "parakeet-rnnt-1.1b" + ], + "model_types": [ + "asr" + ] + }, + { + "name": "nvidia/llama-3_3-nemotron-super-49b-v1_5-nvfp4", + "alias": [ + "llama-3_3-nemotron-super-49b-v1_5-nvfp4" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/hymba-1.5b-base", + "alias": [ + "hymba-1.5b-base" + ], + "max_tokens": 131072, + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/physicalai-robotics-groot-x-embodiment-sim", + "alias": [ + "physicalai-robotics-groot-x-embodiment-sim" + ], + "model_types": [ + "robotics" + ] + }, + { + "name": "nvidia/nvidia-nemotron-nano-12b-v2", + "alias": [ + "nvidia-nemotron-nano-12b-v2" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/cosmos-tokenizer-ci8x8-lidar", + "alias": [ + "cosmos-tokenizer-ci8x8-lidar" + ], + "model_types": [ + "other" + ] + }, + { + "name": "nvidia/cosmos-transfer-lidargen", + "alias": [ + "cosmos-transfer-lidargen" + ], + "model_types": [ + "video_generation" + ] + }, + { + "name": "nvidia/nemotron-research-reasoning-qwen-1.5b", + "alias": [ + "nemotron-research-reasoning-qwen-1.5b" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "nvidia/cosmos-transfer1-7b", + "alias": [ + "cosmos-transfer1-7b" + ], + "model_types": [ + "video_generation" + ] + }, + { + "name": "nvidia/nvidia-nemotron-nano-12b-v2-vl-fp8", + "alias": [ + "nvidia-nemotron-nano-12b-v2-vl-fp8" + ], + "max_tokens": 262144, + "model_types": [ + "chat", + "vision", + "image2text" + ] + }, + { + "name": "nvidia/nvidia-nemotron-nano-12b-v2-base", + "alias": [ + "nvidia-nemotron-nano-12b-v2-base" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/nvidia-nemotron-nano-9b-v2-base", + "alias": [ + "nvidia-nemotron-nano-9b-v2-base" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/groot-n1.5-3b-wavehand", + "alias": [ + "groot-n1.5-3b-wavehand" + ], + "model_types": [ + "robotics" + ] + }, + { + "name": "nvidia/qwen3-nemotron-32b-rlbff", + "alias": [ + "qwen3-nemotron-32b-rlbff" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/qwen3-nemotron-32b-genrm-principle", + "alias": [ + "qwen3-nemotron-32b-genrm-principle" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "nvidia/llama-3.3-nemotron-70b-reward-principle", + "alias": [ + "llama-3.3-nemotron-70b-reward-principle" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/llama-3.1-nemotron-safety-guard-8b-v3", + "alias": [ + "llama-3.1-nemotron-safety-guard-8b-v3" + ], + "model_types": [ + "moderation" + ] + }, + { + "name": "nvidia/nv-codonfm-encodon-te-cdwt-1b-v1", + "alias": [ + "nv-codonfm-encodon-te-cdwt-1b-v1" + ], + "model_types": [ + "other" + ] + }, + { + "name": "nvidia/nv-codonfm-encodon-te-1b-v1", + "alias": [ + "nv-codonfm-encodon-te-1b-v1" + ], + "model_types": [ + "other" + ] + }, + { + "name": "nvidia/nv-codonfm-encodon-te-600m-v1", + "alias": [ + "nv-codonfm-encodon-te-600m-v1" + ], + "model_types": [ + "other" + ] + }, + { + "name": "nvidia/nv-codonfm-encodon-te-80m-v1", + "alias": [ + "nv-codonfm-encodon-te-80m-v1" + ], + "model_types": [ + "other" + ] + }, + { + "name": "nvidia/nv-segment-ctmrmedtech", + "alias": [ + "nv-segment-ctmrmedtech" + ], + "model_types": [ + "other" + ] + }, + { + "name": "nvidia/nv-reason-cxr-3b", + "alias": [ + "nv-reason-cxr-3b" + ], + "model_types": [ + "chat", + "vision", + "image2text" + ] + }, + { + "name": "nvidia/nv-codonfm-encodon-cdwt-1b-v1", + "alias": [ + "nv-codonfm-encodon-cdwt-1b-v1" + ], + "model_types": [ + "other" + ] + }, + { + "name": "nvidia/nv-codonfm-encodon-1b-v1", + "alias": [ + "nv-codonfm-encodon-1b-v1" + ], + "model_types": [ + "other" + ] + }, + { + "name": "nvidia/nv-codonfm-encodon-600m-v1", + "alias": [ + "nv-codonfm-encodon-600m-v1" + ], + "model_types": [ + "other" + ] + }, + { + "name": "nvidia/nv-codonfm-encodon-80m-v1", + "alias": [ + "nv-codonfm-encodon-80m-v1" + ], + "model_types": [ + "other" + ] + }, + { + "name": "nvidia/dler-r1-7b-research", + "alias": [ + "dler-r1-7b-research" + ], + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "nvidia/dler-r1-1.5b-research", + "alias": [ + "dler-r1-1.5b-research" + ], + "model_types": [ + "chat" + ], + "thinking": { + "default_value": true, + "clear_thinking": true + } + }, + { + "name": "nvidia/dler-llama-nemotron-8b-merge-research", + "alias": [ + "dler-llama-nemotron-8b-merge-research" + ], + "max_tokens": 262144, + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/nemotron-h-4b-base-8k", + "alias": [ + "nemotron-h-4b-base-8k" + ], + "max_tokens": 8192, + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/nemotron-h-4b-instruct-128k", + "alias": [ + "nemotron-h-4b-instruct-128k" + ], + "max_tokens": 131072, + "model_types": [ + "chat" + ] + }, + { + "name": "nvidia/stt_ar_fastconformer_hybrid_large_pc_v1.0", + "alias": [ + "stt_ar_fastconformer_hybrid_large_pc_v1.0" + ], + "model_types": [ + "asr" + ] + }, + { + "name": "nvidia/audio2face-3d-v2.3.1-james", + "alias": [ + "audio2face-3d-v2.3.1-james" + ], + "model_types": [ + "audio", + "3d_generation" + ] + }, + { + "name": "nvidia/audio2face-3d-v2.3.1-claire", + "alias": [ + "audio2face-3d-v2.3.1-claire" + ], + "model_types": [ + "audio", + "3d_generation" + ] + }, + { + "name": "nvidia/audio2face-3d-v2.3-mark", + "alias": [ + "audio2face-3d-v2.3-mark" + ], + "model_types": [ + "audio", + "3d_generation" + ] } ] }