Files
ragflow/conf/models/tokenpony.json
dripsmvcp ed04893415 Go: implement provider: TokenPony (#15091)
## Summary
- Adds a `TokenPony` Go driver so the new API server can route TokenPony
chat instances, matching the existing Python `TokenPonyChat`
(`rag/llm/chat_model.py:1210`). Follows the same SaaS-driver shape used
for Astraflow, Avian, Novita, TogetherAI, Replicate, DeepInfra, Upstage,
and LongCat.

Closes #15086

---------

Co-authored-by: Jin Hai <haijin.chn@gmail.com>
2026-05-22 15:21:45 +08:00

94 lines
1.9 KiB
JSON

{
  "name": "TokenPony",
  "url": {
    "default": "https://api.tokenpony.cn/v1"
  },
  "url_suffix": {
    "chat": "chat/completions",
    "models": "models"
  },
  "class": "tokenpony",
  "models": [
    {
      "name": "qwen3-8b",
      "max_tokens": 128000,
      "model_types": ["chat"]
    },
    {
      "name": "deepseek-v3-0324",
      "max_tokens": 128000,
      "model_types": ["chat"]
    },
    {
      "name": "qwen3-32b",
      "max_tokens": 128000,
      "model_types": ["chat"]
    },
    {
      "name": "kimi-k2-instruct-0905",
      "max_tokens": 256000,
      "model_types": ["chat"]
    },
    {
      "name": "deepseek-r1-0528",
      "max_tokens": 164000,
      "model_types": ["chat"]
    },
    {
      "name": "qwen3-coder-480b",
      "max_tokens": 1024000,
      "model_types": ["chat"]
    },
    {
      "name": "hunyuan-a13b-instruct",
      "max_tokens": 256000,
      "model_types": ["chat"]
    },
    {
      "name": "qwen3-next-80b-a3b-instruct",
      "max_tokens": 1024000,
      "model_types": ["chat"]
    },
    {
      "name": "deepseek-v3.2-exp",
      "max_tokens": 128000,
      "model_types": ["chat"]
    },
    {
      "name": "deepseek-v3.1-terminus",
      "max_tokens": 128000,
      "model_types": ["chat"]
    },
    {
      "name": "qwen3-vl-235b-a22b-instruct",
      "max_tokens": 262000,
      "model_types": ["chat"]
    },
    {
      "name": "qwen3-vl-30b-a3b-instruct",
      "max_tokens": 262000,
      "model_types": ["chat"]
    },
    {
      "name": "deepseek-ocr",
      "max_tokens": 8000,
      "model_types": ["chat"]
    },
    {
      "name": "qwen3-235b-a22b-instruct-2507",
      "max_tokens": 256000,
      "model_types": ["chat"]
    },
    {
      "name": "glm-4.6",
      "max_tokens": 200000,
      "model_types": ["chat"]
    },
    {
      "name": "minimax-m2",
      "max_tokens": 200000,
      "model_types": ["chat"]
    }
  ]
}