From 2980981da2eaec18c39ec5042a9bb3cc459470e2 Mon Sep 17 00:00:00 2001
From: buua436 <sz_buua@foxmail.com>
Date: Wed, 10 Jun 2026 19:09:18 +0800
Subject: [PATCH] fix: route visual agent calls to image model (#15906)

### What problem does this PR solve?
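Ensure agent components with image inputs are routed to the `image2text`
model type instead of staying on the chat path. When images are present and
the configured model supports `image2text`, that type is now selected so
visual requests use the CV wrapper; otherwise the previous selection is kept
(chat if available, else the first model type listed for the model).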

### Type of change
- [x] Bug Fix (non-breaking change which fixes an issue)
---
 agent/component/llm.py | 7 ++++++-
 1 file changed, 6 insertions(+), 1 deletion(-)

diff --git a/agent/component/llm.py b/agent/component/llm.py
index b4b2ee038b..0ccc8bf4af 100644
--- a/agent/component/llm.py
+++ b/agent/component/llm.py
@@ -249,7 +249,12 @@ class LLM(ComponentBase):
 
         self.imgs = self._uniq_images(self.imgs + extracted_imgs)
         model_types = get_model_type_by_name(self._canvas.get_tenant_id(), self._param.llm_id)
-        model_type = LLMType.CHAT.value if LLMType.CHAT.value in model_types else model_types[0]
+        if self.imgs and LLMType.IMAGE2TEXT.value in model_types:
+            model_type = LLMType.IMAGE2TEXT.value
+        elif LLMType.CHAT.value in model_types:
+            model_type = LLMType.CHAT.value
+        else:
+            model_type = model_types[0]
         model_config = get_model_config_from_provider_instance(self._canvas.get_tenant_id(), model_type, self._param.llm_id)
         if self.imgs:
             self.chat_mdl = LLMBundle(self._canvas.get_tenant_id(), model_config, max_retries=self._param.max_retries,