feat: Auto-adjust chunk recall weights based on user feedback (#12689)

### What problem does this PR solve? Implements automatic adjustment of knowledge base chunk recall weights based on user feedback (upvotes/downvotes). When users upvote or downvote a response, the system locates the corresponding knowledge snippets and adjusts their recall weight to improve future retrieval quality. **Closes #12670** **How it works:** 1. User upvotes/downvotes a response via `POST /thumbup` 2. System extracts chunk IDs from the conversation reference 3. For each referenced chunk: - Reads current `pagerank_fea` value from document store - Increments (+1) for upvote or decrements (-1) for downvote - Clamps weight to [0, 100] range - Updates chunk in ES/Infinity/OceanBase 4. Future retrievals score these chunks higher/lower based on accumulated feedback **Files changed:** - `api/db/services/chunk_feedback_service.py` - New service for updating chunk pagerank weights - `api/apps/conversation_app.py` - Integrated feedback service into thumbup endpoint - `test/testcases/test_web_api/test_chunk_feedback/` - Unit tests ### Type of change - [x] New Feature (non-breaking change which adds functionality)  ## Summary by CodeRabbit * **New Features** * Chat message feedback now updates per-chunk relevance weights (feature-flag gated), with configurable weighting and atomic updates across storage backends. * **Bug Fixes** * Stricter validation for message feedback inputs and more robust handling of feedback transitions. * **Tests** * Expanded test coverage for chunk-feedback behavior, weighting strategies, storage backends, and thumb-flip scenarios. * **Chores** * CI workflow extended to run the new chunk-feedback web API tests.  --------- Co-authored-by: mkdev11 <YOUR_GITHUB_ID+MkDev11@users.noreply.github.com> Co-authored-by: mkdev11 <MkDev11@users.noreply.github.com>
2026-07-03 01:01:56 +08:00 · 2026-04-07 18:52:18 -07:00
parent 4a2a17c27a
commit cfee2bc9db
11 changed files with 1293 additions and 13 deletions
--- a/api/apps/restful_apis/chat_api.py
+++ b/api/apps/restful_apis/chat_api.py
@@ -28,6 +28,7 @@ from api.db.joint_services.tenant_model_service import (
    get_model_config_by_type_and_name,
    get_tenant_default_model_by_type,
 )
+from api.db.services.chunk_feedback_service import ChunkFeedbackService
 from api.db.services.conversation_service import ConversationService, structure_answer
 from api.db.services.dialog_service import DialogService, async_ask, async_chat, gen_mindmap
 from api.db.services.knowledgebase_service import KnowledgebaseService
@@ -769,28 +770,64 @@ async def delete_session_message(chat_id, session_id, msg_id):
@manager.route("/chats/<chat_id>/sessions/<session_id>/messages/<msg_id>/feedback", methods=["PUT"])  # noqa: F821
@login_required
 async def update_message_feedback(chat_id, session_id, msg_id):
-    if not _ensure_owned_chat(chat_id):
+    owned = _ensure_owned_chat(chat_id)
+    if not owned:
        return get_json_result(data=False, message="No authorization.", code=RetCode.AUTHENTICATION_ERROR)
    try:
        req = await get_request_json()
        ok, conv = ConversationService.get_by_id(session_id)
        if not ok or conv.dialog_id != chat_id:
            return get_data_error_result(message="Session not found!")
-        up_down = req.get("thumbup")
+        thumb_raw = req.get("thumbup")
+        if not isinstance(thumb_raw, bool):
+            return get_data_error_result(message="thumbup must be a boolean")
        feedback = req.get("feedback", "")
-        conv = conv.to_dict()
-        for msg in conv["message"]:
+        conv_dict = conv.to_dict()
+        message_index = None
+        apply_chunk_feedback = False
+        prior_thumb = None
+        for i, msg in enumerate(conv_dict["message"]):
            if msg_id == msg.get("id", "") and msg.get("role", "") == "assistant":
-                if up_down:
+                prior_thumb = msg.get("thumbup")
+                if thumb_raw is True:
                    msg["thumbup"] = True
                    msg.pop("feedback", None)
+                    apply_chunk_feedback = prior_thumb is not True
                else:
                    msg["thumbup"] = False
                    if feedback:
                        msg["feedback"] = feedback
+                    apply_chunk_feedback = prior_thumb is not False
+                message_index = i
                break
-        ConversationService.update_by_id(conv["id"], conv)
-        return get_json_result(data=_build_session_response(conv))
+
+        if message_index is not None and apply_chunk_feedback:
+            try:
+                ref_index = (message_index - 1) // 2
+                if 0 <= ref_index < len(conv_dict.get("reference", [])):
+                    reference = conv_dict["reference"][ref_index]
+                    if reference:
+                        if isinstance(prior_thumb, bool) and prior_thumb != thumb_raw:
+                            ChunkFeedbackService.apply_feedback(
+                                tenant_id=current_user.id,
+                                reference=reference,
+                                is_positive=not prior_thumb,
+                            )
+                        feedback_result = ChunkFeedbackService.apply_feedback(
+                            tenant_id=current_user.id,
+                            reference=reference,
+                            is_positive=thumb_raw is True,
+                        )
+                        logging.debug(
+                            "Chunk feedback applied: %s succeeded, %s failed",
+                            feedback_result["success_count"],
+                            feedback_result["fail_count"],
+                        )
+            except Exception as e:
+                logging.warning("Failed to apply chunk feedback: %s", e)
+
+        ConversationService.update_by_id(conv_dict["id"], conv_dict)
+        return get_json_result(data=_build_session_response(conv_dict))
    except Exception as ex:
        return server_error_response(ex)

--- a/api/db/services/chunk_feedback_service.py
+++ b/api/db/services/chunk_feedback_service.py
@@ -0,0 +1,321 @@
+#
+#  Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
+#
+#  Licensed under the Apache License, Version 2.0 (the "License");
+#  you may not use this file except in compliance with the License.
+#  You may obtain a copy of the License at
+#
+#      http://www.apache.org/licenses/LICENSE-2.0
+#
+#  Unless required by applicable law or agreed to in writing, software
+#  distributed under the License is distributed on an "AS IS" BASIS,
+#  WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+#  See the License for the specific language governing permissions and
+#  limitations under the License.
+#
+"""
+Service for adjusting chunk recall weights based on user feedback.
+
+When users upvote or downvote responses, this service updates the pagerank_fea
+field of the referenced chunks to improve future retrieval quality.
+
+This feature is disabled by default. Enable it by setting the environment
+variable CHUNK_FEEDBACK_ENABLED=true.
+
+Weighting modes (CHUNK_FEEDBACK_WEIGHTING):
+- relevance (default): one small budget per feedback event is split across
+  cited chunks using retrieval scores (similarity / vector_similarity /
+  term_similarity) from the reference payload, so chunks that drove the answer
+  move more than weak tail context.
+- uniform: legacy behavior — each cited chunk receives the full increment or
+  decrement (stronger total effect when many chunks are cited).
+
+Budget per feedback event is a small integer (1) applied to pagerank_fea
+(0–100, integer in Infinity/OB/ES mappings). Relevance mode splits that unit
+across cited chunks; uniform mode applies one unit per chunk (legacy, stronger
+when many chunks are cited).
+
+Infinity uses row_id (returned by search results since PR #13901) for targeted
+single-row updates. If a concurrent update changes the row_id, the Infinity
+connector retries with a fresh row_id lookup.
+"""
+import logging
+import math
+import os
+from typing import List, Tuple
+
+from common.constants import PAGERANK_FLD
+from common import settings
+from rag.nlp.search import index_name
+
+
+# Feature flag - disabled by default to prevent unintended side effects
+CHUNK_FEEDBACK_ENABLED = os.getenv("CHUNK_FEEDBACK_ENABLED", "false").lower() == "true"
+
+# relevance: fixed budget split by retrieval signals; uniform: delta per chunk
+CHUNK_FEEDBACK_WEIGHTING = os.getenv("CHUNK_FEEDBACK_WEIGHTING", "relevance").strip().lower()
+
+# Integer units — matches pagerank_fea integer columns in doc stores
+UPVOTE_WEIGHT_INCREMENT = 1
+DOWNVOTE_WEIGHT_DECREMENT = 1
+MIN_PAGERANK_WEIGHT = 0
+MAX_PAGERANK_WEIGHT = 100
+
+_SCORE_KEYS = ("similarity", "vector_similarity", "term_similarity")
+
+
+def _retrieval_signal(chunk: dict) -> float:
+    """Best available retrieval score for feedback allocation; 0 if none."""
+    best = 0.0
+    for key in _SCORE_KEYS:
+        raw = chunk.get(key)
+        if raw is None:
+            continue
+        try:
+            val = float(raw)
+        except (TypeError, ValueError):
+            continue
+        if math.isfinite(val) and val > best:
+            best = val
+    return best
+
+
+def _split_integer_budget(magnitudes: List[float], budget: int) -> List[int]:
+    """Split nonnegative integer budget across positive magnitudes (largest remainder)."""
+    n = len(magnitudes)
+    if n == 0 or budget == 0:
+        return [0] * n
+    total = sum(magnitudes)
+    if total <= 0:
+        base = budget // n
+        rem = budget % n
+        out = [base] * n
+        for i in range(rem):
+            out[i] += 1
+        return out
+    raw = [budget * m / total for m in magnitudes]
+    floors = [int(math.floor(r)) for r in raw]
+    remainder = budget - sum(floors)
+    order = sorted(range(n), key=lambda i: raw[i] - floors[i], reverse=True)
+    for j in range(remainder):
+        floors[order[j]] += 1
+    return floors
+
+
+def _allocate_deltas_uniform(
+    chunk_rows: List[Tuple[str, str]],
+    signed_budget: int,
+) -> List[Tuple[str, str, int]]:
+    """Each row gets the full signed step (legacy: one unit per cited chunk)."""
+    step = UPVOTE_WEIGHT_INCREMENT if signed_budget > 0 else -DOWNVOTE_WEIGHT_DECREMENT
+    return [(cid, kb, step) for cid, kb in chunk_rows]
+
+
+def _allocate_deltas_relevance(
+    chunk_rows: List[Tuple[str, str, dict]],
+    signed_budget: int,
+) -> List[Tuple[str, str, int]]:
+    """
+    Split |signed_budget| integer units across chunks using retrieval_signal weights.
+    chunk_rows: (chunk_id, kb_id, original_chunk_dict)
+    """
+    if not chunk_rows:
+        return []
+
+    magnitudes = []
+    for _cid, _kb, ch in chunk_rows:
+        s = _retrieval_signal(ch)
+        magnitudes.append(s if s > 0 else 1.0)
+
+    total = sum(magnitudes)
+    if total <= 0:
+        magnitudes = [1.0] * len(chunk_rows)
+
+    sign = 1 if signed_budget > 0 else -1
+    budget_abs = abs(signed_budget)
+    parts = _split_integer_budget(magnitudes, budget_abs)
+    out: List[Tuple[str, str, int]] = []
+    for (cid, kb, _ch), p in zip(chunk_rows, parts, strict=True):
+        out.append((cid, kb, sign * p))
+    return out
+
+
+class ChunkFeedbackService:
+    """Service to update chunk weights based on user feedback."""
+
+    @staticmethod
+    def _feedback_rows_from_reference(reference: dict) -> List[Tuple[str, str, dict]]:
+        """(chunk_id, kb_id, raw_chunk) for chunks that can be updated (single pass).
+
+        raw_chunk is kept for retrieval-signal weighting and optional row_id.
+        """
+        if not reference:
+            return []
+        rows: List[Tuple[str, str, dict]] = []
+        for chunk in reference.get("chunks", []):
+            chunk_id = chunk.get("id") or chunk.get("chunk_id")
+            kb_id = chunk.get("dataset_id") or chunk.get("kb_id")
+            if chunk_id and kb_id:
+                rows.append((chunk_id, kb_id, chunk))
+        return rows
+
+    @staticmethod
+    def update_chunk_weight(
+        tenant_id: str,
+        chunk_id: str,
+        kb_id: str,
+        delta: int,
+        row_id: int | None = None,
+    ) -> bool:
+        """
+        Update the pagerank weight of a single chunk.
+
+        Elasticsearch, OpenSearch, OceanBase/SeekDB, and Infinity use an
+        atomic adjust on the doc store when supported. Infinity passes
+        row_id (from retrieval results) for targeted single-row updates.
+
+        Args:
+            tenant_id: The tenant ID for index naming
+            chunk_id: The chunk ID to update
+            kb_id: The knowledgebase ID
+            delta: Signed integer weight change (pagerank_fea is stored as int)
+
+        Returns:
+            True if update succeeded, False otherwise
+        """
+        try:
+            idx_name = index_name(tenant_id)
+            conn = settings.docStoreConn
+            adjust = getattr(conn, "adjust_chunk_pagerank_fea", None)
+            if callable(adjust):
+                kwargs: dict = {}
+                if row_id is not None:
+                    kwargs["row_id"] = row_id
+                success = adjust(
+                    chunk_id,
+                    idx_name,
+                    kb_id,
+                    float(delta),
+                    MIN_PAGERANK_WEIGHT,
+                    MAX_PAGERANK_WEIGHT,
+                    **kwargs,
+                )
+                if success:
+                    logging.info(
+                        "Adjusted chunk %s pagerank by %s (atomic)",
+                        chunk_id,
+                        delta,
+                    )
+                else:
+                    logging.warning("Failed atomic pagerank adjust for chunk %s", chunk_id)
+                return success
+
+            chunk = conn.get(chunk_id, idx_name, [kb_id])
+            if not chunk:
+                logging.warning("Chunk %s not found in index %s", chunk_id, idx_name)
+                return False
+
+            current_weight = float(chunk.get(PAGERANK_FLD, 0) or 0)
+            new_weight = current_weight + float(delta)
+            new_weight = max(float(MIN_PAGERANK_WEIGHT), min(float(MAX_PAGERANK_WEIGHT), new_weight))
+
+            condition = {"id": chunk_id}
+            doc_engine = settings.DOC_ENGINE.lower()
+            if new_weight <= 0.0 and doc_engine in ("elasticsearch", "opensearch"):
+                new_value = {"remove": PAGERANK_FLD}
+            else:
+                new_value = {PAGERANK_FLD: new_weight}
+
+            success = conn.update(condition, new_value, idx_name, kb_id)
+
+            if success:
+                logging.info(
+                    "Updated chunk %s pagerank: %s -> %s",
+                    chunk_id,
+                    current_weight,
+                    new_weight,
+                )
+            else:
+                logging.warning("Failed to update chunk %s pagerank", chunk_id)
+
+            return success
+
+        except Exception as e:
+            logging.exception("Error updating chunk %s weight: %s", chunk_id, e)
+            return False
+
+    @classmethod
+    def apply_feedback(
+        cls,
+        tenant_id: str,
+        reference: dict,
+        is_positive: bool
+    ) -> dict:
+        """
+        Apply user feedback to all chunks referenced in a response.
+
+        Args:
+            tenant_id: The tenant ID
+            reference: The reference dict from the conversation message
+            is_positive: True for upvote (thumbup), False for downvote
+
+        Returns:
+            Dict with 'success_count', 'fail_count', and 'chunk_ids' processed
+        """
+        # Check if feature is enabled
+        if not CHUNK_FEEDBACK_ENABLED:
+            logging.debug("Chunk feedback feature is disabled")
+            return {"success_count": 0, "fail_count": 0, "chunk_ids": [], "disabled": True}
+
+        rows = cls._feedback_rows_from_reference(reference)
+        chunk_ids = [r[0] for r in rows]
+
+        if not chunk_ids:
+            logging.debug("No chunk IDs found in reference for feedback")
+            return {"success_count": 0, "fail_count": 0, "chunk_ids": []}
+
+        signed_budget = (
+            UPVOTE_WEIGHT_INCREMENT if is_positive else -DOWNVOTE_WEIGHT_DECREMENT
+        )
+        weighting = CHUNK_FEEDBACK_WEIGHTING if CHUNK_FEEDBACK_WEIGHTING in (
+            "uniform",
+            "relevance",
+        ) else "relevance"
+
+        if weighting == "uniform":
+            deltas = _allocate_deltas_uniform([(r[0], r[1]) for r in rows], signed_budget)
+        else:
+            deltas = _allocate_deltas_relevance(rows, signed_budget)
+
+        success_count = 0
+        fail_count = 0
+
+        row_by_chunk = {r[0]: r[2].get("row_id") for r in rows}
+        for chunk_id, kb_id, delta in deltas:
+            if delta == 0:
+                continue
+            rid = row_by_chunk.get(chunk_id)
+            rid_int = None
+            if rid is not None:
+                try:
+                    rid_int = int(rid)
+                except (TypeError, ValueError):
+                    pass
+            if cls.update_chunk_weight(tenant_id, chunk_id, kb_id, delta, row_id=rid_int):
+                success_count += 1
+            else:
+                fail_count += 1
+
+        logging.info(
+            "Applied %s feedback (%s) to %s/%s chunks",
+            "positive" if is_positive else "negative",
+            weighting,
+            success_count,
+            len(chunk_ids),
+        )
+
+        return {
+            "success_count": success_count,
+            "fail_count": fail_count,
+            "chunk_ids": chunk_ids
+        }