mirror of
https://github.com/infiniflow/ragflow.git
synced 2026-05-26 18:57:20 +08:00
### What problem does this PR solve? Implements automatic adjustment of knowledge base chunk recall weights based on user feedback (upvotes/downvotes). When users upvote or downvote a response, the system locates the corresponding knowledge snippets and adjusts their recall weight to improve future retrieval quality. **Closes #12670** **How it works:** 1. User upvotes/downvotes a response via `POST /thumbup` 2. System extracts chunk IDs from the conversation reference 3. For each referenced chunk: - Reads current `pagerank_fea` value from document store - Increments (+1) for upvote or decrements (-1) for downvote - Clamps weight to [0, 100] range - Updates chunk in ES/Infinity/OceanBase 4. Future retrievals score these chunks higher/lower based on accumulated feedback **Files changed:** - `api/db/services/chunk_feedback_service.py` - New service for updating chunk pagerank weights - `api/apps/conversation_app.py` - Integrated feedback service into thumbup endpoint - `test/testcases/test_web_api/test_chunk_feedback/` - Unit tests ### Type of change - [x] New Feature (non-breaking change which adds functionality) <!-- This is an auto-generated comment: release notes by coderabbit.ai --> ## Summary by CodeRabbit * **New Features** * Chat message feedback now updates per-chunk relevance weights (feature-flag gated), with configurable weighting and atomic updates across storage backends. * **Bug Fixes** * Stricter validation for message feedback inputs and more robust handling of feedback transitions. * **Tests** * Expanded test coverage for chunk-feedback behavior, weighting strategies, storage backends, and thumb-flip scenarios. * **Chores** * CI workflow extended to run the new chunk-feedback web API tests. <!-- end of auto-generated comment: release notes by coderabbit.ai --> --------- Co-authored-by: mkdev11 <YOUR_GITHUB_ID+MkDev11@users.noreply.github.com> Co-authored-by: mkdev11 <MkDev11@users.noreply.github.com>
322 lines
11 KiB
Python
322 lines
11 KiB
Python
#
|
||
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
|
||
#
|
||
# Licensed under the Apache License, Version 2.0 (the "License");
|
||
# you may not use this file except in compliance with the License.
|
||
# You may obtain a copy of the License at
|
||
#
|
||
# http://www.apache.org/licenses/LICENSE-2.0
|
||
#
|
||
# Unless required by applicable law or agreed to in writing, software
|
||
# distributed under the License is distributed on an "AS IS" BASIS,
|
||
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||
# See the License for the specific language governing permissions and
|
||
# limitations under the License.
|
||
#
|
||
"""
|
||
Service for adjusting chunk recall weights based on user feedback.
|
||
|
||
When users upvote or downvote responses, this service updates the pagerank_fea
|
||
field of the referenced chunks to improve future retrieval quality.
|
||
|
||
This feature is disabled by default. Enable it by setting the environment
|
||
variable CHUNK_FEEDBACK_ENABLED=true.
|
||
|
||
Weighting modes (CHUNK_FEEDBACK_WEIGHTING):
|
||
- relevance (default): one small budget per feedback event is split across
|
||
cited chunks using retrieval scores (similarity / vector_similarity /
|
||
term_similarity) from the reference payload, so chunks that drove the answer
|
||
move more than weak tail context.
|
||
- uniform: legacy behavior — each cited chunk receives the full increment or
|
||
decrement (stronger total effect when many chunks are cited).
|
||
|
||
Budget per feedback event is a small integer (1) applied to pagerank_fea
|
||
(0–100, integer in Infinity/OB/ES mappings). Relevance mode splits that unit
|
||
across cited chunks; uniform mode applies one unit per chunk (legacy, stronger
|
||
when many chunks are cited).
|
||
|
||
Infinity uses row_id (returned by search results since PR #13901) for targeted
|
||
single-row updates. If a concurrent update changes the row_id, the Infinity
|
||
connector retries with a fresh row_id lookup.
|
||
"""
|
||
import logging
|
||
import math
|
||
import os
|
||
from typing import List, Tuple
|
||
|
||
from common.constants import PAGERANK_FLD
|
||
from common import settings
|
||
from rag.nlp.search import index_name
|
||
|
||
|
||
# Feature flag - disabled by default to prevent unintended side effects
|
||
CHUNK_FEEDBACK_ENABLED = os.getenv("CHUNK_FEEDBACK_ENABLED", "false").lower() == "true"
|
||
|
||
# relevance: fixed budget split by retrieval signals; uniform: delta per chunk
|
||
CHUNK_FEEDBACK_WEIGHTING = os.getenv("CHUNK_FEEDBACK_WEIGHTING", "relevance").strip().lower()
|
||
|
||
# Integer units — matches pagerank_fea integer columns in doc stores
|
||
UPVOTE_WEIGHT_INCREMENT = 1
|
||
DOWNVOTE_WEIGHT_DECREMENT = 1
|
||
MIN_PAGERANK_WEIGHT = 0
|
||
MAX_PAGERANK_WEIGHT = 100
|
||
|
||
_SCORE_KEYS = ("similarity", "vector_similarity", "term_similarity")
|
||
|
||
|
||
def _retrieval_signal(chunk: dict) -> float:
|
||
"""Best available retrieval score for feedback allocation; 0 if none."""
|
||
best = 0.0
|
||
for key in _SCORE_KEYS:
|
||
raw = chunk.get(key)
|
||
if raw is None:
|
||
continue
|
||
try:
|
||
val = float(raw)
|
||
except (TypeError, ValueError):
|
||
continue
|
||
if math.isfinite(val) and val > best:
|
||
best = val
|
||
return best
|
||
|
||
|
||
def _split_integer_budget(magnitudes: List[float], budget: int) -> List[int]:
|
||
"""Split nonnegative integer budget across positive magnitudes (largest remainder)."""
|
||
n = len(magnitudes)
|
||
if n == 0 or budget == 0:
|
||
return [0] * n
|
||
total = sum(magnitudes)
|
||
if total <= 0:
|
||
base = budget // n
|
||
rem = budget % n
|
||
out = [base] * n
|
||
for i in range(rem):
|
||
out[i] += 1
|
||
return out
|
||
raw = [budget * m / total for m in magnitudes]
|
||
floors = [int(math.floor(r)) for r in raw]
|
||
remainder = budget - sum(floors)
|
||
order = sorted(range(n), key=lambda i: raw[i] - floors[i], reverse=True)
|
||
for j in range(remainder):
|
||
floors[order[j]] += 1
|
||
return floors
|
||
|
||
|
||
def _allocate_deltas_uniform(
|
||
chunk_rows: List[Tuple[str, str]],
|
||
signed_budget: int,
|
||
) -> List[Tuple[str, str, int]]:
|
||
"""Each row gets the full signed step (legacy: one unit per cited chunk)."""
|
||
step = UPVOTE_WEIGHT_INCREMENT if signed_budget > 0 else -DOWNVOTE_WEIGHT_DECREMENT
|
||
return [(cid, kb, step) for cid, kb in chunk_rows]
|
||
|
||
|
||
def _allocate_deltas_relevance(
|
||
chunk_rows: List[Tuple[str, str, dict]],
|
||
signed_budget: int,
|
||
) -> List[Tuple[str, str, int]]:
|
||
"""
|
||
Split |signed_budget| integer units across chunks using retrieval_signal weights.
|
||
chunk_rows: (chunk_id, kb_id, original_chunk_dict)
|
||
"""
|
||
if not chunk_rows:
|
||
return []
|
||
|
||
magnitudes = []
|
||
for _cid, _kb, ch in chunk_rows:
|
||
s = _retrieval_signal(ch)
|
||
magnitudes.append(s if s > 0 else 1.0)
|
||
|
||
total = sum(magnitudes)
|
||
if total <= 0:
|
||
magnitudes = [1.0] * len(chunk_rows)
|
||
|
||
sign = 1 if signed_budget > 0 else -1
|
||
budget_abs = abs(signed_budget)
|
||
parts = _split_integer_budget(magnitudes, budget_abs)
|
||
out: List[Tuple[str, str, int]] = []
|
||
for (cid, kb, _ch), p in zip(chunk_rows, parts, strict=True):
|
||
out.append((cid, kb, sign * p))
|
||
return out
|
||
|
||
|
||
class ChunkFeedbackService:
|
||
"""Service to update chunk weights based on user feedback."""
|
||
|
||
@staticmethod
|
||
def _feedback_rows_from_reference(reference: dict) -> List[Tuple[str, str, dict]]:
|
||
"""(chunk_id, kb_id, raw_chunk) for chunks that can be updated (single pass).
|
||
|
||
raw_chunk is kept for retrieval-signal weighting and optional row_id.
|
||
"""
|
||
if not reference:
|
||
return []
|
||
rows: List[Tuple[str, str, dict]] = []
|
||
for chunk in reference.get("chunks", []):
|
||
chunk_id = chunk.get("id") or chunk.get("chunk_id")
|
||
kb_id = chunk.get("dataset_id") or chunk.get("kb_id")
|
||
if chunk_id and kb_id:
|
||
rows.append((chunk_id, kb_id, chunk))
|
||
return rows
|
||
|
||
@staticmethod
|
||
def update_chunk_weight(
|
||
tenant_id: str,
|
||
chunk_id: str,
|
||
kb_id: str,
|
||
delta: int,
|
||
row_id: int | None = None,
|
||
) -> bool:
|
||
"""
|
||
Update the pagerank weight of a single chunk.
|
||
|
||
Elasticsearch, OpenSearch, OceanBase/SeekDB, and Infinity use an
|
||
atomic adjust on the doc store when supported. Infinity passes
|
||
row_id (from retrieval results) for targeted single-row updates.
|
||
|
||
Args:
|
||
tenant_id: The tenant ID for index naming
|
||
chunk_id: The chunk ID to update
|
||
kb_id: The knowledgebase ID
|
||
delta: Signed integer weight change (pagerank_fea is stored as int)
|
||
|
||
Returns:
|
||
True if update succeeded, False otherwise
|
||
"""
|
||
try:
|
||
idx_name = index_name(tenant_id)
|
||
conn = settings.docStoreConn
|
||
adjust = getattr(conn, "adjust_chunk_pagerank_fea", None)
|
||
if callable(adjust):
|
||
kwargs: dict = {}
|
||
if row_id is not None:
|
||
kwargs["row_id"] = row_id
|
||
success = adjust(
|
||
chunk_id,
|
||
idx_name,
|
||
kb_id,
|
||
float(delta),
|
||
MIN_PAGERANK_WEIGHT,
|
||
MAX_PAGERANK_WEIGHT,
|
||
**kwargs,
|
||
)
|
||
if success:
|
||
logging.info(
|
||
"Adjusted chunk %s pagerank by %s (atomic)",
|
||
chunk_id,
|
||
delta,
|
||
)
|
||
else:
|
||
logging.warning("Failed atomic pagerank adjust for chunk %s", chunk_id)
|
||
return success
|
||
|
||
chunk = conn.get(chunk_id, idx_name, [kb_id])
|
||
if not chunk:
|
||
logging.warning("Chunk %s not found in index %s", chunk_id, idx_name)
|
||
return False
|
||
|
||
current_weight = float(chunk.get(PAGERANK_FLD, 0) or 0)
|
||
new_weight = current_weight + float(delta)
|
||
new_weight = max(float(MIN_PAGERANK_WEIGHT), min(float(MAX_PAGERANK_WEIGHT), new_weight))
|
||
|
||
condition = {"id": chunk_id}
|
||
doc_engine = settings.DOC_ENGINE.lower()
|
||
if new_weight <= 0.0 and doc_engine in ("elasticsearch", "opensearch"):
|
||
new_value = {"remove": PAGERANK_FLD}
|
||
else:
|
||
new_value = {PAGERANK_FLD: new_weight}
|
||
|
||
success = conn.update(condition, new_value, idx_name, kb_id)
|
||
|
||
if success:
|
||
logging.info(
|
||
"Updated chunk %s pagerank: %s -> %s",
|
||
chunk_id,
|
||
current_weight,
|
||
new_weight,
|
||
)
|
||
else:
|
||
logging.warning("Failed to update chunk %s pagerank", chunk_id)
|
||
|
||
return success
|
||
|
||
except Exception as e:
|
||
logging.exception("Error updating chunk %s weight: %s", chunk_id, e)
|
||
return False
|
||
|
||
@classmethod
|
||
def apply_feedback(
|
||
cls,
|
||
tenant_id: str,
|
||
reference: dict,
|
||
is_positive: bool
|
||
) -> dict:
|
||
"""
|
||
Apply user feedback to all chunks referenced in a response.
|
||
|
||
Args:
|
||
tenant_id: The tenant ID
|
||
reference: The reference dict from the conversation message
|
||
is_positive: True for upvote (thumbup), False for downvote
|
||
|
||
Returns:
|
||
Dict with 'success_count', 'fail_count', and 'chunk_ids' processed
|
||
"""
|
||
# Check if feature is enabled
|
||
if not CHUNK_FEEDBACK_ENABLED:
|
||
logging.debug("Chunk feedback feature is disabled")
|
||
return {"success_count": 0, "fail_count": 0, "chunk_ids": [], "disabled": True}
|
||
|
||
rows = cls._feedback_rows_from_reference(reference)
|
||
chunk_ids = [r[0] for r in rows]
|
||
|
||
if not chunk_ids:
|
||
logging.debug("No chunk IDs found in reference for feedback")
|
||
return {"success_count": 0, "fail_count": 0, "chunk_ids": []}
|
||
|
||
signed_budget = (
|
||
UPVOTE_WEIGHT_INCREMENT if is_positive else -DOWNVOTE_WEIGHT_DECREMENT
|
||
)
|
||
weighting = CHUNK_FEEDBACK_WEIGHTING if CHUNK_FEEDBACK_WEIGHTING in (
|
||
"uniform",
|
||
"relevance",
|
||
) else "relevance"
|
||
|
||
if weighting == "uniform":
|
||
deltas = _allocate_deltas_uniform([(r[0], r[1]) for r in rows], signed_budget)
|
||
else:
|
||
deltas = _allocate_deltas_relevance(rows, signed_budget)
|
||
|
||
success_count = 0
|
||
fail_count = 0
|
||
|
||
row_by_chunk = {r[0]: r[2].get("row_id") for r in rows}
|
||
for chunk_id, kb_id, delta in deltas:
|
||
if delta == 0:
|
||
continue
|
||
rid = row_by_chunk.get(chunk_id)
|
||
rid_int = None
|
||
if rid is not None:
|
||
try:
|
||
rid_int = int(rid)
|
||
except (TypeError, ValueError):
|
||
pass
|
||
if cls.update_chunk_weight(tenant_id, chunk_id, kb_id, delta, row_id=rid_int):
|
||
success_count += 1
|
||
else:
|
||
fail_count += 1
|
||
|
||
logging.info(
|
||
"Applied %s feedback (%s) to %s/%s chunks",
|
||
"positive" if is_positive else "negative",
|
||
weighting,
|
||
success_count,
|
||
len(chunk_ids),
|
||
)
|
||
|
||
return {
|
||
"success_count": success_count,
|
||
"fail_count": fail_count,
|
||
"chunk_ids": chunk_ids
|
||
}
|