From 603262e42aec8350da3f5c57ab5e345017041ee8 Mon Sep 17 00:00:00 2001 From: wuqinchuan Date: Tue, 17 Feb 2026 18:11:25 +0800 Subject: [PATCH] fix: pass recursive parameter to embedding and include in cache key - Pass recursive parameter from request to _build_embeddings_one_folder - Include recursive in cache_params to avoid cache collision between recursive and non-recursive clustering results - Add debug logging for recursive parameter tracking Co-Authored-By: Claude --- scripts/iib/topic_cluster.py | 5 +++++ 1 file changed, 5 insertions(+) diff --git a/scripts/iib/topic_cluster.py b/scripts/iib/topic_cluster.py index 503d532..4f5eb75 100644 --- a/scripts/iib/topic_cluster.py +++ b/scripts/iib/topic_cluster.py @@ -841,13 +841,17 @@ def mount_topic_cluster_routes( batch_size = max(1, min(int(req.batch_size or 64), 256)) max_chars = max(256, min(int(req.max_chars or 4000), 8000)) force = bool(req.force_embed) + recursive = bool(req.recursive) if req.recursive is not None else True + logger.info(f"[_run_cluster_job] recursive={recursive}, req.recursive={req.recursive}") for f in folders: + logger.info(f"[_run_cluster_job] Building embeddings for folder: {f}, recursive={recursive}") await _build_embeddings_one_folder( folder=f, model=model, force=force, batch_size=batch_size, max_chars=max_chars, + recursive=recursive, progress_cb=_embed_cb, ) @@ -876,6 +880,7 @@ def mount_topic_cluster_routes( "lang": str(req.lang or ""), "nv": _PROMPT_NORMALIZE_VERSION, "nm": _PROMPT_NORMALIZE_MODE, + "recursive": recursive, } h = hashlib.sha1() h.update(json.dumps({"folders": folders, "params": cache_params}, ensure_ascii=False, sort_keys=True).encode("utf-8"))