diff --git a/fastapi_app/config/settings.py b/fastapi_app/config/settings.py index 1bdeead..9be9bd9 100644 --- a/fastapi_app/config/settings.py +++ b/fastapi_app/config/settings.py @@ -75,6 +75,48 @@ class AppSettings(BaseSettings): LOCAL_EMBEDDING_CUDA_VISIBLE_DEVICES: Optional[str] = None LOCAL_EMBEDDING_GPU_MEMORY_UTILIZATION: float = 0.3 + # ── GraphRAG ────────────────────────────────────────────────────────────── + # 查询侧默认用较快聊天模型;索引抽取亦走同一 default_chat_model(见 settings.yaml) + GRAPHRAG_LLM_MODEL: str = "deepseek-v3.2" + GRAPHRAG_EMBEDDING_MODEL: str = "text-embedding-3-small" + # True 且 USE_LOCAL_EMBEDDING=1 时,查询/索引写入的 embedding 指向本地 vLLM(须与向量维度一致;从 OpenAI 维度过来的库需重建索引) + GRAPHRAG_USE_LOCAL_EMBEDDING_RUNTIME: bool = True + GRAPHRAG_OUTPUT_DIR: str = "outputs/graphrag_kb" # workspace root, layout: {dir}/{email}/{nb_id}/ + GRAPHRAG_CMD: str = "" # graphrag CLI path; auto-detected from PATH if empty + GRAPHRAG_CHUNK_SIZE: int = 384 # chars per chunk; also written to settings.yaml chunks.size + GRAPHRAG_CHUNK_OVERLAP: int = 48 + # 写入 prompt,偏短输出可缩短 local_search 生成时间 + GRAPHRAG_RESPONSE_TYPE: str = "At most 4 bullet points; be concise." 
+ GRAPHRAG_COMMUNITY_LEVEL: int = 1 # 低于 2 通常更快,社区上下文更少 + GRAPHRAG_LOCAL_SEARCH_CONTEXT_MAX_TOKENS: int = 12000 # 低于 24000 可加快检索上下文组装与生成 + GRAPHRAG_SUBGRAPH_PRUNE_ENABLED: bool = True # run LLM subgraph pruning after each query + GRAPHRAG_SUBGRAPH_PRUNE_MODEL: str = "deepseek-v3.2" # 仅单独裁剪路径使用 + GRAPHRAG_SUBGRAPH_PRUNE_MAX_EDGES_INPUT: int = 28 # 裁剪+Judge 合并路径:输入边数上限(越小越快) + GRAPHRAG_SUBGRAPH_PRUNE_MAX_TOKENS: int = 512 # 单独裁剪 LLM 输出上限(若仍启用旧路径) + # 裁剪与 Judge 合并为一次 LLM(graphrag_chat / graphrag_kb query) + GRAPHRAG_PRUNE_JUDGE_MODEL: Optional[str] = None # 为空则用 JUDGE_MODEL + GRAPHRAG_PRUNE_JUDGE_MAX_TOKENS: int = 768 # 合并调用输出上限(含 analysis + judge JSON) + GRAPHRAG_MAX_HIGHLIGHT_HINTS: int = 10 # max highlight_hints returned (0 = unlimited) + # 子图实体名 → Wikidata 搜索 → 在 GraphRAG query/chat 答案末尾附加简短参考(需出网) + GRAPHRAG_WIKIDATA_ENRICH_ENABLED: bool = True + GRAPHRAG_WIKIDATA_LANG: str = "zh" # wbsearchentities + 标签/描述优先语言 + GRAPHRAG_WIKIDATA_MAX_ENTITIES: int = 8 # 最多解析的不重复实体数 + # HTTPS 读超时(秒);弱网可再加大或通过 HTTP 代理访问 wikidata.org + GRAPHRAG_WIKIDATA_TIMEOUT_SEC: float = 45.0 + GRAPHRAG_WIKIDATA_CONNECT_TIMEOUT_SEC: float = 10.0 + # 对 Read timeout / 连接错误额外重试次数(每次递增短暂退避) + GRAPHRAG_WIKIDATA_HTTP_RETRIES: int = 2 + GRAPHRAG_WIKIDATA_API_URL: str = "https://www.wikidata.org/w/api.php" + + # ── KGGen (optional triple extraction, disabled by default) ─────────────── + KGGEN_MODEL: str = "deepseek-v3.2" + KGGEN_PER_CHUNK: bool = True # True = per-chunk calls; False = full-text single call + KGGEN_LOG_CHUNK_INTERVAL: int = 10 # log every N chunks (0 = first/last only) + + # ── Judge (answer confidence scoring) ───────────────────────────────────── + JUDGE_MODEL: str = "deepseek-v3.2" # 单独 Judge;合并路径默认同此模型 + JUDGE_MAX_TOKENS: int = 256 # 弱化:更短 judge 输出 + class Config: env_file = ".env" env_file_encoding = "utf-8" diff --git a/fastapi_app/main.py b/fastapi_app/main.py index fdbd9b1..107b672 100644 --- a/fastapi_app/main.py +++ b/fastapi_app/main.py @@ -41,6 +41,7 @@ from 
fastapi.responses import FileResponse from fastapi_app.routers import auth, data_extract, files, kb, kb_embedding, paper2drawio, paper2ppt +from fastapi_app.routers import graphrag_kb from fastapi_app.middleware.api_key import APIKeyMiddleware from fastapi_app.middleware.logging import LoggingMiddleware from workflow_engine.utils import get_project_root @@ -428,6 +429,17 @@ async def _lifespan(app: FastAPI): os.environ["LOCAL_MINERU_API_URL"] = mineru_base_url os.environ["LOCAL_MINERU_MODEL"] = resolved_mineru_model + def _warmup_graphrag_imports() -> None: + try: + import graphrag.config.load_config # noqa: F401 + from graphrag import api as _graphrag_api # noqa: F401 + from graphrag.cli.query import _resolve_output_files # noqa: F401 + log.info("GraphRAG 相关 Python 包已预导入,可降低首次查询的 import 冷启动") + except ImportError as exc: + log.debug("GraphRAG 预导入跳过: %s", exc) + + _warmup_graphrag_imports() + yield for proc in managed_procs: if proc.poll() is None: @@ -476,6 +488,8 @@ def create_app() -> FastAPI: app.include_router(paper2drawio.router, prefix="/api/v1", tags=["Paper2Drawio"]) app.include_router(paper2ppt.router, prefix="/api/v1", tags=["Paper2PPT"]) app.include_router(auth.router, prefix="/api/v1", tags=["Auth"]) + # GraphRAG 知识库:/api/v1/graphrag-kb/{index,query,merge,chunk-snippet} → wa_graphrag_kb → wf_graphrag_kb + app.include_router(graphrag_kb.router, prefix="/api/v1", tags=["GraphRAG KB"]) # 静态文件:/outputs 下的文件(兼容 URL 中 %40 与 磁盘 @ 两种路径) project_root = get_project_root() diff --git a/fastapi_app/routers/graphrag_kb.py b/fastapi_app/routers/graphrag_kb.py new file mode 100644 index 0000000..39e93db --- /dev/null +++ b/fastapi_app/routers/graphrag_kb.py @@ -0,0 +1,729 @@ +"""GraphRAG 知识库 HTTP 路由(前缀在 ``main`` 中与 ``/api/v1`` 拼接)。 + +【端点与数据流】 + POST ``/graphrag-kb/index`` → ``wa_graphrag_kb.run_index`` → 建索引 → ``IndexResponse`` + POST ``/graphrag-kb/query`` → ``run_query`` → 检索 + Judge(+ 子图 CoT)→ ``QueryResponse`` + POST ``/graphrag-kb/merge`` → ``run_merge`` → 合并两 
workspace → ``MergeResponse`` + POST ``/graphrag-kb/chunk-snippet`` → 按 ``chunk_id`` 从 ``input/*.txt`` 取块;可选 ``passage_for_llm`` 与 UI 文段对齐后做抽句高亮 + POST ``/graphrag-kb/context-refine`` → 首条 text_unit 原文 + ``reasoning_subgraph`` → LLM 清洗噪声并返回 ``cleaned_text`` + ``supporting_snippets`` + +【安全】 + ``_safe_workspace_dir`` 将路径解析到项目根目录下,防止目录穿越。 + +【说明】 + 请求体携带与其它路由一致的 LLM 凭证;前端不直连 ``workflow_engine``,仅调本路由。 +""" +from __future__ import annotations + +import json +import re +import asyncio +from pathlib import Path +from typing import Any, Dict, List, Optional + +from fastapi import APIRouter, HTTPException +from pydantic import BaseModel, Field + +from fastapi_app.config import settings +from fastapi_app.workflow_adapters.wa_graphrag_kb import run_index, run_query, run_merge, run_chat +from workflow_engine.logger import get_logger +from workflow_engine.utils import get_project_root + +log = get_logger(__name__) + + +# 匹配 GraphRAG input 文件中每个 chunk 段的起始行(后跟该段正文直至下一 chunk 或 EOF) +_CHUNK_HEAD = re.compile(r"\[chunk:([a-f0-9]+)\]\s*\n", re.IGNORECASE) + + +def _extract_chunk_block_from_input_text(text: str, chunk_id: str) -> str: + """在整份 ``input/.txt`` 文本中,定位 ``[chunk:目标id]`` 之后到下一 ``[chunk:`` 之前的正文。""" + want = chunk_id.strip().lower() + matches = list(_CHUNK_HEAD.finditer(text)) + for i, m in enumerate(matches): + if m.group(1).lower() != want: + continue + start = m.end() + end = matches[i + 1].start() if i + 1 < len(matches) else len(text) + return text[start:end].strip() + return "" + + +def _reanchor_graphrag_workspace_to_root(resolved_abs: Path, root: Path) -> Optional[Path]: + """If *resolved_abs* points at another clone (browser localStorage) but shares + ``outputs/graphrag_kb/`` with this repo, map to ``root / outputs/graphrag_kb/``. + + Returns a path under *root* only if that directory exists; otherwise ``None``. 
+ """ + parts = resolved_abs.parts + for i in range(len(parts) - 1): + if parts[i] == "outputs" and parts[i + 1] == "graphrag_kb": + tail = Path(*parts[i:]) + candidate = (root / tail).resolve() + if not candidate.is_dir(): + return None + try: + candidate.relative_to(root) + return candidate + except ValueError: + return None + return None + + +def _safe_workspace_dir(raw: str) -> Path: + """将 *raw* 解析为项目根目录下的绝对路径;越界则抛 ``HTTPException(400)``。""" + root = get_project_root().resolve() + p = Path(raw.strip()) + if not p.is_absolute(): + p = (root / p).resolve() + else: + p = p.resolve() + try: + p.relative_to(root) + return p + except ValueError as exc: + alt = _reanchor_graphrag_workspace_to_root(p, root) + if alt is not None: + return alt + raise HTTPException(status_code=400, detail="workspace_dir must be under project root") from exc + +router = APIRouter(prefix="/graphrag-kb", tags=["GraphRAG KB"]) + +# --------------------------------------------------------------------------- +# Pydantic request/response models +# --------------------------------------------------------------------------- + +class _LLMBase(BaseModel): + api_url: str = Field(default_factory=lambda: settings.DEFAULT_LLM_API_URL) + api_key: str = "" + model: str = Field(default_factory=lambda: settings.GRAPHRAG_LLM_MODEL) + + +class IndexRequest(_LLMBase): + notebook_id: str + notebook_title: str = "" + email: str = "" + source_stems: Optional[List[str]] = None + workspace_dir: str = "" + force_reindex: bool = False + # Run MinerU on un-parsed PDFs before chunk extraction. + # Set to False if MinerU was already triggered via /kb/upload. + parse_pdfs: bool = True + # Default True: do not run KGGen (user-facing path is GraphRAG-only). 
+ skip_kggen: bool = True + + +class IndexResponse(BaseModel): + workspace_dir: str + num_chunks: int + kg_entities: int + kg_relations: int + + +class QueryRequest(_LLMBase): + notebook_id: str + notebook_title: str = "" + email: str = "" + question: str + search_method: str = Field(default="local", pattern="^(local|global)$") + workspace_dir: str = "" + # None: use server GRAPHRAG_WIKIDATA_ENRICH_ENABLED; False: skip Wikidata appendix + wikidata_enrich: Optional[bool] = None + + +class QueryResponse(BaseModel): + answer: str + context_data: Dict[str, Any] = Field(default_factory=dict) + reasoning_subgraph: List[Dict[str, Any]] = Field(default_factory=list) + source_chunks: List[str] = Field(default_factory=list) + highlight_hints: List[Dict[str, Any]] = Field(default_factory=list) + judge_score: float = 0.0 + judge_rationale: str = "" + reasoning_subgraph_cot: str = "" + + +class MergeRequest(_LLMBase): + notebook_id: str = "" + notebook_title: str = "" + email: str = "" + workspace_dir_a: str + workspace_dir_b: str + dedupe: bool = False + + +class MergeResponse(BaseModel): + merged_workspace_dir: str + num_chunks: int + + +class ChatRequest(_LLMBase): + notebook_id: str + notebook_title: str = "" + email: str = "" + query: str + history: List[Dict[str, Any]] = Field(default_factory=list) + search_method: str = Field(default="auto", pattern="^(auto|local|global)$") + workspace_dir: str = "" + wikidata_enrich: Optional[bool] = None + defer_postprocess: bool = False + + +class ChatResponse(BaseModel): + answer: str + intent: Dict[str, Any] = Field(default_factory=dict) + rewritten_query: str = "" + context_data: Dict[str, Any] = Field(default_factory=dict) + reasoning_subgraph: List[Dict[str, Any]] = Field(default_factory=list) + reasoning_subgraph_cot: str = "" + source_chunks: List[str] = Field(default_factory=list) + highlight_hints: List[Dict[str, Any]] = Field(default_factory=list) + judge_score: float = 0.0 + judge_rationale: str = "" + postprocess_pending: 
bool = False + graphrag_raw_answer: str = "" + + +class ChatPostprocessRequest(_LLMBase): + query: str + answer: str = "" + reasoning_subgraph: List[Dict[str, Any]] = Field(default_factory=list) + wikidata_enrich: Optional[bool] = None + mode: str = Field(default="subgraph", pattern="^(all|subgraph|wikidata)$") + + +class ChatPostprocessResponse(BaseModel): + reasoning_subgraph: List[Dict[str, Any]] = Field(default_factory=list) + reasoning_subgraph_cot: str = "" + judge_score: float = 0.0 + judge_rationale: str = "" + wikidata_appendix: str = "" + subgraph_done: bool = False + wikidata_done: bool = False + done: bool = True + + +class ChunkSnippetRequest(BaseModel): + """Resolve *chunk_id* to raw text inside GraphRAG ``input/.txt`` markers.""" + + workspace_dir: str = Field(..., description="GraphRAG workspace root (contains chunk_meta.json + input/)") + chunk_id: str = Field(..., min_length=8, description="Hex chunk id from chunk_meta / query") + # LLM credentials forwarded from the frontend (same key/url used by query/index). + api_key: str = "" + api_url: str = "" + # Optional: pass reasoning_subgraph triples so the backend can ask an LLM to pick + # the exact sentence from the chunk that best expresses one of these relationships. + triples: Optional[List[Dict[str, Any]]] = None + # Optional: same passage as shown in UI (e.g. stripped text_units[0].text). When set, + # LLM extraction uses this instead of the raw ``input/*.txt`` block so highlights align with the box. + passage_for_llm: Optional[str] = Field( + default=None, + max_length=120_000, + description="Context passage for highlight LLM; must be substring-compatible with indexed chunk", + ) + + +class ChunkSnippetResponse(BaseModel): + text: str = "" + source_stem: str = "" + found: bool = False + # LLM-extracted verbatim sentence from the chunk that best matches the triples. + # Empty string if triples were not provided or LLM extraction failed. 
+ highlighted_sentence: str = "" + + +class ContextRefineRequest(BaseModel): + """First retrieval text unit + reasoning subgraph → LLM cleans noise + picks supporting quotes.""" + + unit_text: str = Field(..., max_length=150_000, description="Raw text from context_data first Sources row") + subgraph: List[Dict[str, Any]] = Field( + default_factory=list, + description="reasoning_subgraph edges: source/target/relation", + ) + api_key: str = "" + api_url: str = "" + model: str = Field(default_factory=lambda: settings.GRAPHRAG_LLM_MODEL) + + +class ContextRefineResponse(BaseModel): + cleaned_text: str = "" + supporting_snippets: List[str] = Field(default_factory=list) + + +# --------------------------------------------------------------------------- +# Endpoints +# --------------------------------------------------------------------------- + + +def _extract_sentence_for_triples( + chunk_text: str, + triples: List[Dict[str, Any]], + *, + api_key: str = "", + api_url: str = "", +) -> str: + """Ask the configured LLM to pick the verbatim sentence from *chunk_text* that best + expresses one of the given triples. *chunk_text* may be the indexed ``input/*.txt`` + block or the UI passage (e.g. stripped ``text_units`` row) for alignment with highlights. + """ + if not chunk_text.strip() or not triples: + return "" + try: + from openai import OpenAI + except ImportError: + log.debug("[ChunkSnippet] openai not installed; skipping sentence extraction") + return "" + + triple_lines = "\n".join( + f" ({t.get('source', '?')}) --[{t.get('relation', '?')}]--> ({t.get('target', '?')})" + for t in triples[:20] + ) + system_prompt = ( + "You are a precise text extraction assistant. " + "Return ONLY the verbatim sentence or short phrase from the provided chunk " + "that best expresses one of the given relationships. " + "Do NOT paraphrase, add explanation, or include any other text." 
+ ) + user_msg = ( + f"Knowledge graph relationships:\n{triple_lines}\n\n" + f"Chunk text:\n{chunk_text}\n\n" + "Extract the EXACT sentence or phrase from the chunk that best matches " + "one of the relationships above. Return only that text." + ) + try: + import os + resolved_key = api_key.strip() or os.getenv("DF_API_KEY", "") or "none" + api_base = (api_url.strip() or settings.DEFAULT_LLM_API_URL).rstrip("/") + client = OpenAI(api_key=resolved_key, base_url=api_base) + resp = client.chat.completions.create( + model=settings.GRAPHRAG_LLM_MODEL, + max_tokens=256, + temperature=0, + messages=[ + {"role": "system", "content": system_prompt}, + {"role": "user", "content": user_msg}, + ], + ) + sentence = (resp.choices[0].message.content or "").strip() + # Sanity check: LLM must return something that actually appears in the chunk + if sentence and sentence in chunk_text: + return sentence + log.debug("[ChunkSnippet] LLM sentence not found verbatim in chunk; discarding") + return "" + except Exception as exc: + log.warning("[ChunkSnippet] LLM extraction failed: %s", exc) + return "" + + +def _refine_context_unit_with_llm( + unit_text: str, + subgraph: List[Dict[str, Any]], + *, + api_key: str, + api_url: str, + model: str, +) -> tuple[str, List[str]]: + """Return (cleaned_text, supporting_snippets) from raw first-unit text + subgraph edges.""" + raw = (unit_text or "").strip() + if not raw: + return "", [] + if not subgraph: + return raw, [] + + edge_lines: List[str] = [] + for i, e in enumerate(subgraph[:80], start=1): + if not isinstance(e, dict): + continue + s = str(e.get("source") or "").strip() + t = str(e.get("target") or "").strip() + r = str(e.get("relation") or "").strip() + if not (s and t): + continue + edge_lines.append(f"{i}. 
({s}) -[{r}]-> ({t})") + if not edge_lines: + return raw, [] + + system = ( + "You clean noisy document excerpts and select supporting quotes for a knowledge-graph subgraph.\n" + "Return ONLY valid JSON with keys: cleaned_text (string), supporting_snippets (array of strings).\n" + "Rules:\n" + "- cleaned_text: remove footers, URLs, page numbers, repeated headers, [chunk:...] / [Data:...] lines, " + "and other boilerplate. Preserve the substantive prose in reading order. Do not invent content.\n" + "- supporting_snippets: 1–6 short verbatim quotes from cleaned_text (exact substrings) that best " + "support the given subgraph edges (entities/relations). Each snippet should be one sentence or clause; " + "prefer distinct non-overlapping snippets.\n" + "- If nothing in the passage supports the subgraph, use an empty supporting_snippets array.\n" + "- Output JSON only, no markdown fences." + ) + user_msg = "raw_passage:\n" + raw[:120_000] + "\n\nsubgraph_edges:\n" + "\n".join(edge_lines) + + try: + from openai import OpenAI + import os + + resolved_key = api_key.strip() or os.getenv("DF_API_KEY", "") or "none" + api_base = (api_url.strip() or settings.DEFAULT_LLM_API_URL).rstrip("/") + client = OpenAI(api_key=resolved_key, base_url=api_base) + mdl = (model or "").strip() or settings.GRAPHRAG_LLM_MODEL + messages = [ + {"role": "system", "content": system}, + {"role": "user", "content": user_msg}, + ] + try: + comp = client.chat.completions.create( + model=mdl, + messages=messages, + temperature=0.1, + max_tokens=8192, + response_format={"type": "json_object"}, + ) + except Exception: + comp = client.chat.completions.create( + model=mdl, + messages=messages, + temperature=0.1, + max_tokens=8192, + ) + choice = (comp.choices[0].message.content or "").strip() + if choice.startswith("```"): + choice = re.sub(r"^```(?:json)?\s*", "", choice, flags=re.I) + choice = re.sub(r"\s*```\s*$", "", choice).strip() + try: + data = json.loads(choice) + except json.JSONDecodeError: + i, 
j = choice.find("{"), choice.rfind("}") + if i < 0 or j <= i: + return raw, [] + try: + data = json.loads(choice[i : j + 1]) + except json.JSONDecodeError: + return raw, [] + if not isinstance(data, dict): + return raw, [] + cleaned = str(data.get("cleaned_text") or "").strip() + snips_raw = data.get("supporting_snippets") + snips: List[str] = [] + if isinstance(snips_raw, list): + for x in snips_raw[:12]: + if isinstance(x, str) and x.strip(): + snips.append(x.strip()) + if not cleaned: + cleaned = raw + validated: List[str] = [] + for s in snips: + if s in cleaned: + validated.append(s) + continue + s2 = " ".join(s.split()) + if s2 in cleaned: + validated.append(s2) + return cleaned, validated[:6] + except Exception as exc: + log.warning("[ContextRefine] LLM refine failed: %s", exc) + return raw, [] + + +@router.post("/chat", response_model=ChatResponse, summary="GraphRAG conversational chat with intent detection") +async def chat_endpoint(req: ChatRequest): + """Multi-turn GraphRAG chat with intent detection, query rewriting, and answer synthesis.""" + try: + result = await run_chat( + notebook_id=req.notebook_id, + notebook_title=req.notebook_title, + email=req.email, + api_url=req.api_url, + api_key=req.api_key, + model=req.model, + query=req.query, + history=req.history, + search_method=req.search_method, + workspace_dir=req.workspace_dir, + wikidata_enrich=req.wikidata_enrich, + defer_postprocess=req.defer_postprocess, + ) + return ChatResponse( + answer=result.get("answer", ""), + intent=result.get("intent", {}), + rewritten_query=result.get("rewritten_query", ""), + context_data=result.get("context_data", {}), + reasoning_subgraph=result.get("reasoning_subgraph", []), + reasoning_subgraph_cot=result.get("reasoning_subgraph_cot", ""), + source_chunks=result.get("source_chunks", []), + highlight_hints=result.get("highlight_hints", []), + judge_score=float(result.get("judge_score", 0.0)), + judge_rationale=result.get("judge_rationale", ""), + 
postprocess_pending=bool(result.get("postprocess_pending", False)), + graphrag_raw_answer=result.get("graphrag_raw_answer", ""), + ) + except Exception as exc: + log.exception("[Router] /graphrag-kb/chat error: %s", exc) + raise HTTPException(status_code=500, detail=str(exc)) + + +@router.post("/chat-postprocess", response_model=ChatPostprocessResponse, summary="Postprocess chat metadata (prune/judge/wikidata)") +async def chat_postprocess_endpoint(req: ChatPostprocessRequest) -> ChatPostprocessResponse: + """Run prune+judge and Wikidata appendix after main answer has been shown.""" + from workflow_engine.toolkits.graphrag_ms_tool.judge import judge_confidence + from workflow_engine.toolkits.graphrag_ms_tool.prune_judge_combined import ( + prune_and_judge_combined_llm, + ) + from workflow_engine.toolkits.wikidata_subgraph_enrich import ( + format_wikidata_supplement_for_subgraph, + ) + + cfg = settings + edges = [e for e in (req.reasoning_subgraph or []) if isinstance(e, dict)] + if not edges: + return ChatPostprocessResponse(done=True) + + wd_flag = req.wikidata_enrich + wd_on = ( + bool(getattr(cfg, "GRAPHRAG_WIKIDATA_ENRICH_ENABLED", True)) + if wd_flag is None + else bool(wd_flag) + ) + + api_base = req.api_url.rstrip("/") + api_key = req.api_key + question = req.query + answer = req.answer + + async def _wikidata_task() -> str: + if not wd_on or req.mode == "subgraph": + return "" + return await asyncio.to_thread( + format_wikidata_supplement_for_subgraph, + edges, + lang=str(getattr(cfg, "GRAPHRAG_WIKIDATA_LANG", "zh") or "zh"), + max_entities=int(getattr(cfg, "GRAPHRAG_WIKIDATA_MAX_ENTITIES", 8) or 8), + connect_timeout=float( + getattr(cfg, "GRAPHRAG_WIKIDATA_CONNECT_TIMEOUT_SEC", 10.0) or 10.0 + ), + read_timeout=float(getattr(cfg, "GRAPHRAG_WIKIDATA_TIMEOUT_SEC", 45.0) or 45.0), + http_retries=int(getattr(cfg, "GRAPHRAG_WIKIDATA_HTTP_RETRIES", 2) or 2), + api_url=str( + getattr( + cfg, + "GRAPHRAG_WIKIDATA_API_URL", + "https://www.wikidata.org/w/api.php", 
+ ) + or "https://www.wikidata.org/w/api.php" + ), + emit_failure_hint=True, + ) + + async def _judge_task() -> tuple[List[Dict[str, Any]], str, float, str]: + if req.mode == "wikidata": + return edges, "", 0.0, "" + if bool(getattr(cfg, "GRAPHRAG_SUBGRAPH_PRUNE_ENABLED", True)) and edges: + pj = await asyncio.to_thread( + prune_and_judge_combined_llm, + question, + answer, + edges, + api_base=api_base, + api_key=api_key, + max_edges_input=int(getattr(cfg, "GRAPHRAG_SUBGRAPH_PRUNE_MAX_EDGES_INPUT", 28) or 28), + max_tokens=int(getattr(cfg, "GRAPHRAG_PRUNE_JUDGE_MAX_TOKENS", 768) or 768), + ) + return pj.edges, pj.cot, float(pj.judge.score), str(pj.judge.rationale or "") + j = await asyncio.to_thread( + judge_confidence, + question, + answer, + edges, + api_base=api_base, + api_key=api_key, + ) + return edges, "", float(j.score), str(j.rationale or "") + + try: + judge_pack, wd_extra = await asyncio.gather(_judge_task(), _wikidata_task()) + out_edges, out_cot, out_score, out_rationale = judge_pack + subgraph_done = req.mode in ("all", "subgraph") + wikidata_done = req.mode in ("all", "wikidata") + return ChatPostprocessResponse( + reasoning_subgraph=out_edges, + reasoning_subgraph_cot=out_cot, + judge_score=out_score, + judge_rationale=out_rationale, + wikidata_appendix=wd_extra, + subgraph_done=subgraph_done, + wikidata_done=wikidata_done, + done=True, + ) + except Exception as exc: + log.warning("[Router] /graphrag-kb/chat-postprocess failed: %s", exc) + return ChatPostprocessResponse( + reasoning_subgraph=edges, + reasoning_subgraph_cot="", + judge_score=0.0, + judge_rationale=f"后处理失败:{exc}", + wikidata_appendix="", + subgraph_done=req.mode in ("all", "subgraph"), + wikidata_done=req.mode in ("all", "wikidata"), + done=True, + ) + + +@router.post("/chunk-snippet", response_model=ChunkSnippetResponse, summary="Extract [chunk:…] text from GraphRAG input") +async def chunk_snippet_endpoint(req: ChunkSnippetRequest) -> ChunkSnippetResponse: + """Used by the notebook 
reader to show the exact indexed chunk, not the full MinerU MD.""" + ws = _safe_workspace_dir(req.workspace_dir) + meta_path = ws / "chunk_meta.json" + if not meta_path.is_file(): + return ChunkSnippetResponse() + try: + meta = json.loads(meta_path.read_text(encoding="utf-8")) + except Exception: + return ChunkSnippetResponse() + cid = req.chunk_id.strip().lower() + entry = meta.get(req.chunk_id.strip()) or meta.get(cid) + if not isinstance(entry, dict): + return ChunkSnippetResponse() + stem = str(entry.get("source_stem") or "").strip() + if not stem: + return ChunkSnippetResponse() + txt_path = ws / "input" / f"{stem}.txt" + if not txt_path.is_file(): + return ChunkSnippetResponse(source_stem=stem, found=False) + try: + raw = txt_path.read_text(encoding="utf-8", errors="replace") + except Exception: + return ChunkSnippetResponse(source_stem=stem, found=False) + block = _extract_chunk_block_from_input_text(raw, cid) + if not block: + return ChunkSnippetResponse(source_stem=stem, found=False) + passage = (req.passage_for_llm or "").strip() + llm_context = passage if passage else block + highlighted_sentence = "" + if req.triples: + highlighted_sentence = _extract_sentence_for_triples( + llm_context, req.triples, api_key=req.api_key, api_url=req.api_url + ) + log.debug( + "[ChunkSnippet] chunk=%s hl_len=%d hl=%r", + req.chunk_id[:8], + len(highlighted_sentence), + highlighted_sentence[:80] if highlighted_sentence else "", + ) + return ChunkSnippetResponse(text=block, source_stem=stem, found=True, highlighted_sentence=highlighted_sentence) + + +@router.post("/context-refine", response_model=ContextRefineResponse, summary="Clean first unit + supporting snippets from subgraph") +async def context_refine_endpoint(req: ContextRefineRequest) -> ContextRefineResponse: + """Side panel: raw first text_unit + reasoning_subgraph → cleaned body + verbatim supporting quotes.""" + cleaned, snips = _refine_context_unit_with_llm( + req.unit_text, + req.subgraph, + 
api_key=req.api_key, + api_url=req.api_url, + model=req.model, + ) + return ContextRefineResponse(cleaned_text=cleaned, supporting_snippets=snips) + + +# --------------------------------------------------------------------------- +# Index / query / merge +# --------------------------------------------------------------------------- + +@router.post("/index", response_model=IndexResponse, summary="Build GraphRAG index from notebook sources") +async def index_endpoint(req: IndexRequest): + """Chunk notebook sources and run GraphRAG index (KGGen off by default). + + Requires that sources have already been imported into the notebook + (via the ``/kb`` upload endpoint) so that MinerU output exists. + """ + try: + result = await run_index( + notebook_id=req.notebook_id, + notebook_title=req.notebook_title, + email=req.email, + api_url=req.api_url, + api_key=req.api_key, + model=req.model, + source_stems=req.source_stems, + workspace_dir=req.workspace_dir, + force_reindex=req.force_reindex, + parse_pdfs=req.parse_pdfs, + skip_kggen=req.skip_kggen, + ) + return IndexResponse( + workspace_dir=result.get("workspace_dir", ""), + num_chunks=result.get("num_chunks", 0), + kg_entities=result.get("kg_entities", 0), + kg_relations=result.get("kg_relations", 0), + ) + except Exception as exc: + log.exception("[Router] /graphrag-kb/index error: %s", exc) + raise HTTPException(status_code=500, detail=str(exc)) + + +@router.post("/query", response_model=QueryResponse, summary="Query GraphRAG index with Judge scoring") +async def query_endpoint(req: QueryRequest): + """Run a local or global GraphRAG search and return a structured result. 
+ + Returns: + - ``answer`` — model answer text + - ``context_data`` — serialised evidence tables (entities, relations, sources…) + - ``reasoning_subgraph`` — edge list induced from context_data + - ``source_chunks`` — chunk_ids that contributed to the answer + - ``highlight_hints`` — page/bbox hints for PDF highlighting + - ``judge_score`` — confidence score in [0.0, 1.0] + - ``judge_rationale`` — one-sentence judge explanation + - ``reasoning_subgraph_cot`` — LLM chain-of-thought for minimal subgraph (hop analysis) + """ + try: + result = await run_query( + notebook_id=req.notebook_id, + notebook_title=req.notebook_title, + email=req.email, + api_url=req.api_url, + api_key=req.api_key, + model=req.model, + question=req.question, + search_method=req.search_method, + workspace_dir=req.workspace_dir, + wikidata_enrich=req.wikidata_enrich, + ) + return QueryResponse( + answer=result.get("answer", ""), + context_data=result.get("context_data", {}), + reasoning_subgraph=result.get("reasoning_subgraph", []), + source_chunks=result.get("source_chunks", []), + highlight_hints=result.get("highlight_hints", []), + judge_score=float(result.get("judge_score", 0.0)), + judge_rationale=result.get("judge_rationale", ""), + reasoning_subgraph_cot=result.get("reasoning_subgraph_cot", ""), + ) + except Exception as exc: + log.exception("[Router] /graphrag-kb/query error: %s", exc) + raise HTTPException(status_code=500, detail=str(exc)) + + +@router.post("/merge", response_model=MergeResponse, summary="Merge two GraphRAG KG workspaces") +async def merge_endpoint(req: MergeRequest): + """Merge two GraphRAG workspaces using KGGen aggregate and re-index. + + Both ``workspace_dir_a`` and ``workspace_dir_b`` must be absolute paths to + valid, previously indexed workspaces. The merged workspace is written to + ``{workspace_dir_a}_merged/``. 
+ """ + try: + result = await run_merge( + notebook_id=req.notebook_id, + notebook_title=req.notebook_title, + email=req.email, + api_url=req.api_url, + api_key=req.api_key, + model=req.model, + workspace_dir_a=req.workspace_dir_a, + workspace_dir_b=req.workspace_dir_b, + dedupe=req.dedupe, + ) + return MergeResponse( + merged_workspace_dir=result.get("merged_workspace_dir", ""), + num_chunks=result.get("num_chunks", 0), + ) + except Exception as exc: + log.exception("[Router] /graphrag-kb/merge error: %s", exc) + raise HTTPException(status_code=500, detail=str(exc)) diff --git a/fastapi_app/source_manager.py b/fastapi_app/source_manager.py index 5778163..2645cbc 100644 --- a/fastapi_app/source_manager.py +++ b/fastapi_app/source_manager.py @@ -7,16 +7,19 @@ - Generating unified markdown for every source type - Reading back markdown / MinerU data for feature cards - Fallback to legacy kb_data / kb_mineru paths +- Structured chunk extraction with chunk_id / page_index / order / bbox (for GraphRAG) """ from __future__ import annotations import asyncio +import hashlib +import json import re import shutil import time from dataclasses import dataclass, field from pathlib import Path -from typing import List, Optional, Tuple +from typing import Any, Dict, List, Optional, Tuple from workflow_engine.logger import get_logger from workflow_engine.utils import get_project_root @@ -237,6 +240,85 @@ def ensure_sam3_dir(self, source_stem: str) -> Path: sam3_dir.mkdir(parents=True, exist_ok=True) return sam3_dir + def get_chunks_with_meta( + self, + source_stem: str, + chunk_size: int = 512, # 默认值与 settings.GRAPHRAG_CHUNK_SIZE 一致 + chunk_overlap: int = 64, # 默认值与 settings.GRAPHRAG_CHUNK_OVERLAP 一致 + ) -> List[Dict[str, Any]]: + """Return structured chunks for a single source, used by GraphRAG indexing. + + Each dict has keys: chunk_id, text, page_index, order, bbox, source_stem. + chunk_id = SHA1("{stem}:{order}")[:16], embedded as [chunk:ID] in input/*.txt. 
+ Priority: MinerU content_list.json (exact page+bbox) → MinerU MD (estimated page) + → unified MD (page_index=-1). + """ + chunks: List[Dict[str, Any]] = [] + + # 1) MinerU content_list.json — exact page + bbox per block + mineru_root = self.get_mineru_root(source_stem) + if mineru_root: + content_list_path = None + # rglob to handle varying MinerU output directory layouts + for candidate in mineru_root.parent.rglob("*_content_list.json"): + content_list_path = candidate + break + if content_list_path and content_list_path.exists(): + try: + raw_blocks = json.loads( + content_list_path.read_text(encoding="utf-8") + ) + order = 0 + for block in raw_blocks: + # MinerU uses "text" or "content" depending on version + text = (block.get("text") or block.get("content") or "").strip() + if not text: + continue # skip image / formula blocks + # MinerU uses "page_idx" or "page_index" depending on version + page_idx = int(block.get("page_idx", block.get("page_index", -1))) + bbox = block.get("bbox") # [x1,y1,x2,y2] normalized, may be None + # chunk_id = SHA1("{stem}:{order}")[:16], embedded as [chunk:ID] in input/*.txt + chunk_id = hashlib.sha1( + f"{source_stem}:{order}".encode() + ).hexdigest()[:16] + chunks.append( + { + "chunk_id": chunk_id, + "text": text, + "page_index": page_idx, + "order": order, + "bbox": bbox, + "source_stem": source_stem, + } + ) + order += 1 + if chunks: + return chunks + except Exception as e: + log.debug( + "[SourceManager] content_list.json parse failed for %s: %s", + source_stem, + e, + ) + + # 2) MinerU markdown fallback — sliding window, estimated page_index + mineru_md = self.get_mineru_md(source_stem) + if mineru_md.strip(): + chunks = self._split_text_to_chunks( + mineru_md, source_stem, chunk_size, chunk_overlap, estimate_pages=True + ) + if chunks: + return chunks + + # 3) Unified markdown fallback — no page info (Word/PPT/TXT) + md = self.get_markdown(source_stem) + if md.strip(): + return self._split_text_to_chunks( + md, 
source_stem, chunk_size, chunk_overlap, estimate_pages=False + ) + + return [] + def get_all_markdowns(self) -> List[Tuple[str, str]]: """Return [(stem, markdown_text), ...] for all sources.""" results: List[Tuple[str, str]] = [] @@ -393,3 +475,49 @@ def _find_in_sources(self, source_stem: str, subdir: str, pattern: str) -> str: except Exception: continue return "" + + @staticmethod + def _split_text_to_chunks( + text: str, + source_stem: str, + chunk_size: int, + chunk_overlap: int, + estimate_pages: bool, + ) -> List[Dict[str, Any]]: + """Sliding-window character chunking fallback when content_list is unavailable. + + estimate_pages=True roughly estimates page_index at ~2000 chars/page. + """ + chunks: List[Dict[str, Any]] = [] + text = text.strip() + if not text: + return chunks + + total_chars = len(text) + step = max(1, chunk_size - chunk_overlap) + order = 0 + pos = 0 + chars_per_page = 2000 # rough estimate: ~2000 chars per page + + while pos < total_chars: + end = min(pos + chunk_size, total_chars) + snippet = text[pos:end].strip() + if snippet: + page_idx = int(pos / chars_per_page) if estimate_pages else -1 + chunk_id = hashlib.sha1( + f"{source_stem}:{order}".encode() + ).hexdigest()[:16] + chunks.append( + { + "chunk_id": chunk_id, + "text": snippet, + "page_index": page_idx, + "order": order, + "bbox": None, + "source_stem": source_stem, + } + ) + order += 1 + pos += step + + return chunks diff --git a/fastapi_app/workflow_adapters/wa_graphrag_kb.py b/fastapi_app/workflow_adapters/wa_graphrag_kb.py new file mode 100644 index 0000000..846b71f --- /dev/null +++ b/fastapi_app/workflow_adapters/wa_graphrag_kb.py @@ -0,0 +1,195 @@ +"""GraphRAG KB 管线的工作流适配层。 + +【职责】 + 在 FastAPI 路由(Pydantic 请求体)与 ``wf_graphrag_kb``(``GraphRAGKBState`` 数据类)之间做转换, + 统一调用 ``run_workflow("graphrag_kb", state)``,再从 ``agent_results`` / ``temp_data.errors`` 取结果。 + +【数据流】 + ``run_index`` / ``run_query`` / ``run_merge`` → 组装 ``GraphRAGKBRequest.action`` → + ``GraphRAGKBState`` → 
LangGraph 执行 → 成功则返回对应 ``agent_results`` 字典;失败则 ``RuntimeError``(携带首条错误信息)。 + +【约定】 + 与 ``wa_paper2ppt.py`` 类似:``_workflow_outcome`` 兼容 LangGraph 返回 dataclass 或 dict。 +""" +from __future__ import annotations + +from typing import Any, Dict, List, Optional, Tuple + +from workflow_engine.logger import get_logger +from workflow_engine.workflow import run_workflow +from workflow_engine.workflow.wf_graphrag_kb import GraphRAGKBRequest, GraphRAGKBState +from workflow_engine.workflow.wf_graphrag_chat import GraphRAGChatRequest, GraphRAGChatState + +log = get_logger(__name__) + + +def _workflow_outcome(state: Any) -> Tuple[Dict[str, Any], Optional[list]]: + """统一解析工作流终态:得到 ``(agent_results, errors)``,兼容 dict 与 dataclass 两种返回形式。""" + if isinstance(state, dict): + td = state.get("temp_data") + td = td if isinstance(td, dict) else {} + errors = td.get("errors") + ar = state.get("agent_results") + ar = ar if isinstance(ar, dict) else {} + return ar, errors + td = getattr(state, "temp_data", None) + td = td if isinstance(td, dict) else {} + errors = td.get("errors") + ar = getattr(state, "agent_results", None) + ar = ar if isinstance(ar, dict) else {} + return ar, errors + + +# --------------------------------------------------------------------------- +# Public adapter functions (called by routers) +# --------------------------------------------------------------------------- + +async def run_index( + *, + notebook_id: str, + notebook_title: str, + email: str, + api_url: str, + api_key: str, + model: str, + source_stems: Optional[List[str]] = None, + workspace_dir: str = "", + force_reindex: bool = False, + parse_pdfs: bool = True, + skip_kggen: bool = True, +) -> Dict[str, Any]: + """Run indexing workflow; returns ``agent_results["index"]`` dict on success.""" + req = GraphRAGKBRequest( + action="index", + notebook_id=notebook_id, + notebook_title=notebook_title, + email=email, + chat_api_url=api_url, + api_key=api_key, + model=model, + source_stems=source_stems or [], + 
workspace_dir=workspace_dir, + force_reindex=force_reindex, + parse_pdfs=parse_pdfs, + skip_kggen=skip_kggen, + ) + state = GraphRAGKBState(request=req) + state = await run_workflow("graphrag_kb", state) + + agent_results, errors = _workflow_outcome(state) + if errors: + raise RuntimeError(f"Indexing failed: {errors[0]}") + + return agent_results.get("index", {}) + + +async def run_query( + *, + notebook_id: str, + notebook_title: str, + email: str, + api_url: str, + api_key: str, + model: str, + question: str, + search_method: str = "local", + workspace_dir: str = "", + wikidata_enrich: Optional[bool] = None, +) -> Dict[str, Any]: + """Run query workflow; returns ``agent_results["query"]`` dict on success.""" + req = GraphRAGKBRequest( + action="query", + notebook_id=notebook_id, + notebook_title=notebook_title, + email=email, + chat_api_url=api_url, + api_key=api_key, + model=model, + question=question, + search_method=search_method, + workspace_dir=workspace_dir, + wikidata_enrich=wikidata_enrich, + ) + state = GraphRAGKBState(request=req) + state = await run_workflow("graphrag_kb", state) + + agent_results, errors = _workflow_outcome(state) + if errors: + raise RuntimeError(f"Query failed: {errors[0]}") + + return agent_results.get("query", {}) + + +async def run_merge( + *, + notebook_id: str, + notebook_title: str, + email: str, + api_url: str, + api_key: str, + model: str, + workspace_dir_a: str, + workspace_dir_b: str, + dedupe: bool = False, +) -> Dict[str, Any]: + """Merge two GraphRAG workspaces and re-index; returns ``agent_results["merge"]``.""" + req = GraphRAGKBRequest( + action="merge", + notebook_id=notebook_id, + notebook_title=notebook_title, + email=email, + chat_api_url=api_url, + api_key=api_key, + model=model, + workspace_dir=workspace_dir_a, + workspace_dir_b=workspace_dir_b, + dedupe=dedupe, + ) + state = GraphRAGKBState(request=req) + state = await run_workflow("graphrag_kb", state) + + agent_results, errors = _workflow_outcome(state) + if 
errors: + raise RuntimeError(f"Merge failed: {errors[0]}") + + return agent_results.get("merge", {}) + + +async def run_chat( + *, + notebook_id: str, + notebook_title: str = "", + email: str = "", + api_url: str, + api_key: str, + model: str, + query: str, + history: List[Dict[str, str]], + search_method: str = "auto", + workspace_dir: str = "", + wikidata_enrich: Optional[bool] = None, + defer_postprocess: bool = False, +) -> Dict[str, Any]: + """Run GraphRAG conversational chat; returns ``agent_results["chat"]`` dict.""" + req = GraphRAGChatRequest( + notebook_id=notebook_id, + notebook_title=notebook_title, + email=email, + chat_api_url=api_url, + api_key=api_key, + model=model, + query=query, + history=history, + search_method=search_method, + workspace_dir=workspace_dir, + wikidata_enrich=wikidata_enrich, + defer_postprocess=defer_postprocess, + ) + state = GraphRAGChatState(request=req) + state = await run_workflow("graphrag_chat", state) + + agent_results, errors = _workflow_outcome(state) + if errors: + raise RuntimeError(f"GraphRAG chat failed: {errors[0]}") + + return agent_results.get("chat", {}) diff --git a/frontend_en/package-lock.json b/frontend_en/package-lock.json index 873bc08..df09701 100644 --- a/frontend_en/package-lock.json +++ b/frontend_en/package-lock.json @@ -19,6 +19,7 @@ "react-dom": "^18.2.0", "react-markdown": "^9.1.0", "react-pdf": "^10.3.0", + "rehype-raw": "^7.0.0", "tailwind-merge": "^2.0.0", "zustand": "^4.4.7" }, @@ -2632,6 +2633,17 @@ "integrity": "sha512-f/ZeWvW/BCXbhGEf1Ujp29EASo/lk1FDnETgNKwJrsVvGZhUWCZyg3xLJjAsxfOmt8KjswHmI5EwCQcPMpOYhQ==", "license": "EPL-2.0" }, + "node_modules/entities": { + "version": "6.0.1", + "resolved": "https://registry.npmjs.org/entities/-/entities-6.0.1.tgz", + "integrity": "sha512-aN97NXWF6AWBTahfVOIrB/NShkzi5H7F9r1s9mD3cDj4Ko5f2qhhVoYMibXF7GlLveb/D2ioWay8lxI97Ven3g==", + "engines": { + "node": ">=0.12" + }, + "funding": { + "url": "https://github.com/fb55/entities?sponsor=1" + } + }, 
"node_modules/esbuild": { "version": "0.21.5", "resolved": "https://registry.npmjs.org/esbuild/-/esbuild-0.21.5.tgz", @@ -2849,6 +2861,71 @@ "node": ">= 0.4" } }, + "node_modules/hast-util-from-parse5": { + "version": "8.0.3", + "resolved": "https://registry.npmjs.org/hast-util-from-parse5/-/hast-util-from-parse5-8.0.3.tgz", + "integrity": "sha512-3kxEVkEKt0zvcZ3hCRYI8rqrgwtlIOFMWkbclACvjlDw8Li9S2hk/d51OI0nr/gIpdMHNepwgOKqZ/sy0Clpyg==", + "dependencies": { + "@types/hast": "^3.0.0", + "@types/unist": "^3.0.0", + "devlop": "^1.0.0", + "hastscript": "^9.0.0", + "property-information": "^7.0.0", + "vfile": "^6.0.0", + "vfile-location": "^5.0.0", + "web-namespaces": "^2.0.0" + }, + "funding": { + "type": "opencollective", + "url": "https://opencollective.com/unified" + } + }, + "node_modules/hast-util-from-parse5/node_modules/@types/unist": { + "version": "3.0.3", + "resolved": "https://registry.npmjs.org/@types/unist/-/unist-3.0.3.tgz", + "integrity": "sha512-ko/gIFJRv177XgZsZcBwnqJN5x/Gien8qNOn0D5bQU/zAzVf9Zt3BlcUiLqhV9y4ARk0GbT3tnUiPNgnTXzc/Q==" + }, + "node_modules/hast-util-parse-selector": { + "version": "4.0.0", + "resolved": "https://registry.npmjs.org/hast-util-parse-selector/-/hast-util-parse-selector-4.0.0.tgz", + "integrity": "sha512-wkQCkSYoOGCRKERFWcxMVMOcYE2K1AaNLU8DXS9arxnLOUEWbOXKXiJUNzEpqZ3JOKpnha3jkFrumEjVliDe7A==", + "dependencies": { + "@types/hast": "^3.0.0" + }, + "funding": { + "type": "opencollective", + "url": "https://opencollective.com/unified" + } + }, + "node_modules/hast-util-raw": { + "version": "9.1.0", + "resolved": "https://registry.npmjs.org/hast-util-raw/-/hast-util-raw-9.1.0.tgz", + "integrity": "sha512-Y8/SBAHkZGoNkpzqqfCldijcuUKh7/su31kEBp67cFY09Wy0mTRgtsLYsiIxMJxlu0f6AA5SUTbDR8K0rxnbUw==", + "dependencies": { + "@types/hast": "^3.0.0", + "@types/unist": "^3.0.0", + "@ungap/structured-clone": "^1.0.0", + "hast-util-from-parse5": "^8.0.0", + "hast-util-to-parse5": "^8.0.0", + "html-void-elements": "^3.0.0", + "mdast-util-to-hast": 
"^13.0.0", + "parse5": "^7.0.0", + "unist-util-position": "^5.0.0", + "unist-util-visit": "^5.0.0", + "vfile": "^6.0.0", + "web-namespaces": "^2.0.0", + "zwitch": "^2.0.0" + }, + "funding": { + "type": "opencollective", + "url": "https://opencollective.com/unified" + } + }, + "node_modules/hast-util-raw/node_modules/@types/unist": { + "version": "3.0.3", + "resolved": "https://registry.npmjs.org/@types/unist/-/unist-3.0.3.tgz", + "integrity": "sha512-ko/gIFJRv177XgZsZcBwnqJN5x/Gien8qNOn0D5bQU/zAzVf9Zt3BlcUiLqhV9y4ARk0GbT3tnUiPNgnTXzc/Q==" + }, "node_modules/hast-util-to-jsx-runtime": { "version": "2.3.6", "resolved": "https://registry.npmjs.org/hast-util-to-jsx-runtime/-/hast-util-to-jsx-runtime-2.3.6.tgz", @@ -2882,6 +2959,24 @@ "integrity": "sha512-ko/gIFJRv177XgZsZcBwnqJN5x/Gien8qNOn0D5bQU/zAzVf9Zt3BlcUiLqhV9y4ARk0GbT3tnUiPNgnTXzc/Q==", "license": "MIT" }, + "node_modules/hast-util-to-parse5": { + "version": "8.0.1", + "resolved": "https://registry.npmjs.org/hast-util-to-parse5/-/hast-util-to-parse5-8.0.1.tgz", + "integrity": "sha512-MlWT6Pjt4CG9lFCjiz4BH7l9wmrMkfkJYCxFwKQic8+RTZgWPuWxwAfjJElsXkex7DJjfSJsQIt931ilUgmwdA==", + "dependencies": { + "@types/hast": "^3.0.0", + "comma-separated-tokens": "^2.0.0", + "devlop": "^1.0.0", + "property-information": "^7.0.0", + "space-separated-tokens": "^2.0.0", + "web-namespaces": "^2.0.0", + "zwitch": "^2.0.0" + }, + "funding": { + "type": "opencollective", + "url": "https://opencollective.com/unified" + } + }, "node_modules/hast-util-whitespace": { "version": "3.0.0", "resolved": "https://registry.npmjs.org/hast-util-whitespace/-/hast-util-whitespace-3.0.0.tgz", @@ -2895,6 +2990,22 @@ "url": "https://opencollective.com/unified" } }, + "node_modules/hastscript": { + "version": "9.0.1", + "resolved": "https://registry.npmjs.org/hastscript/-/hastscript-9.0.1.tgz", + "integrity": "sha512-g7df9rMFX/SPi34tyGCyUBREQoKkapwdY/T04Qn9TDWfHhAYt4/I0gMVirzK5wEzeUqIjEB+LXC/ypb7Aqno5w==", + "dependencies": { + "@types/hast": "^3.0.0", + 
"comma-separated-tokens": "^2.0.0", + "hast-util-parse-selector": "^4.0.0", + "property-information": "^7.0.0", + "space-separated-tokens": "^2.0.0" + }, + "funding": { + "type": "opencollective", + "url": "https://opencollective.com/unified" + } + }, "node_modules/html-url-attributes": { "version": "3.0.1", "resolved": "https://registry.npmjs.org/html-url-attributes/-/html-url-attributes-3.0.1.tgz", @@ -2905,6 +3016,15 @@ "url": "https://opencollective.com/unified" } }, + "node_modules/html-void-elements": { + "version": "3.0.0", + "resolved": "https://registry.npmjs.org/html-void-elements/-/html-void-elements-3.0.0.tgz", + "integrity": "sha512-bEqo66MRXsUGxWHV5IP0PUiAWwoEjba4VCzg0LjFJBpchPaTfyfCKTG6bc5F8ucKec3q5y6qOdGyYTSBEvhCrg==", + "funding": { + "type": "github", + "url": "https://github.com/sponsors/wooorm" + } + }, "node_modules/iceberg-js": { "version": "0.8.1", "resolved": "https://registry.npmjs.org/iceberg-js/-/iceberg-js-0.8.1.tgz", @@ -5773,6 +5893,17 @@ "url": "https://github.com/sponsors/wooorm" } }, + "node_modules/parse5": { + "version": "7.3.0", + "resolved": "https://registry.npmjs.org/parse5/-/parse5-7.3.0.tgz", + "integrity": "sha512-IInvU7fabl34qmi9gY8XOVxhYyMyuH2xUNpb2q8/Y+7552KlejkRvqvD19nMoUW/uQGGbqNpA6Tufu5FL5BZgw==", + "dependencies": { + "entities": "^6.0.0" + }, + "funding": { + "url": "https://github.com/inikulin/parse5?sponsor=1" + } + }, "node_modules/path-parse": { "version": "1.0.7", "resolved": "https://registry.npmjs.org/path-parse/-/path-parse-1.0.7.tgz", @@ -6149,6 +6280,20 @@ "node": ">=8.10.0" } }, + "node_modules/rehype-raw": { + "version": "7.0.0", + "resolved": "https://registry.npmjs.org/rehype-raw/-/rehype-raw-7.0.0.tgz", + "integrity": "sha512-/aE8hCfKlQeA8LmyeyQvQF3eBiLRGNlfBJEvWH7ivp9sBqs7TNqBL5X3v157rM4IFETqDnIOO+z5M/biZbo9Ww==", + "dependencies": { + "@types/hast": "^3.0.0", + "hast-util-raw": "^9.0.0", + "vfile": "^6.0.0" + }, + "funding": { + "type": "opencollective", + "url": "https://opencollective.com/unified" 
+ } + }, "node_modules/remark-parse": { "version": "11.0.0", "resolved": "https://registry.npmjs.org/remark-parse/-/remark-parse-11.0.0.tgz", @@ -7361,6 +7506,24 @@ "url": "https://opencollective.com/unified" } }, + "node_modules/vfile-location": { + "version": "5.0.3", + "resolved": "https://registry.npmjs.org/vfile-location/-/vfile-location-5.0.3.tgz", + "integrity": "sha512-5yXvWDEgqeiYiBe1lbxYF7UMAIm/IcopxMHrMQDq3nvKcjPKIhZklUKL+AE7J7uApI4kwe2snsK+eI6UTj9EHg==", + "dependencies": { + "@types/unist": "^3.0.0", + "vfile": "^6.0.0" + }, + "funding": { + "type": "opencollective", + "url": "https://opencollective.com/unified" + } + }, + "node_modules/vfile-location/node_modules/@types/unist": { + "version": "3.0.3", + "resolved": "https://registry.npmjs.org/@types/unist/-/unist-3.0.3.tgz", + "integrity": "sha512-ko/gIFJRv177XgZsZcBwnqJN5x/Gien8qNOn0D5bQU/zAzVf9Zt3BlcUiLqhV9y4ARk0GbT3tnUiPNgnTXzc/Q==" + }, "node_modules/vfile-message": { "version": "4.0.3", "resolved": "https://registry.npmjs.org/vfile-message/-/vfile-message-4.0.3.tgz", @@ -7469,6 +7632,15 @@ "loose-envify": "^1.0.0" } }, + "node_modules/web-namespaces": { + "version": "2.0.1", + "resolved": "https://registry.npmjs.org/web-namespaces/-/web-namespaces-2.0.1.tgz", + "integrity": "sha512-bKr1DkiNa2krS7qxNtdrtHAmzuYGFQLiQ13TsorsdT6ULTkPLKuu5+GsFpDlg6JFjUTwX2DyhMPG2be8uPrqsQ==", + "funding": { + "type": "github", + "url": "https://github.com/sponsors/wooorm" + } + }, "node_modules/web-worker": { "version": "1.5.0", "resolved": "https://registry.npmjs.org/web-worker/-/web-worker-1.5.0.tgz", diff --git a/frontend_en/package.json b/frontend_en/package.json index b6d9db4..d2b2fac 100644 --- a/frontend_en/package.json +++ b/frontend_en/package.json @@ -20,6 +20,7 @@ "react-dom": "^18.2.0", "react-markdown": "^9.1.0", "react-pdf": "^10.3.0", + "rehype-raw": "^7.0.0", "tailwind-merge": "^2.0.0", "zustand": "^4.4.7" }, diff --git a/frontend_en/src/components/graphrag-kb/GraphRAGKbPanel.tsx 
b/frontend_en/src/components/graphrag-kb/GraphRAGKbPanel.tsx new file mode 100644 index 0000000..9de171a --- /dev/null +++ b/frontend_en/src/components/graphrag-kb/GraphRAGKbPanel.tsx @@ -0,0 +1,2 @@ +export { GraphRAGKbPanel } from './GraphRAGKbPanelChatAligned'; +export type { GraphRAGKbPanelProps } from './GraphRAGKbPanelChatAligned'; diff --git a/frontend_en/src/components/graphrag-kb/GraphRAGKbPanelChatAligned.tsx b/frontend_en/src/components/graphrag-kb/GraphRAGKbPanelChatAligned.tsx new file mode 100644 index 0000000..a0ef997 --- /dev/null +++ b/frontend_en/src/components/graphrag-kb/GraphRAGKbPanelChatAligned.tsx @@ -0,0 +1,820 @@ +/** + * English GraphRAG KB panel aligned with frontend_zh flow: + * - index + * - chat with deferred postprocess + * - split postprocess: subgraph/judge and Wikidata + * - merge + */ +import React, { useCallback, useEffect, useMemo, useRef, useState } from 'react'; +import ReactMarkdown from 'react-markdown'; +import { Loader2, Copy, ChevronDown, ChevronRight, Network, Send } from 'lucide-react'; +import { getApiSettings } from '../../services/apiSettingsService'; +import { + indexGraphragKb, + mergeGraphragKb, + chatGraphragKb, + chatGraphragKbPostprocess, + defaultGraphragModel, + refineGraphragContextRefine, +} from '../../services/graphragKbService'; +import type { ChatMessage, ChatResponse, GraphragWorkspacePersist } from '../../types/graphragKb'; +import { MermaidPreview } from '../knowledge-base/tools/MermaidPreview'; +import { injectMultipleGraphragHighlightsInMarkdown } from '../../utils/graphragMarkdownHighlight'; +import { + extractChunkIdFromText, + stripGraphragContextNoise, +} from '../../utils/stripGraphragContextNoise'; + +function getWorkspaceStorageKey(userId: string, notebookId: string) { + return `graphrag_workspace_${userId}_${notebookId}`; +} + +function sanitizeMermaidLabel(s: string, max = 48): string { + return s.replace(/["[\]#]/g, ' ').slice(0, max).trim() || '?'; +} + +export function 
reasoningSubgraphToMermaid(edges: Array>, maxEdges = 36): string | null { + if (!edges.length) return null; + const slice = edges.slice(0, maxEdges); + const idFor = (() => { + const m = new Map(); + let n = 0; + return (raw: string) => { + const k = raw || `_${n}`; + if (!m.has(k)) m.set(k, `N${n++}`); + return m.get(k)!; + }; + })(); + const lines: string[] = [ + '%%{init: {"flowchart": {"htmlLabels": true, "wrappingWidth": 250}} }%%', + 'graph TD', + ]; + for (let i = 0; i < slice.length; i++) { + const e = slice[i]; + const src = String(e.source ?? e.src ?? e.from ?? e.head ?? `s${i}`); + const tgt = String(e.target ?? e.tgt ?? e.to ?? e.tail ?? `t${i}`); + const rel = String(e.relation ?? e.relationship ?? e.label ?? e.predicate ?? ''); + const sid = idFor(src); + const tid = idFor(tgt); + const sl = sanitizeMermaidLabel(src, 40); + const tl = sanitizeMermaidLabel(tgt, 40); + const rl = sanitizeMermaidLabel(rel, 60); + lines.push(` ${sid}["${sl}"] -->|"${rl}"| ${tid}["${tl}"]`); + } + return lines.join('\n'); +} + +interface ContextChunk { + chunkId: string; + text: string; + nTokens?: number; + sourceStem?: string; +} + +function extractTopChunk( + contextData: Record, + highlightHints: Array>, +): ContextChunk | null { + const textUnits = + (contextData['sources'] as Array> | undefined) ?? + (contextData['text_units'] as Array> | undefined); + if (!textUnits || !Array.isArray(textUnits) || textUnits.length === 0) return null; + + const first = textUnits[0]; + const rawText = String(first['text'] ?? first['content'] ?? ''); + if (!rawText.trim()) return null; + + const docIds = first['document_ids']; + const sourceStemFromUnit = Array.isArray(docIds) && docIds.length > 0 ? String(docIds[0]) : ''; + const sourceStemFromHint = highlightHints.length > 0 ? String(highlightHints[0]['source_stem'] ?? '') : ''; + + const embedded = extractChunkIdFromText(rawText); + const idField = String(first['id'] ?? first['chunk_id'] ?? 
'').trim(); + const chunkId = embedded || idField; + + return { + chunkId, + text: rawText, + nTokens: first['n_tokens'] != null ? Number(first['n_tokens']) : undefined, + sourceStem: sourceStemFromUnit || sourceStemFromHint || undefined, + }; +} + +const STR = { + zh: { + headerTitle: 'GraphRAG 知识库', + headerSub: '分块(MinerU)+ GraphRAG 建索引与检索', + apiWarn: '请先在设置中配置 API URL 与 API Key', + noNotebook: '缺少笔记本 ID', + indexBtn: '构建索引', + indexing: '索引构建中…', + indexOk: '索引构建完成', + forceReindex: '强制重建', + parsePdfs: '解析 PDF(MinerU)', + summary: '上次索引摘要', + chunks: '分块数', + workspace: '工作区目录', + copy: '复制', + copied: '已复制', + modelLabel: 'LLM 模型名', + copyFailed: '复制失败', + mergeTitle: '合并工作区', + mergeA: 'workspace_dir A', + mergeB: 'workspace_dir B', + dedupe: '去重合并', + mergeBtn: '合并并重建索引', + merging: '合并中…', + mergeOk: '合并完成', + chatPlaceholder: '向知识库提问…', + send: '发送', + searchMethodLabel: '检索策略', + wikidataEnrich: 'Wikidata 参考(附在答案后)', + clearChat: '清空对话', + emptyReady: '索引已就绪,开始提问吧', + emptyNoIndex: '请先完成索引构建', + contextRefTitle: '上下文参考', + subgraph: '推理子图', + subgraphRaw: '推理全图(未裁剪版)', + noSubgraph: '无子图数据', + subgraphCot: '最小子图推理(CoT / 跳数)', + mermaidTitle: '子图(Mermaid)', + judge: 'Judge 分数', + postprocessSubgraphPending: '正在裁剪子图…', + postprocessWikidataPending: '正在补充 Wikidata 参考…', + }, + en: { + headerTitle: 'GraphRAG Knowledge Base', + headerSub: 'Chunking (MinerU) + GraphRAG index & query', + apiWarn: 'Configure API URL and API Key in Settings first', + noNotebook: 'Notebook ID is missing', + indexBtn: 'Build index', + indexing: 'Indexing…', + indexOk: 'Index completed', + forceReindex: 'Force reindex', + parsePdfs: 'Parse PDFs (MinerU)', + summary: 'Last index summary', + chunks: 'Chunks', + workspace: 'Workspace directory', + copy: 'Copy', + copied: 'Copied', + modelLabel: 'LLM model', + copyFailed: 'Copy failed', + mergeTitle: 'Merge workspaces', + mergeA: 'workspace_dir A', + mergeB: 'workspace_dir B', + dedupe: 'Deduplicate when merging', + mergeBtn: 'Merge 
and re-index', + merging: 'Merging…', + mergeOk: 'Merge completed', + chatPlaceholder: 'Ask the knowledge base…', + send: 'Send', + searchMethodLabel: 'Search method', + wikidataEnrich: 'Wikidata supplement (after answer)', + clearChat: 'Clear chat', + emptyReady: 'Index ready. Start asking questions.', + emptyNoIndex: 'Build the index first.', + contextRefTitle: 'Context Reference', + subgraph: 'Reasoning subgraph', + subgraphRaw: 'Full reasoning graph (unpruned)', + noSubgraph: 'No subgraph', + subgraphCot: 'Minimal subgraph reasoning (CoT / hops)', + mermaidTitle: 'Subgraph (Mermaid)', + judge: 'Judge score', + postprocessSubgraphPending: 'Pruning subgraph…', + postprocessWikidataPending: 'Enriching Wikidata supplement…', + }, +} as const; + +function ContextRefHtml({ + topChunk, + subgraph, + userId, + colorIdx, + locale, +}: { + topChunk: ContextChunk; + subgraph: Array>; + userId: string | null; + colorIdx: number; + locale: 'zh' | 'en'; +}) { + const basePlain = useMemo(() => stripGraphragContextNoise(topChunk.text), [topChunk.text]); + const [html, setHtml] = useState(basePlain); + const [loading, setLoading] = useState(false); + + useEffect(() => { + setHtml(basePlain); + if (!subgraph?.length) { + setLoading(false); + return; + } + let cancelled = false; + setLoading(true); + (async () => { + try { + const st = getApiSettings(userId); + const out = await refineGraphragContextRefine( + topChunk.text, + subgraph, + st?.apiKey?.trim() || '', + st?.apiUrl?.trim() || '', + defaultGraphragModel(), + ); + if (cancelled) return; + const body = (out.cleaned_text || '').trim() || basePlain; + const snips = (out.supporting_snippets || []).map((s) => s.trim()).filter(Boolean); + if (snips.length) { + setHtml(injectMultipleGraphragHighlightsInMarkdown(body, snips, { baseColorIndex: colorIdx })); + } else { + setHtml(body); + } + } catch { + if (!cancelled) setHtml(basePlain); + } finally { + if (!cancelled) setLoading(false); + } + })(); + return () => { + cancelled = 
true; + }; + }, [topChunk.chunkId, subgraph, basePlain, userId, colorIdx, topChunk.text]); + + return ( +
+ {loading ? ( +
+ {locale === 'zh' ? '正在清洗正文并选取支撑句…' : 'Cleaning passage and selecting evidence…'} +
+ ) : null} +
+
+ ); +} + +interface AssistantMetaProps { + meta: NonNullable; + locale: 'zh' | 'en'; + L: typeof STR['zh']; + userId: string | null; + subgraphPending: boolean; +} + +function AssistantMeta({ meta, locale, L, userId, subgraphPending }: AssistantMetaProps) { + const topChunk = useMemo(() => { + if (!meta.context_data) return null; + return extractTopChunk( + meta.context_data as Record, + (meta.highlight_hints ?? []) as Array>, + ); + }, [meta.context_data, meta.highlight_hints]); + + const mermaidCode = useMemo(() => { + if (!meta.reasoning_subgraph?.length) return null; + return reasoningSubgraphToMermaid(meta.reasoning_subgraph as Array>); + }, [meta.reasoning_subgraph]); + + const subgraphRows = (meta.reasoning_subgraph ?? []) as Array>; + const judgePct = Math.round(Math.max(0, Math.min(1, meta.judge_score ?? 0)) * 100); + const [subgraphOpen, setSubgraphOpen] = useState(false); + + return ( +
+ {meta.intent?.use_graphrag === false && ( +
+ {locale === 'zh' ? '直接回答(无检索)' : 'Direct answer (no retrieval)'} +
+ )} + {meta.intent?.use_graphrag === true && meta.rewritten_query && ( +
+ {locale === 'zh' ? '检索问题:' : 'Retrieval query: '} + {meta.rewritten_query} +
+ )} + + {topChunk && ( +
+
{L.contextRefTitle}
+ {topChunk.sourceStem && ( +
+ {topChunk.sourceStem} + {topChunk.nTokens != null && ( + {topChunk.nTokens} tokens + )} +
+ )} + +
+ )} + + {mermaidCode && ( +
+ + {subgraphOpen && ( + <> +
+ +
+ {meta.reasoning_subgraph_cot ? ( +
+ {L.subgraphCot} +
+ {meta.reasoning_subgraph_cot} +
+
+ ) : null} + + )} +
+ )} + + {judgePct > 0 && ( +
+
{L.judge}: {judgePct}%
+ {meta.judge_rationale ? ( +
{meta.judge_rationale}
+ ) : null} +
+ )} +
+ ); +} + +export type GraphragOpenSourcePayload = { + sourceStem: string; + pageIndex: number; + chunkId?: string; + workspaceDir?: string; +}; + +export interface GraphRAGKbPanelProps { + notebook: { id?: string; title?: string; name?: string }; + userId: string | null; + email: string; + locale?: 'zh' | 'en'; + showToast: (message: string, type?: 'success' | 'error' | 'warning') => void; + onOpenGraphragSource?: (payload: GraphragOpenSourcePayload) => void | Promise; +} + +export function GraphRAGKbPanel({ + notebook, + userId, + email, + locale = 'en', + showToast, +}: GraphRAGKbPanelProps) { + const L = STR[locale]; + const notebookId = notebook?.id || ''; + const notebookTitle = notebook?.title || notebook?.name || ''; + + const [persist, setPersist] = useState(null); + const [forceReindex, setForceReindex] = useState(false); + const [parsePdfs, setParsePdfs] = useState(true); + const [indexLoading, setIndexLoading] = useState(false); + const [modelName, setModelName] = useState(defaultGraphragModel()); + + const [messages, setMessages] = useState([]); + const [inputValue, setInputValue] = useState(''); + const [chatLoading, setChatLoading] = useState(false); + const [searchMethod, setSearchMethod] = useState<'auto' | 'local' | 'global'>('auto'); + const [wikidataEnrich, setWikidataEnrich] = useState(true); + const messagesEndRef = useRef(null); + + useEffect(() => { + try { + const v = localStorage.getItem('graphrag_wikidata_enrich'); + if (v !== null) setWikidataEnrich(v === '1' || v === 'true'); + } catch { + // keep default + } + }, []); + + const [mergeA, setMergeA] = useState(''); + const [mergeB, setMergeB] = useState(''); + const [mergeDedupe, setMergeDedupe] = useState(false); + const [mergeLoading, setMergeLoading] = useState(false); + + const storageKey = useMemo(() => { + const uid = userId || 'global'; + if (!notebookId) return null; + return getWorkspaceStorageKey(uid, notebookId); + }, [userId, notebookId]); + + const loadPersist = 
useCallback(() => { + if (!storageKey) { setPersist(null); return; } + try { + const raw = localStorage.getItem(storageKey); + if (!raw) { setPersist(null); return; } + const p = JSON.parse(raw) as GraphragWorkspacePersist; + if (p?.workspace_dir) setPersist(p); else setPersist(null); + } catch { setPersist(null); } + }, [storageKey]); + + useEffect(() => { loadPersist(); }, [loadPersist]); + useEffect(() => { if (persist?.workspace_dir) setMergeA((a) => (a ? a : persist.workspace_dir)); }, [persist?.workspace_dir]); + + const llmBody = useCallback(() => { + const settings = getApiSettings(userId); + const api_url = settings?.apiUrl?.trim() || ''; + const api_key = settings?.apiKey?.trim() || ''; + const model = modelName.trim() || defaultGraphragModel(); + return { api_url, api_key, model }; + }, [userId, modelName]); + + const copyText = async (text: string, okMsg?: string) => { + try { await navigator.clipboard.writeText(text); showToast(okMsg || L.copied, 'success'); } + catch { showToast(L.copyFailed, 'error'); } + }; + + useEffect(() => { + messagesEndRef.current?.scrollIntoView({ behavior: 'smooth' }); + }, [messages, chatLoading]); + + const handleIndex = async () => { + if (!notebookId) { showToast(L.noNotebook, 'warning'); return; } + const { api_url, api_key, model } = llmBody(); + if (!api_url || !api_key) { showToast(L.apiWarn, 'warning'); return; } + setIndexLoading(true); + try { + const res = await indexGraphragKb({ + notebook_id: notebookId, notebook_title: notebookTitle, email: email || '', + api_url, api_key, model, + source_stems: null, workspace_dir: persist?.workspace_dir || '', + force_reindex: forceReindex, parse_pdfs: parsePdfs, skip_kggen: true, + }); + const next: GraphragWorkspacePersist = { workspace_dir: res.workspace_dir, updatedAt: Date.now(), num_chunks: res.num_chunks }; + if (storageKey) localStorage.setItem(storageKey, JSON.stringify(next)); + setPersist(next); + showToast(L.indexOk, 'success'); + } catch (e: unknown) { + 
// NOTE(review): this span is a collapsed unified-diff hunk — the inline " + " separators are
// diff '+' markers from the original patch, not code; the physical line structure of the TSX
// file was lost in extraction. Code below is kept byte-identical; only comments are added.
// First segment: tail of the preceding index-build handler (error toast + finally clearing
// setIndexLoading), then handleChat: sends the trimmed input to the GraphRAG KB chat endpoint
// (chatGraphragKb with defer_postprocess: true), appends a user message and an assistant
// message carrying the response meta, and — when resp.postprocess_pending — fires a deferred
// chatGraphragKbPostprocess call in 'subgraph' mode whose .then/.catch patch the assistant
// message in place (clearing postprocessSubgraphPending; overall postprocessPending stays true
// only while the wikidata half is still pending).
// NOTE(review): "as Array>" is a truncated generic — the type parameter was stripped with the
// JSX tags during extraction (presumably Array<Record<string, unknown>>); confirm against the
// original file before reuse.
showToast(e instanceof Error ? e.message : String(e), 'error'); + } finally { setIndexLoading(false); } + }; + + const handleChat = async () => { + const userInput = inputValue.trim(); + if (!userInput || chatLoading) return; + if (!persist?.workspace_dir) { + showToast(locale === 'zh' ? '请先完成索引构建' : 'Build the index first', 'warning'); + return; + } + const { api_url, api_key, model } = llmBody(); + if (!api_url || !api_key) { showToast(L.apiWarn, 'warning'); return; } + + const history = messages.map((m) => ({ + role: m.role, + content: m.content, + ...(m.meta ? { meta: { ...m.meta } } : {}), + })); + const userMsg: ChatMessage = { id: `u_${Date.now()}`, role: 'user', content: userInput }; + setMessages((prev) => [...prev, userMsg]); + setInputValue(''); + setChatLoading(true); + + try { + const resp: ChatResponse = await chatGraphragKb({ + notebook_id: notebookId, notebook_title: notebookTitle, email: email || '', + query: userInput, history, search_method: searchMethod, + workspace_dir: persist.workspace_dir, api_url, api_key, model, + wikidata_enrich: wikidataEnrich, + defer_postprocess: true, + }); + const assistantId = `a_${Date.now()}`; + const assistantMsg: ChatMessage = { + id: assistantId, role: 'assistant', content: resp.answer, + meta: { + intent: resp.intent, + rewritten_query: resp.rewritten_query, + graphrag_raw_answer: resp.graphrag_raw_answer || '', + context_data: resp.context_data, + reasoning_subgraph: resp.reasoning_subgraph, + reasoning_subgraph_cot: resp.reasoning_subgraph_cot, + judge_score: resp.judge_score, + judge_rationale: resp.judge_rationale, + source_chunks: resp.source_chunks, + highlight_hints: resp.highlight_hints, + }, + postprocessPending: !!resp.postprocess_pending, + postprocessSubgraphPending: !!resp.postprocess_pending, + postprocessWikidataPending: !!resp.postprocess_pending && wikidataEnrich, + }; + setMessages((prev) => [...prev, assistantMsg]); + + if (resp.postprocess_pending) { + chatGraphragKbPostprocess({ + query: 
// Continuation of handleChat: the subgraph postprocess .then merges the pruned
// reasoning_subgraph / CoT / judge fields into the assistant message's meta; the .catch
// records String(e) as judge_rationale instead of failing the chat. A second, independent
// deferred call in 'wikidata' mode runs only when wikidataEnrich is on; its .then appends
// the returned appendix to the message content (next line), its .catch merely clears the
// pending flag. Both updaters match the message by assistantId AND role before touching it.
resp.rewritten_query || userInput, + answer: resp.graphrag_raw_answer || '', + reasoning_subgraph: (resp.reasoning_subgraph || []) as Array>, + api_url, + api_key, + model, + wikidata_enrich: wikidataEnrich, + mode: 'subgraph', + }) + .then((pp) => { + setMessages((prev) => prev.map((m) => { + if (m.id !== assistantId || m.role !== 'assistant') return m; + return { + ...m, + postprocessSubgraphPending: false, + postprocessPending: !!m.postprocessWikidataPending, + meta: { + ...(m.meta || {}), + reasoning_subgraph: pp.reasoning_subgraph, + reasoning_subgraph_cot: pp.reasoning_subgraph_cot, + judge_score: pp.judge_score, + judge_rationale: pp.judge_rationale, + }, + }; + })); + }) + .catch((e) => { + setMessages((prev) => prev.map((m) => { + if (m.id !== assistantId || m.role !== 'assistant') return m; + return { + ...m, + postprocessSubgraphPending: false, + postprocessPending: !!m.postprocessWikidataPending, + meta: { + ...(m.meta || {}), + judge_rationale: String(e), + }, + }; + })); + }); + + if (wikidataEnrich) { + chatGraphragKbPostprocess({ + query: resp.rewritten_query || userInput, + answer: resp.graphrag_raw_answer || '', + reasoning_subgraph: (resp.reasoning_subgraph || []) as Array>, + api_url, + api_key, + model, + wikidata_enrich: true, + mode: 'wikidata', + }) + .then((pp) => { + setMessages((prev) => prev.map((m) => { + if (m.id !== assistantId || m.role !== 'assistant') return m; + const appendix = (pp.wikidata_appendix || '').trim(); + const base = m.content || ''; + const nextContent = appendix ? 
// End of handleChat: a non-empty wikidata appendix is joined to the existing content with a
// blank line. The outer catch removes the just-appended user message (prev.slice(0, -1) —
// the assistant message is only added after a successful await, so the last entry is the
// user message) and restores the input text so the user can retry; finally clears the
// loading flag. Then handleMerge: validates two workspace paths and LLM credentials, calls
// mergeGraphragKb, persists the merged workspace descriptor to localStorage under storageKey,
// updates component state, and pre-fills mergeA with the merged dir. The trailing
// "return (" opens the component's JSX, whose markup was stripped in extraction (see L67+).
`${base}\n\n${appendix}` : base; + return { + ...m, + content: nextContent, + postprocessWikidataPending: false, + postprocessPending: !!m.postprocessSubgraphPending, + }; + })); + }) + .catch(() => { + setMessages((prev) => prev.map((m) => { + if (m.id !== assistantId || m.role !== 'assistant') return m; + return { + ...m, + postprocessWikidataPending: false, + postprocessPending: !!m.postprocessSubgraphPending, + }; + })); + }); + } + } + } catch (err) { + showToast(String(err), 'error'); + setMessages((prev) => prev.slice(0, -1)); + setInputValue(userInput); + } finally { setChatLoading(false); } + }; + + const handleMerge = async () => { + if (!notebookId) { showToast(L.noNotebook, 'warning'); return; } + const a = mergeA.trim(); const b = mergeB.trim(); + if (!a || !b) { showToast(locale === 'zh' ? '请填写两个 workspace 路径' : 'Enter both workspace paths', 'warning'); return; } + const { api_url, api_key, model } = llmBody(); + if (!api_url || !api_key) { showToast(L.apiWarn, 'warning'); return; } + setMergeLoading(true); + try { + const res = await mergeGraphragKb({ + notebook_id: notebookId, notebook_title: notebookTitle, email: email || '', + api_url, api_key, model, workspace_dir_a: a, workspace_dir_b: b, dedupe: mergeDedupe, + }); + const next: GraphragWorkspacePersist = { workspace_dir: res.merged_workspace_dir, updatedAt: Date.now(), num_chunks: res.num_chunks }; + if (storageKey) localStorage.setItem(storageKey, JSON.stringify(next)); + setPersist(next); + setMergeA(res.merged_workspace_dir); + showToast(L.mergeOk, 'success'); + } catch (e: unknown) { + showToast(e instanceof Error ? e.message : String(e), 'error'); + } finally { setMergeLoading(false); } + }; + + return ( +
+
+ +
+
{L.headerTitle}
+
{L.headerSub}
+
+
+ +
+
+

{L.indexBtn}

+
+ + +
+
+ + setModelName(e.target.value)} + className="w-full max-w-md px-3 py-2 border border-ios-gray-200 rounded-lg text-sm" + placeholder={defaultGraphragModel()} + /> +
+ + + {persist && ( +
+
{L.summary}
+
+ {L.chunks}: {persist.num_chunks ?? '—'} +
+
+ {L.workspace}: + {persist.workspace_dir} + +
+
+ )} +
+ +
+
+ {L.searchMethodLabel} + + + +
+ +
+ {messages.length === 0 && ( +
+ {persist?.workspace_dir ? L.emptyReady : L.emptyNoIndex} +
+ )} + {messages.map((msg) => ( +
+
+ {msg.role === 'user' ? ( +
{msg.content}
+ ) : ( +
+
+ {msg.content || '—'} +
+ {msg.meta && ( + + )} + {msg.postprocessSubgraphPending ? ( +
+ + {L.postprocessSubgraphPending} +
+ ) : null} + {msg.postprocessWikidataPending ? ( +
+ + {L.postprocessWikidataPending} +
+ ) : null} +
+ )} +
+
+ ))} + {chatLoading && ( +
+
+ +
+
+ )} +
+
+ +
+