update for 1. 优化 2.中英切换

fix somethings
1. Add 登陆功能
2026-06-10 11:10:36 +08:00 · 2026-06-08 11:16:28 +08:00 · 2026-06-05 18:00:31 +08:00
105 changed files with 18044 additions and 801 deletions
--- a/.env
+++ b/.env
@@ -48,8 +48,16 @@ CHUNK_OVERLAP=50
 MAX_FILE_SIZE_MB=100
 PARSER_BACKEND=aliyun
 CHUNK_BACKEND=aliyun
-# 文档元数据存储后端：json（默认）或 postgres
-DOCUMENT_REPOSITORY_BACKEND=json
+# 文档元数据存储后端：启用 postgres 以激活合规分析历史记录（Direction B）及 Finding Chat 持久化（Direction C）
+DOCUMENT_REPOSITORY_BACKEND=postgres
+# Set to true only when a Celery worker is actually running (./dev.sh start worker).
+# Default false: processing runs in FastAPI's threadpool — no external worker needed.
+USE_CELERY_WORKER=false
+
+# ===== 法规感知爬取配置 =====
+PERCEPTION_CRAWL_TIMEOUT_SECONDS=120
+PERCEPTION_MAX_EVENTS_PER_SOURCE=100
+PERCEPTION_DIFF_SIMILARITY_THRESHOLD=0.85

 # ===== API配置 =====
 API_HOST=0.0.0.0
@@ -92,3 +100,23 @@ ALIYUN_LLM_ENHANCEMENT=true
 ALIYUN_ENHANCEMENT_MODE=VLM
 DOCUMENT_PARSE_ARTIFACT_PREFIX=artifacts
 PARSER_FAILURE_MODE=fail
+
+# ===== Reranker 配置 =====
+RERANKER_ENABLED=true
+RERANKER_BASE_URL=http://6.86.80.4:30080/v1
+RERANKER_MODEL=BAAI/bge-reranker-v2-m3
+RERANKER_API_KEY=
+RERANKER_TOP_K=5
+
+# ===== 会话持久化 =====
+SESSION_BACKEND=redis
+
+# ===== 认证配置 =====
+# 生产环境请修改为强随机密钥: python -c "import secrets; print(secrets.token_hex(32))"
+AUTH_SECRET_KEY=ai-compliance-hub-jwt-secret-2026-tsystems
+AUTH_ALGORITHM=HS256
+AUTH_TOKEN_EXPIRE_MINUTES=480
+AUTH_ENABLED=true
+
+# ===== CORS =====
+CORS_ALLOW_ORIGINS=http://localhost:5173
--- a/.env.development
+++ b/.env.development
@@ -31,5 +31,5 @@ POSTGRES_PASSWORD=postgresql123456
 POSTGRES_DB=compliance_db

 # ===== 文档元数据后端 =====
-# 改为 postgres 以启用 PG 持久化（structure_nodes + semantic_blocks 入库）
+# 改为 postgres 以启用合规分析历史记录（Direction B）和 Finding Chat（Direction C）
 DOCUMENT_REPOSITORY_BACKEND=json
--- a/.env.example
+++ b/.env.example
@@ -50,7 +50,19 @@ DOCUMENT_METADATA_PATH=backend/data/documents.json
 PARSER_BACKEND=aliyun
 CHUNK_BACKEND=aliyun
 # 文档元数据存储后端：json（默认，无需数据库）或 postgres（启用 PG 持久化）
+# ⚠  以下功能需要 postgres（设为 json 时功能静默降级或报 500）：
+#   - Direction B: 合规分析历史记录 (/compliance/history/*)
+#   - Direction B: DOCX 报告下载
+#   - Direction C: Finding Chat 消息持久化
 DOCUMENT_REPOSITORY_BACKEND=json
+# Set to true only when a Celery worker is running (./dev.sh start worker).
+# Default false: document processing runs in FastAPI's threadpool (no external worker needed).
+USE_CELERY_WORKER=false
+
+# ===== 法规感知爬取配置 =====
+PERCEPTION_CRAWL_TIMEOUT_SECONDS=120
+PERCEPTION_MAX_EVENTS_PER_SOURCE=100
+PERCEPTION_DIFF_SIMILARITY_THRESHOLD=0.85

 # ===== 阿里云文档解析 =====
 ALIBABA_ACCESS_KEY_ID=your_aliyun_access_key_id
@@ -96,11 +108,15 @@ RAG_TOP_K=10
 RAG_RETRIEVAL_TOP_K=20
 RAG_MAX_CONTEXT_TOKENS=4000
 RAG_SUMMARY_MAX_TOKENS=1024
+RAG_SKILLS_MAX_TOKENS=2048

-# ===== Reranker配置（Cross-Encoder精排，默认关闭）=====
-# 设置 RERANKER_ENABLED=true 并配置 RERANKER_BASE_URL 以启用精排
-RERANKER_ENABLED=false
-RERANKER_BASE_URL=
+# ── Reranker (Cross-Encoder) ──────────────────────────────────────────────────
+# Set RERANKER_ENABLED=true and point to a TEI or Cohere-compatible rerank API.
+# Recommended model: BAAI/bge-reranker-v2.5-gemma2-lightweight (lighter) or
+#                    BAAI/bge-reranker-v2-m3 (heavier, higher quality).
+# The endpoint must expose POST /rerank (TEI style) or POST /v1/rerank (Cohere style).
+RERANKER_ENABLED=true
+RERANKER_BASE_URL=http://6.86.80.4:30080/v1
 RERANKER_MODEL=BAAI/bge-reranker-v2-m3
 RERANKER_API_KEY=
 RERANKER_TOP_K=5
@@ -108,3 +124,20 @@ RERANKER_TOP_K=5
 # ===== 会话配置 =====
 SESSION_MAX_SESSIONS=100
 SESSION_TIMEOUT_MINUTES=30
+# SESSION_BACKEND=redis 启用 Redis 持久化会话（需要 Redis 可用，推荐生产环境）
+# SESSION_BACKEND=memory 使用内存会话（重启丢失，适合本地开发）
+SESSION_BACKEND=memory
+
+# ===== 认证配置 (Auth) =====
+# 生产环境必须替换为强随机密钥:
+#   python -c "import secrets; print(secrets.token_hex(32))"
+AUTH_SECRET_KEY=change-me-in-production-must-be-32-or-more-characters-long
+AUTH_ALGORITHM=HS256
+# Token 有效期（分钟），默认 8 小时
+AUTH_TOKEN_EXPIRE_MINUTES=480
+# 设为 false 可跳过认证（仅限本地开发调试，生产必须 true）
+AUTH_ENABLED=true
+
+# ===== CORS =====
+# 逗号分隔的允许跨域来源列表，生产环境绝不能使用 *
+CORS_ALLOW_ORIGINS=http://localhost:5173
--- a/.superpowers/brainstorm/1055-1780892298/content/directions.html
+++ b/.superpowers/brainstorm/1055-1780892298/content/directions.html
@@ -0,0 +1,56 @@
+<h2>Compliance Analysis — 哪个方向最值得优化？</h2>
+<p class="subtitle">基于代码深度分析，发现了 4 个有价值的改进方向。选择你最希望深入的那个。</p>
+
+<div class="options">
+
+  <div class="option" data-choice="A" onclick="toggleSelect(this)">
+    <div class="letter">A</div>
+    <div class="content">
+      <h3>⚡ 分析质量提升</h3>
+      <p>并行子句处理（速度 3–5×）、跨编码器重排序、置信度过滤、修复 highlight_terms 失效 Bug、减少 LLM 静默失败。</p>
+      <div class="pros-cons" style="margin-top:10px">
+        <div class="pros"><h4>收益</h4><ul><li>更快、更准确的分析</li><li>消除当前 Bug</li></ul></div>
+        <div class="cons"><h4>难度</h4><ul><li>需要改造 pipeline.py</li></ul></div>
+      </div>
+    </div>
+  </div>
+
+  <div class="option" data-choice="B" onclick="toggleSelect(this)">
+    <div class="letter">B</div>
+    <div class="content">
+      <h3>📋 分析历史 &amp; 专业报告</h3>
+      <p>持久化分析记录（PostgreSQL）、历史对比、PDF/DOCX 专业报告导出、分析版本追踪。</p>
+      <div class="pros-cons" style="margin-top:10px">
+        <div class="pros"><h4>收益</h4><ul><li>结果不再丢失</li><li>可交付给客户的报告</li></ul></div>
+        <div class="cons"><h4>难度</h4><ul><li>需要新增数据库表</li></ul></div>
+      </div>
+    </div>
+  </div>
+
+  <div class="option" data-choice="C" onclick="toggleSelect(this)">
+    <div class="letter">C</div>
+    <div class="content">
+      <h3>💬 深度 Chat 增强</h3>
+      <p>每个 Finding 独立对话线程（持久化）、Chat 上下文绑定真实检索到的法规原文、多轮追问记忆、快捷建议问句生成。</p>
+      <div class="pros-cons" style="margin-top:10px">
+        <div class="pros"><h4>收益</h4><ul><li>Finding 解读深度大幅提升</li><li>用户粘性强</li></ul></div>
+        <div class="cons"><h4>难度</h4><ul><li>需重构 chat 端点</li></ul></div>
+      </div>
+    </div>
+  </div>
+
+  <div class="option" data-choice="D" onclick="toggleSelect(this)">
+    <div class="letter">D</div>
+    <div class="content">
+      <h3>📑 自定义规则 &amp; 模板</h3>
+      <p>用户自定义合规规则库、按行业预设模板（汽车/金融/医疗）、Prompt 版本管理、A/B 测试不同提示策略。</p>
+      <div class="pros-cons" style="margin-top:10px">
+        <div class="pros"><h4>收益</h4><ul><li>适应不同行业场景</li><li>可配置，无需改代码</li></ul></div>
+        <div class="cons"><h4>难度</h4><ul><li>需要规则管理 UI</li></ul></div>
+      </div>
+    </div>
+  </div>
+
+</div>
+
+<p class="subtitle" style="margin-top:20px">💡 也可以多选，或者在终端告诉我你有其他想法。</p>
--- a/.superpowers/brainstorm/1055-1780892298/state/events
+++ b/.superpowers/brainstorm/1055-1780892298/state/events
@@ -0,0 +1,3 @@
+{"type":"click","text":"C\n    \n      💬 深度 Chat 增强\n      每个 Finding 独立对话线程（持久化）、Chat 上下文绑定真实检索到的法规原文、多轮追问记忆、快捷建议问句生成。\n      \n        收益Finding 解读深度大幅提升用户粘性强\n        难度需重构 chat 端点","choice":"C","id":null,"timestamp":1780897984866}
+{"type":"click","text":"B\n    \n      📋 分析历史 & 专业报告\n      持久化分析记录（PostgreSQL）、历史对比、PDF/DOCX 专业报告导出、分析版本追踪。\n      \n        收益结果不再丢失可交付给客户的报告\n        难度需要新增数据库表","choice":"B","id":null,"timestamp":1780897985879}
+{"type":"click","text":"A\n    \n      ⚡ 分析质量提升\n      并行子句处理（速度 3–5×）、跨编码器重排序、置信度过滤、修复 highlight_terms 失效 Bug、减少 LLM 静默失败。\n      \n        收益更快、更准确的分析消除当前 Bug\n        难度需要改造 pipeline.py","choice":"A","id":null,"timestamp":1780897986554}
--- a/.superpowers/brainstorm/1055-1780892298/state/server-stopped
+++ b/.superpowers/brainstorm/1055-1780892298/state/server-stopped
@@ -0,0 +1 @@
+{"reason":"idle timeout","timestamp":1780894411095}
--- a/.superpowers/brainstorm/1055-1780892298/state/server.pid
+++ b/.superpowers/brainstorm/1055-1780892298/state/server.pid
@@ -0,0 +1 @@
+1055
--- a/backend/app/api/dependencies/init.py
+++ b/backend/app/api/dependencies/init.py
@@ -0,0 +1,5 @@
+"""FastAPI dependency functions for authentication and authorisation.
+
+Import `get_current_user` or `require_role` into route modules to protect
+endpoints. Both use the shared JWTHandler wired through bootstrap.
+"""
--- a/backend/app/api/dependencies/auth.py
+++ b/backend/app/api/dependencies/auth.py
@@ -0,0 +1,72 @@
+"""FastAPI dependencies for JWT authentication.
+
+Usage in a route:
+    from app.api.dependencies.auth import get_current_user, require_role
+    from app.domain.auth.models import UserRole
+
+    @router.get("/protected")
+    async def protected(user: UserClaims = Depends(get_current_user)):
+        return {"user": user.username}
+
+    @router.delete("/admin-only")
+    async def admin_only(user: UserClaims = Depends(require_role(UserRole.ADMIN))):
+        ...
+"""
+
+from __future__ import annotations
+
+from fastapi import Depends, HTTPException, status
+from fastapi.security import HTTPAuthorizationCredentials, HTTPBearer
+
+from app.config.settings import settings
+from app.domain.auth.models import UserClaims, UserRole
+from app.shared.bootstrap import get_jwt_handler
+
+# Use Bearer token scheme — client sends `Authorization: Bearer <token>`.
+_bearer = HTTPBearer(auto_error=False)
+
+
+async def get_current_user(
+    credentials: HTTPAuthorizationCredentials | None = Depends(_bearer),
+) -> UserClaims:
+    """Extract and validate the JWT from the Authorization header.
+
+    Returns the decoded UserClaims on success.
+    Raises HTTP 401 when the token is missing, expired, or invalid.
+    When auth_enabled=False (development), returns a synthetic admin user.
+    """
+    if not settings.auth_enabled:
+        # Development bypass — never enable this in production.
+        return UserClaims(user_id="dev", username="dev-admin", role=UserRole.ADMIN)
+
+    if credentials is None:
+        raise HTTPException(
+            status_code=status.HTTP_401_UNAUTHORIZED,
+            detail="Missing authentication token",
+            headers={"WWW-Authenticate": "Bearer"},
+        )
+    try:
+        return get_jwt_handler().decode_token(credentials.credentials)
+    except ValueError as exc:
+        raise HTTPException(
+            status_code=status.HTTP_401_UNAUTHORIZED,
+            detail=str(exc),
+            headers={"WWW-Authenticate": "Bearer"},
+        ) from exc
+
+
+def require_role(*roles: UserRole):
+    """Return a dependency that enforces one of the given roles.
+
+    Example:
+        Depends(require_role(UserRole.ADMIN, UserRole.LEGAL))
+    """
+    async def _check(user: UserClaims = Depends(get_current_user)) -> UserClaims:
+        """Verify the user holds one of the required roles."""
+        if user.role not in roles:
+            raise HTTPException(
+                status_code=status.HTTP_403_FORBIDDEN,
+                detail=f"Role '{user.role}' is not permitted. Required: {[r.value for r in roles]}",
+            )
+        return user
+    return _check
--- a/backend/app/api/main.py
+++ b/backend/app/api/main.py
@@ -8,6 +8,7 @@ from fastapi.middleware.cors import CORSMiddleware
 from fastapi.responses import JSONResponse
 from loguru import logger

+from app.api.middleware.audit import AuditMiddleware
 from app.api.models import ErrorResponse
 from app.api.routes import api_router
 from app.config.logging import setup_logging
@@ -46,14 +47,23 @@ app = FastAPI(
    redoc_url="/redoc",
 )

+# Tighten CORS — only allow configured origins.
+# Set CORS_ALLOW_ORIGINS in .env to the real frontend URL in production.
+_ORIGINS = [o.strip() for o in settings.cors_allow_origins.split(",") if o.strip()]
+if not _ORIGINS:
+    _ORIGINS = ["http://localhost:5173"]
+
 app.add_middleware(
    CORSMiddleware,
-    allow_origins=["*"],
+    allow_origins=_ORIGINS,
    allow_credentials=True,
    allow_methods=["*"],
    allow_headers=["*"],
 )

+# Audit middleware logs every authenticated API call for compliance traceability.
+app.add_middleware(AuditMiddleware)
+
 app.include_router(api_router, prefix="/api/v1")


--- a/backend/app/api/middleware/init.py
+++ b/backend/app/api/middleware/init.py
@@ -0,0 +1 @@
+"""HTTP middleware for cross-cutting concerns: audit logging."""
--- a/backend/app/api/middleware/audit.py
+++ b/backend/app/api/middleware/audit.py
@@ -0,0 +1,56 @@
+"""Audit logging middleware.
+
+Logs every API request with method, path, status code, response time,
+and the authenticated user identity (extracted from the JWT when present).
+Log lines are structured so they can be ingested by ELK / Loki.
+"""
+
+from __future__ import annotations
+
+import time
+
+from fastapi import Request, Response
+from loguru import logger
+from starlette.middleware.base import BaseHTTPMiddleware
+
+
+class AuditMiddleware(BaseHTTPMiddleware):
+    """Log all API calls. Skips health/docs paths to reduce noise."""
+
+    # Paths that produce no audit log entry.
+    _SKIP_PREFIXES = ("/health", "/docs", "/redoc", "/openapi.json")
+
+    async def dispatch(self, request: Request, call_next) -> Response:
+        """Intercept the request, call the handler, and log the outcome."""
+        path = request.url.path
+        if path == "/" or any(path == p or path.startswith(p + "/") for p in self._SKIP_PREFIXES):
+            return await call_next(request)
+
+        start = time.perf_counter()
+        response = await call_next(request)
+        elapsed_ms = int((time.perf_counter() - start) * 1000)
+
+        # Extract user identity from JWT header for structured audit records.
+        # The token is not re-validated here — auth dependencies do that upstream.
+        user_id = "anonymous"
+        username = "anonymous"
+        auth_header = request.headers.get("authorization", "")
+        if auth_header.startswith("Bearer "):
+            try:
+                from app.shared.bootstrap import get_jwt_handler
+                claims = get_jwt_handler().decode_token(auth_header[7:])
+                user_id = claims.user_id
+                username = claims.username
+            except Exception:
+                pass
+
+        logger.info(
+            "AUDIT method={} path={} status={} elapsed_ms={} user_id={} username={}",
+            request.method,
+            path,
+            response.status_code,
+            elapsed_ms,
+            user_id,
+            username,
+        )
+        return response
--- a/backend/app/api/routes/init.py
+++ b/backend/app/api/routes/init.py
@@ -1,6 +1,7 @@
 """Initialize the app.api.routes package."""

 from fastapi import APIRouter
+from .auth import router as auth_router
 from .compliance import router as compliance_router
 from .documents import router as documents_router
 from .knowledge import router as knowledge_router
@@ -14,7 +15,8 @@ from .rag import router as rag_router
 # Keep package boundaries explicit so backend imports stay predictable.
 api_router = APIRouter()

-# Keep package boundaries explicit so backend imports stay predictable.
+# Auth routes first so /auth/token is easy to discover.
+api_router.include_router(auth_router)
 api_router.include_router(documents_router)
 api_router.include_router(knowledge_router)
 api_router.include_router(agent_router)
@@ -25,6 +27,7 @@ api_router.include_router(rag_router)

 __all__ = [
    "api_router",
+    "auth_router",
    "documents_router",
    "knowledge_router",
    "agent_router",
--- a/backend/app/api/routes/auth.py
+++ b/backend/app/api/routes/auth.py
@@ -0,0 +1,63 @@
+"""Authentication routes — token issuance only.
+
+POST /auth/token  — exchange username + password for a JWT.
+GET  /auth/me     — return the current user identity (requires token).
+"""
+
+from __future__ import annotations
+
+from fastapi import APIRouter, Depends, HTTPException, status
+from fastapi.security import OAuth2PasswordRequestForm
+from pydantic import BaseModel
+
+from app.api.dependencies.auth import get_current_user
+from app.config.settings import settings
+from app.domain.auth.models import UserClaims
+from app.shared.bootstrap import get_jwt_handler, get_user_store
+
+
+router = APIRouter(prefix="/auth", tags=["认证"])
+
+
+class TokenResponse(BaseModel):
+    """JWT token response body."""
+
+    access_token: str
+    token_type: str = "bearer"
+    expires_in: int
+
+
+@router.post("/token", response_model=TokenResponse)
+async def login(form: OAuth2PasswordRequestForm = Depends()):
+    """Issue a JWT for valid username + password credentials.
+
+    Uses standard OAuth2 password grant form fields — compatible with
+    Swagger UI Authorize button.
+    """
+    user = get_user_store().authenticate(form.username, form.password)
+    if user is None:
+        raise HTTPException(
+            status_code=status.HTTP_401_UNAUTHORIZED,
+            detail="Incorrect username or password",
+            headers={"WWW-Authenticate": "Bearer"},
+        )
+    token = get_jwt_handler().create_access_token(
+        user_id=user.id,
+        username=user.username,
+        role=user.role,
+    )
+    return TokenResponse(
+        access_token=token,
+        token_type="bearer",
+        expires_in=settings.auth_token_expire_minutes * 60,
+    )
+
+
+@router.get("/me")
+async def get_me(current_user: UserClaims = Depends(get_current_user)):
+    """Return the identity of the currently authenticated user."""
+    return {
+        "user_id": current_user.user_id,
+        "username": current_user.username,
+        "role": current_user.role.value,
+    }
--- a/backend/app/api/routes/compliance.py
+++ b/backend/app/api/routes/compliance.py
@@ -7,10 +7,12 @@ import json
 from pathlib import Path
 from typing import AsyncGenerator, Optional

-from fastapi import APIRouter, File, Form, UploadFile
+from fastapi import APIRouter, Depends, File, Form, UploadFile
 from fastapi.responses import StreamingResponse
 from loguru import logger

+from app.api.dependencies.auth import get_current_user
+from app.domain.auth.models import UserClaims
 from app.schemas.compliance import (
    AnalyzeResponse,
    ComplianceChatRequest,
@@ -75,6 +77,7 @@ async def analyze_stream(
    file: Optional[UploadFile] = File(None),
    domains: Optional[str] = Form(None),
    title: Optional[str] = Form(None),
+    current_user: UserClaims = Depends(get_current_user),
 ):
    """Stream compliance analysis as SSE events.

@@ -82,10 +85,9 @@ async def analyze_stream(
    Events: stage | source | finding | done | error
    """
    from app.application.compliance.pipeline import (
-        check_clause_compliance,
        extract_text_from_doc_id,
        extract_text_from_file,
-        retrieve_for_clause,
+        run_clauses_parallel,
        split_into_clauses,
        synthesize_conclusion,
    )
@@ -133,22 +135,28 @@ async def analyze_stream(
            await asyncio.sleep(0)
            clauses: list[str] = await asyncio.to_thread(split_into_clauses, para_text, client)

-            # ── Stage 3: retrieve + gap check per clause ──────────────────
+            # ── Stage 3: retrieve + gap check (parallel across all clauses) ────────────
            findings: list[dict] = []

-            for i, clause in enumerate(clauses):
-                yield _sse({
-                    "type": "stage",
-                    "stage": "analyzing",
-                    "label": f"Analyzing clause {i + 1}/{len(clauses)}…",
-                })
-                await asyncio.sleep(0)
+            yield _sse({
+                "type": "stage",
+                "stage": "analyzing",
+                "label": f"Analyzing {len(clauses)} clauses in parallel…",
+            })
+            await asyncio.sleep(0)

-                chunks = await asyncio.to_thread(
-                    retrieve_for_clause, clause, retrieval_service, 5, domains or None
-                )
+            clause_results = await run_clauses_parallel(
+                clauses, retrieval_service, client,
+                top_k=5,
+                domains=domains or None,
+            )

-                # Emit source events
+            for res in clause_results:
+                i = res["index"]
+                chunks = res["chunks"]
+                finding = res["finding"]
+
+                # Emit source events for this clause
                for chunk in chunks[:3]:
                    yield _sse({
                        "type": "source",
@@ -158,12 +166,11 @@ async def analyze_stream(
                        "status": "retrieved",
                        "full_content": (getattr(chunk, "text", "") or "")[:300],
                    })
-                await asyncio.sleep(0)

-                finding = await asyncio.to_thread(check_clause_compliance, clause, chunks, client)
                if finding:
                    findings.append(finding)
                    yield _sse({"type": "finding", **finding})
+
                await asyncio.sleep(0)

            # ── Stage 4: synthesize conclusion ────────────────────────────
@@ -175,6 +182,45 @@ async def analyze_stream(
            )
            yield _sse({"type": "done", **conclusion_data})

+            # Auto-save analysis to database
+            try:
+                from app.shared.bootstrap import get_compliance_repository
+                from app.domain.compliance.ports import AnalysisRecord, FindingRecord
+                from datetime import datetime
+
+                repo = get_compliance_repository()
+                finding_records = [
+                    FindingRecord(
+                        id="",
+                        analysis_id="",
+                        seq=i,
+                        title=f.get("title", ""),
+                        description=f.get("desc", ""),
+                        status=f.get("status", "ok"),
+                        clause_ref=f.get("clause_ref"),
+                    )
+                    for i, f in enumerate(findings)
+                ]
+                record = AnalysisRecord(
+                    id="",
+                    created_at=datetime.utcnow(),
+                    created_by=current_user.username if hasattr(current_user, "username") else None,
+                    doc_name=file_name or (title or "Pasted text"),
+                    standard_name=title or "",
+                    risk_score=conclusion_data.get("risk_score", 0),
+                    conclusion=conclusion_data.get("conclusion", ""),
+                    actions=conclusion_data.get("actions", []),
+                    para_text=conclusion_data.get("para_text", ""),
+                    highlight_terms=conclusion_data.get("highlight_terms", []),
+                    findings=finding_records,
+                )
+                analysis_id = await asyncio.to_thread(repo.save_analysis, record)
+                yield _sse({"type": "saved", "analysis_id": analysis_id})
+            except NotImplementedError:
+                pass  # No postgres backend configured — skip saving
+            except Exception as exc:
+                logger.warning("Failed to auto-save compliance analysis: {}", exc)
+
        except Exception as exc:
            logger.exception("analyze-stream pipeline error")
            yield _sse({"type": "error", "text": str(exc)})
@@ -222,3 +268,226 @@ async def compliance_chat(segment_id: int, request: ComplianceChatRequest):
        media_type="text/event-stream",
        headers={"Cache-Control": "no-cache", "Connection": "keep-alive", "X-Accel-Buffering": "no"},
    )
+
+
+@router.get("/history")
+async def list_history(
+    limit: int = 20,
+    offset: int = 0,
+    current_user: UserClaims = Depends(get_current_user),
+):
+    """Return paginated list of saved compliance analyses (newest first)."""
+    from app.shared.bootstrap import get_compliance_repository
+    try:
+        repo = get_compliance_repository()
+        records = await asyncio.to_thread(repo.list_analyses, limit, offset)
+        return [
+            {
+                "id": r.id,
+                "created_at": r.created_at.isoformat(),
+                "created_by": r.created_by,
+                "doc_name": r.doc_name,
+                "standard_name": r.standard_name,
+                "risk_score": r.risk_score,
+                "finding_count": len(r.findings),
+            }
+            for r in records
+        ]
+    except NotImplementedError:
+        return []
+
+
+@router.get("/history/{analysis_id}")
+async def get_history_item(
+    analysis_id: str,
+    current_user: UserClaims = Depends(get_current_user),
+):
+    """Return full analysis record including findings."""
+    from app.shared.bootstrap import get_compliance_repository
+    from fastapi import HTTPException
+    repo = get_compliance_repository()
+    record = await asyncio.to_thread(repo.get_analysis, analysis_id)
+    if not record:
+        raise HTTPException(status_code=404, detail="Analysis not found")
+    return {
+        "id": record.id,
+        "created_at": record.created_at.isoformat(),
+        "created_by": record.created_by,
+        "doc_name": record.doc_name,
+        "standard_name": record.standard_name,
+        "risk_score": record.risk_score,
+        "conclusion": record.conclusion,
+        "actions": record.actions,
+        "para_text": record.para_text,
+        "highlight_terms": record.highlight_terms,
+        "findings": [
+            {
+                "id": f.id,
+                "seq": f.seq,
+                "title": f.title,
+                "description": f.description,
+                "status": f.status,
+                "clause_ref": f.clause_ref,
+            }
+            for f in record.findings
+        ],
+    }
+
+
+@router.delete("/history/{analysis_id}", status_code=204)
+async def delete_history_item(
+    analysis_id: str,
+    current_user: UserClaims = Depends(get_current_user),
+):
+    """Delete a saved analysis (cascade removes findings and chat messages)."""
+    from app.shared.bootstrap import get_compliance_repository
+    repo = get_compliance_repository()
+    await asyncio.to_thread(repo.delete_analysis, analysis_id)
+
+
+@router.get("/history/{analysis_id}/download")
+async def download_history_docx(
+    analysis_id: str,
+    current_user: UserClaims = Depends(get_current_user),
+):
+    """Return a DOCX compliance report for the given analysis."""
+    from app.shared.bootstrap import get_compliance_repository
+    from app.infrastructure.compliance.docx_export import generate_docx
+    from fastapi import HTTPException
+    from fastapi.responses import Response
+
+    repo = get_compliance_repository()
+    record = await asyncio.to_thread(repo.get_analysis, analysis_id)
+    if not record:
+        raise HTTPException(status_code=404, detail="Analysis not found")
+
+    docx_bytes = await asyncio.to_thread(generate_docx, record)
+    safe_name = (record.doc_name or "report").replace(" ", "_")[:50]
+    filename = f"compliance_{safe_name}_{record.created_at.strftime('%Y%m%d')}.docx"
+    return Response(
+        content=docx_bytes,
+        media_type="application/vnd.openxmlformats-officedocument.wordprocessingml.document",
+        headers={"Content-Disposition": f'attachment; filename="{filename}"'},
+    )
+
+
+@router.get("/analyses/{analysis_id}/findings/{finding_id}/chat")
+async def get_finding_chat_history(
+    analysis_id: str,
+    finding_id: str,
+    current_user: UserClaims = Depends(get_current_user),
+):
+    """Return persisted chat messages for a finding thread, oldest first."""
+    from app.shared.bootstrap import get_compliance_repository
+    try:
+        repo = get_compliance_repository()
+        messages = await asyncio.to_thread(repo.get_messages, finding_id)
+        return messages
+    except NotImplementedError:
+        return []
+
+
+@router.post("/analyses/{analysis_id}/findings/{finding_id}/suggestions")
+async def get_finding_suggestions(
+    analysis_id: str,
+    finding_id: str,
+    current_user: UserClaims = Depends(get_current_user),
+):
+    """Generate 3 LLM-powered follow-up question suggestions for a finding."""
+    from app.application.compliance.pipeline import generate_suggestions
+    from app.shared.bootstrap import get_compliance_repository
+    from app.services.llm.llm_factory import get_llm_client
+    from fastapi import HTTPException
+
+    repo = get_compliance_repository()
+    analysis = await asyncio.to_thread(repo.get_analysis, analysis_id)
+    if not analysis:
+        raise HTTPException(status_code=404, detail="Analysis not found")
+
+    finding = next((f for f in analysis.findings if f.id == finding_id), None)
+    if not finding:
+        raise HTTPException(status_code=404, detail="Finding not found")
+
+    client = get_llm_client(provider=settings.llm_provider, model=settings.llm_model)
+    questions = await asyncio.to_thread(generate_suggestions, finding, analysis, client)
+    return {"questions": questions}
+
+
+@router.post("/analyses/{analysis_id}/findings/{finding_id}/chat")
+async def finding_chat(
+    analysis_id: str,
+    finding_id: str,
+    request: ComplianceChatRequest,
+    current_user: UserClaims = Depends(get_current_user),
+):
+    """Stream a grounded chat response for a specific finding.
+
+    Loads the finding and analysis from DB to build grounded context.
+    Persists both user message and assistant response to finding_chat_messages.
+    """
+    from app.application.compliance.pipeline import build_finding_context
+    from app.shared.bootstrap import get_compliance_repository
+    from fastapi import HTTPException
+
+    repo = get_compliance_repository()
+    analysis = await asyncio.to_thread(repo.get_analysis, analysis_id)
+    if not analysis:
+        raise HTTPException(status_code=404, detail="Analysis not found")
+    finding = next((f for f in analysis.findings if f.id == finding_id), None)
+    if not finding:
+        raise HTTPException(status_code=404, detail="Finding not found")
+
+    # Persist user message
+    await asyncio.to_thread(
+        repo.save_message, analysis_id, finding_id, "user", request.query
+    )
+
+    # Build message history (last 10 messages = 5 turns)
+    history = await asyncio.to_thread(repo.get_messages, finding_id)
+    history_messages = [
+        {"role": m["role"], "content": m["content"]}
+        for m in history[-10:]
+    ]
+
+    # Build grounded system context
+    system_context = build_finding_context(finding, analysis)
+    full_query = f"[Compliance Finding Context]\n{system_context}\n\nUser question: {request.query}"
+
+    assistant_buffer: list[str] = []
+
+    async def generate() -> AsyncGenerator[str, None]:
+        try:
+            _, event_stream = get_agent_conversation_service().stream_chat(
+                query=full_query,
+                top_k=5,
+                prompt_template="compliance_qa",
+            )
+            for event in event_stream:
+                event_type = event.get("event", "")
+                if event_type == "content":
+                    text = event.get("data", "")
+                    if text:
+                        assistant_buffer.append(text)
+                        yield _sse({"type": "chunk", "text": text})
+                elif event_type == "done":
+                    yield _sse({"type": "done"})
+                await asyncio.sleep(0)
+        except Exception as exc:
+            logger.exception("finding_chat stream error")
+            yield _sse({"type": "error", "text": str(exc)})
+        finally:
+            # Persist assistant response after stream completes
+            full_response = "".join(assistant_buffer)
+            if full_response:
+                try:
+                    await asyncio.to_thread(
+                        repo.save_message, analysis_id, finding_id, "assistant", full_response
+                    )
+                except Exception as exc:
+                    logger.warning("Failed to persist assistant message: {}", exc)
+
+    return StreamingResponse(
+        generate(),
+        media_type="text/event-stream",
+        headers={"Cache-Control": "no-cache", "Connection": "keep-alive", "X-Accel-Buffering": "no"},
+    )
--- a/backend/app/api/routes/documents.py
+++ b/backend/app/api/routes/documents.py
@@ -5,12 +5,15 @@ from __future__ import annotations
 from io import BytesIO
 from urllib.parse import quote

-from fastapi import APIRouter, File, Form, HTTPException, UploadFile
+from fastapi import APIRouter, BackgroundTasks, Depends, File, Form, HTTPException, UploadFile
 from fastapi.responses import StreamingResponse
 from loguru import logger

+from app.api.dependencies.auth import get_current_user
 from app.api.models import DocumentUploadResponse
 from app.application.documents import DocumentProcessResult
+from app.config.settings import settings
+from app.domain.auth.models import UserClaims
 from app.shared.bootstrap import get_document_command_service, get_document_query_service
 # Keep route handlers close to their transport-layer wiring for easier auditing.

@@ -31,16 +34,60 @@ def _document_response(result: DocumentProcessResult) -> DocumentUploadResponse:
    )


+def _run_process_in_background(
+    *,
+    doc_id: str,
+    file_name: str,
+    final_doc_name: str,
+    content: bytes,
+    regulation_type: str,
+    version: str,
+    generate_summary: bool,
+    run_id: str | None,
+) -> None:
+    """Run document processing synchronously inside a FastAPI BackgroundTask thread.
+
+    FastAPI executes BackgroundTasks in a threadpool executor, so blocking I/O
+    (parser API calls, embedding, Milvus upsert) is safe here.
+    """
+    try:
+        svc = get_document_command_service()
+        svc._process_document(
+            doc_id=doc_id,
+            file_name=file_name,
+            final_doc_name=final_doc_name,
+            content=content,
+            regulation_type=regulation_type,
+            version=version,
+            generate_summary=generate_summary,
+            run_id=run_id,
+        )
+    except Exception:
+        logger.exception("BackgroundTask document processing failed: doc_id={}", doc_id)
+
+
@router.post("/upload", response_model=DocumentUploadResponse)
 async def upload_document(
+    background_tasks: BackgroundTasks,
    file: UploadFile = File(..., description="上传的文档文件"),
    doc_id: str | None = Form(None, description="客户端预分配的文档ID，不传则自动生成"),
    doc_name: str | None = Form(None, description="文档名称"),
    regulation_type: str | None = Form(None, description="法规类型"),
    version: str | None = Form(None, description="文档版本"),
    generate_summary: bool = Form(False, description="是否生成摘要"),
+    sync: bool = Form(False, description="同步处理（演示/测试用，默认异步处理）"),
+    current_user: UserClaims = Depends(get_current_user),
 ):
-    """Handle upload document."""
+    """Upload a document and process it asynchronously.
+
+    Default path (sync=false):
+      1. Store binary to MinIO immediately — returns within seconds.
+      2. Schedule parse→embed→index as a FastAPI BackgroundTask (same process,
+         threadpool) OR enqueue to Celery workers when USE_CELERY_WORKER=true.
+      3. Poll GET /documents/status/{doc_id} for progress.
+
+    sync=true path: full inline processing, blocks until complete (demo / CI use).
+    """
    content = await file.read()
    if not file.filename:
        raise HTTPException(status_code=400, detail="文件名不能为空")
@@ -48,19 +95,73 @@ async def upload_document(
        raise HTTPException(status_code=400, detail="上传文件为空")

    try:
-        result = get_document_command_service().upload_and_process(
-            doc_id=doc_id,
-            file_name=file.filename,
-            content=content,
-            content_type=file.content_type or "application/octet-stream",
-            doc_name=doc_name,
-            regulation_type=regulation_type or "",
-            version=version or "",
-            generate_summary=generate_summary,
-        )
+        svc = get_document_command_service()
+
+        if sync:
+            # Synchronous fallback: full inline processing.
+            result = svc.upload_and_process(
+                doc_id=doc_id,
+                file_name=file.filename,
+                content=content,
+                content_type=file.content_type or "application/octet-stream",
+                doc_name=doc_name,
+                regulation_type=regulation_type or "",
+                version=version or "",
+                generate_summary=generate_summary,
+            )
+        else:
+            # Step 1: store binary and create the document record (fast, sync).
+            stored_doc_id, run_id = svc.store_document(
+                doc_id=doc_id,
+                file_name=file.filename,
+                content=content,
+                content_type=file.content_type or "application/octet-stream",
+                doc_name=doc_name,
+                regulation_type=regulation_type or "",
+                version=version or "",
+                generate_summary=generate_summary,
+            )
+            final_doc_name = doc_name or file.filename
+
+            # Step 2: schedule processing via Celery worker OR FastAPI BackgroundTask.
+            if settings.use_celery_worker:
+                from app.infrastructure.tasks.document_tasks import process_document_task
+                process_document_task.delay(
+                    doc_id=stored_doc_id,
+                    file_name=file.filename,
+                    doc_name=final_doc_name,
+                    regulation_type=regulation_type or "",
+                    version=version or "",
+                    generate_summary=generate_summary,
+                    run_id=run_id,
+                )
+                processing_note = "已入 Celery 队列，由 Worker 处理。"
+            else:
+                # Default: run in FastAPI's threadpool — no external worker needed.
+                background_tasks.add_task(
+                    _run_process_in_background,
+                    doc_id=stored_doc_id,
+                    file_name=file.filename,
+                    final_doc_name=final_doc_name,
+                    content=content,
+                    regulation_type=regulation_type or "",
+                    version=version or "",
+                    generate_summary=generate_summary,
+                    run_id=run_id,
+                )
+                processing_note = "正在后台处理。"
+
+            result = DocumentProcessResult(
+                doc_id=stored_doc_id,
+                doc_name=final_doc_name,
+                status="stored",
+                message=f"文件已存储，{processing_note}请轮询 GET /documents/status/{{doc_id}} 查看进度。",
+            )
+
        if result.status == "failed":
            raise HTTPException(status_code=500, detail=result.message)
        return _document_response(result)
+
    except HTTPException:
        raise
    except Exception as exc:
@@ -106,7 +207,7 @@ async def download_document(doc_id: str):


@router.get("/list")
-async def list_documents():
+async def list_documents(current_user: UserClaims = Depends(get_current_user)):
    """List documents."""
    documents = get_document_query_service().list_documents()
    return {
@@ -148,7 +249,7 @@ async def get_document_management_list():


@router.delete("/{doc_id}")
-async def delete_document(doc_id: str):
+async def delete_document(doc_id: str, current_user: UserClaims = Depends(get_current_user)):
    """Delete a document and its associated data."""
    deleted = get_document_command_service().delete(doc_id)
    if not deleted:
--- a/backend/app/api/routes/perception.py
+++ b/backend/app/api/routes/perception.py
@@ -4,10 +4,12 @@ from __future__ import annotations

 import json

-from fastapi import APIRouter, Query
+from fastapi import APIRouter, Depends, Query
 from fastapi.responses import StreamingResponse

-from app.shared.bootstrap import get_perception_service
+from app.shared.bootstrap import get_crawl_service, get_event_store, get_perception_service
+from app.api.dependencies.auth import get_current_user
+from app.domain.auth.models import UserClaims
 from app.shared.async_utils import iter_in_thread

 router = APIRouter(prefix="/perception", tags=["智能感知"])
@@ -65,3 +67,77 @@ async def analyze_event(event_id: str):
            "X-Accel-Buffering": "no",
        },
    )
+
+
+@router.post("/crawl")
+async def run_crawl(
+    body: dict = None,
+    current_user: UserClaims = Depends(get_current_user),
+):
+    """Trigger manual crawl of regulatory sources. Streams SSE progress.
+
+    Body (optional): {"sources": ["CATARC", "国标委·强制性", "EUR-Lex"]}
+    Omit sources to crawl all registered sources.
+    """
+    sources: list[str] | None = (body or {}).get("sources")
+    crawl_svc = get_crawl_service()
+
+    async def crawl_stream():
+        async for item in iter_in_thread(crawl_svc.run_crawl(sources=sources)):
+            event_name = item.get("event", "message")
+            data = item.get("data", "")
+            if isinstance(data, (dict, list)):
+                data = json.dumps(data, ensure_ascii=False)
+            yield f"event: {event_name}\ndata: {data}\n\n"
+
+    return StreamingResponse(
+        crawl_stream(),
+        media_type="text/event-stream",
+        headers={"Cache-Control": "no-cache", "X-Accel-Buffering": "no"},
+    )
+
+
+@router.post("/events/{event_id}/process")
+async def process_event(
+    event_id: str,
+    current_user: UserClaims = Depends(get_current_user),
+):
+    """Trigger LLM pipeline (extract + assess + diff) for a single event."""
+    from datetime import UTC, datetime
+    from app.infrastructure.perception.llm_pipeline import LlmPipeline
+    from app.shared.bootstrap import get_retrieval_service
+
+    event = get_perception_service().get_event(event_id)
+    if not event:
+        from fastapi import HTTPException
+        raise HTTPException(status_code=404, detail=f"Event {event_id} not found")
+
+    store = get_event_store()
+    pipeline = LlmPipeline()
+
+    structure = pipeline.extract_structure(event)
+    event.update(structure)
+    event["affected_docs"] = pipeline.assess_impact(event, get_retrieval_service())
+    event["processed_at"] = datetime.now(UTC).isoformat()
+    store.upsert(event)
+
+    return {"status": "ok", "event_id": event_id, "processed_at": event["processed_at"]}
+
+
+@router.get("/events/{event_id}/diff")
+async def get_event_diff(event_id: str):
+    """Return semantic diff detail for an event (only available if previously crawled twice)."""
+    event = get_perception_service().get_event(event_id)
+    if not event:
+        from fastapi import HTTPException
+        raise HTTPException(status_code=404, detail=f"Event {event_id} not found")
+    if not event.get("change_summary"):
+        from fastapi import HTTPException
+        raise HTTPException(status_code=404, detail="No diff available for this event")
+    return {
+        "event_id": event_id,
+        "change_summary": event.get("change_summary"),
+        "changed_sections": event.get("changed_sections") or [],
+        "previous_hash": event.get("previous_hash"),
+        "content_hash": event.get("content_hash"),
+    }
--- a/backend/app/api/routes/rag.py
+++ b/backend/app/api/routes/rag.py
@@ -5,10 +5,12 @@ from __future__ import annotations
 import json
 from typing import AsyncGenerator

-from fastapi import APIRouter
+from fastapi import APIRouter, Depends
 from fastapi.responses import StreamingResponse

+from app.api.dependencies.auth import get_current_user
 from app.config.settings import settings
+from app.domain.auth.models import UserClaims
 from app.schemas.rag import RagChatRequest, QuickQuestionsResponse, QuickQuestion
 from app.shared.async_utils import iter_in_thread
 from app.shared.bootstrap import get_agent_conversation_service
@@ -27,7 +29,10 @@ _DEFAULT_QUICK_QUESTIONS = [


@router.post("/chat")
-async def rag_chat(request: RagChatRequest):
+async def rag_chat(
+    request: RagChatRequest,
+    current_user: UserClaims = Depends(get_current_user),
+):
    """Stream RAG Q&A using the real agent service."""
    session_id, event_stream = get_agent_conversation_service().stream_chat(
        query=request.query,
--- a/backend/app/application/compliance/pipeline.py
+++ b/backend/app/application/compliance/pipeline.py
@@ -5,6 +5,7 @@ All functions are synchronous — call them via asyncio.to_thread() in async SSE

 from __future__ import annotations

+import asyncio
 import json
 import os
 import re
@@ -12,10 +13,20 @@ import tempfile
 from typing import TYPE_CHECKING

 from loguru import logger
+from tenacity import retry, retry_if_exception_type, stop_after_attempt, wait_exponential
+
+# Shared retry policy for LLM calls: 3 attempts, exponential back-off 1–4 s.
+_llm_retry = retry(
+    stop=stop_after_attempt(3),
+    wait=wait_exponential(multiplier=1, min=1, max=4),
+    retry=retry_if_exception_type((ValueError, TimeoutError, ConnectionError)),
+    reraise=True,
+)

 if TYPE_CHECKING:
    from app.application.knowledge import KnowledgeRetrievalService
    from app.domain.retrieval import RetrievedChunk
+    from app.domain.compliance.ports import AnalysisRecord, FindingRecord
    from app.services.llm.base_client import BaseLLMClient


@@ -109,17 +120,67 @@ def retrieve_for_clause(
    return retrieval_service.retrieve(query=clause, top_k=top_k, filters=domains)


+def process_single_clause(
+    clause: str,
+    index: int,
+    retrieval_service: "KnowledgeRetrievalService",
+    client: "BaseLLMClient",
+    top_k: int = 5,
+    domains: str | None = None,
+) -> dict:
+    """Process one clause: retrieve relevant regulations then check compliance.
+
+    Returns a dict with keys: index, chunks, finding (may be None on LLM failure).
+    Designed to run inside asyncio.to_thread() for parallel execution.
+    """
+    chunks = retrieve_for_clause(clause, retrieval_service, top_k, domains)
+    finding = check_clause_compliance(clause, chunks, client)
+    return {"index": index, "chunks": chunks, "finding": finding}
+
+
+async def run_clauses_parallel(
+    clauses: list[str],
+    retrieval_service: "KnowledgeRetrievalService",
+    client: "BaseLLMClient",
+    top_k: int = 5,
+    domains: str | None = None,
+) -> list[dict]:
+    """Run all clauses through retrieve+gap-check in parallel.
+
+    Results are returned in the original clause order even though processing
+    is concurrent. Exceptions in individual clauses are caught and returned as
+    dicts with finding=None so the stream continues for remaining clauses.
+
+    Both retrieval_service and client must be thread-safe — they are shared
+    across all asyncio.to_thread() calls without locking.
+    """
+    tasks = [
+        asyncio.to_thread(
+            process_single_clause,
+            clause, i, retrieval_service, client, top_k, domains,
+        )
+        for i, clause in enumerate(clauses)
+    ]
+    raw = await asyncio.gather(*tasks, return_exceptions=True)
+    results = []
+    for i, r in enumerate(raw):
+        if isinstance(r, Exception):
+            logger.warning("Clause {} processing failed: {}", i, r)
+            results.append({"index": i, "chunks": [], "finding": None})
+        else:
+            results.append(r)
+    return results
+
+
 def check_clause_compliance(
    clause: str,
    chunks: list["RetrievedChunk"],
    client: "BaseLLMClient",
 ) -> dict | None:
-    if not chunks:
-        return None
    reg_context = "\n".join(
        f"[{i+1}] {c.doc_title} {c.section_title or ''}: {c.text[:300]}"
        for i, c in enumerate(chunks[:5])
-    )
+    ) if chunks else "(no regulatory context retrieved)"
    prompt = (
        "You are a compliance expert. Judge whether the following business clause "
        "complies with the retrieved regulations.\n\n"
@@ -135,9 +196,19 @@ def check_clause_compliance(
        "status: ok=compliant, warn=gap exists, risk=critical/missing\n"
        "Return ONLY the JSON object."
    )
-    response = client.chat([{"role": "user", "content": prompt}], max_tokens=500)
-    if not response.is_success:
+
+    def _do_check():
+        resp = client.chat([{"role": "user", "content": prompt}], max_tokens=500)
+        if not resp.is_success:
+            raise ValueError("LLM returned non-success for gap check")
+        return resp
+
+    try:
+        response = _llm_retry(_do_check)()
+    except Exception as exc:
+        logger.warning("check_clause_compliance LLM call failed after retries: {}", exc)
        return None
+
    try:
        result = _extract_json(response.content)
        if isinstance(result, dict) and "status" in result:
@@ -182,12 +253,11 @@ def synthesize_conclusion(
        '    {"label": "Priority", "value": "High/Medium/Low", "risk": true}\n'
        '  ],\n'
        '  "risk_score": 0-100 (integer, higher=riskier),\n'
-        '  "highlight_terms": ["Key terms to highlight, max 10 terms"],\n'
+        '  "highlight_terms": ["term1", "term2"],  // up to 10 key technical/legal terms actually present in the text\n'
        '  "para_text": "Original text or summary (max 600 chars)"\n'
        "}\n"
        "Return ONLY the JSON object."
    )
-    response = client.chat([{"role": "user", "content": prompt}], max_tokens=1200)
    fallback = {
        "conclusion": "Compliance analysis complete. Review findings and create remediation plan.",
        "actions": [
@@ -198,8 +268,19 @@ def synthesize_conclusion(
        "highlight_terms": [],
        "para_text": para_text[:800],
    }
-    if not response.is_success:
+
+    def _do_synthesize():
+        resp = client.chat([{"role": "user", "content": prompt}], max_tokens=1200)
+        if not resp.is_success:
+            raise ValueError("LLM returned non-success for synthesis")
+        return resp
+
+    try:
+        response = _llm_retry(_do_synthesize)()
+    except Exception as exc:
+        logger.warning("synthesize_conclusion LLM call failed after retries: {}", exc)
        return fallback
+
    try:
        result = _extract_json(response.content)
        if isinstance(result, dict):
@@ -212,4 +293,78 @@ def synthesize_conclusion(
            }
    except (ValueError, TypeError) as exc:
        logger.warning("Conclusion synthesis JSON parse failed: {}", exc)
-    return fallback
+    return fallback
+
+
+_SUGGESTION_FOCUS = {
+    "risk": "Focus on remediation steps, required certifications, and timeline to resolve.",
+    "warn": "Focus on identifying the specific compliance gap and how to close it.",
+    "ok": "Focus on maintaining compliance evidence and monitoring future changes.",
+}
+
+_SUGGESTION_FALLBACK = {
+    "risk": [
+        "What specific certifications or documents are required to remediate this finding?",
+        "What is the typical remediation timeline for this type of non-compliance?",
+        "Which regulation clause defines the exact requirement?",
+    ],
+    "warn": [
+        "What is the exact gap between the current state and the requirement?",
+        "What evidence would demonstrate partial compliance?",
+        "Which regulation clause applies to this warning?",
+    ],
+    "ok": [
+        "What documentation should be maintained to evidence this compliance?",
+        "How should this area be monitored as regulations evolve?",
+        "Are there related clauses that may affect this compliant area?",
+    ],
+}
+
+
+def build_finding_context(finding: "FindingRecord", analysis: "AnalysisRecord") -> str:
+    """Build a grounded system context string for a finding chat thread.
+
+    Combines finding details with analysis metadata so the LLM has full
+    context without relying on the frontend to pass segment_context.
+    """
+    return (
+        f"Document: {analysis.doc_name}\n"
+        f"Standard: {analysis.standard_name}\n"
+        f"Finding [{finding.seq + 1}]: {finding.title}\n"
+        f"Status: {finding.status}\n"
+        f"Clause reference: {finding.clause_ref or 'N/A'}\n"
+        f"Description: {finding.description}\n"
+        f"Overall conclusion: {analysis.conclusion}\n"
+    )
+
+
+def generate_suggestions(
+    finding: "FindingRecord",
+    analysis: "AnalysisRecord",
+    client: "BaseLLMClient",
+) -> list[str]:
+    """Generate 3 context-aware follow-up questions for a finding chat thread.
+
+    Returns exactly 3 question strings. Falls back to static templates on error.
+    """
+    fallback = _SUGGESTION_FALLBACK.get(finding.status, _SUGGESTION_FALLBACK["warn"])
+    context = build_finding_context(finding, analysis)
+    focus = _SUGGESTION_FOCUS.get(finding.status, _SUGGESTION_FOCUS["warn"])
+    prompt = (
+        f"{context}\n\n"
+        f"Task: {focus}\n"
+        "Generate exactly 3 concise follow-up questions a compliance analyst would ask.\n"
+        'Return JSON: {"questions": ["question 1", "question 2", "question 3"]}\n'
+        "Return ONLY the JSON object."
+    )
+    response = client.chat([{"role": "user", "content": prompt}], max_tokens=300)
+    if not response.is_success:
+        return fallback
+    try:
+        result = _extract_json(response.content)
+        questions = result.get("questions", [])
+        if isinstance(questions, list) and len(questions) >= 3:
+            return [str(q) for q in questions[:3]]
+    except (ValueError, TypeError) as exc:
+        logger.warning("generate_suggestions JSON parse failed: {}", exc)
+    return fallback
--- a/backend/app/application/documents/services.py
+++ b/backend/app/application/documents/services.py
@@ -277,7 +277,6 @@ class DocumentCommandService:
            message="Document record created",
        )

-        temp_path = ""
        try:
            self.binary_store.save(
                object_name=object_name,
@@ -297,117 +296,20 @@ class DocumentCommandService:
                stage="store",
                message="Source file stored",
            )
-
-            suffix = os.path.splitext(file_name)[1]
-            with tempfile.NamedTemporaryFile(delete=False, suffix=suffix) as temp_file:
-                temp_file.write(content)
-                temp_path = temp_file.name
-
-            parsed_document = self.parser.parse(
-                file_path=temp_path,
+            # Delegate parse → embed → index to the shared processing method.
+            # This same method is invoked by the Celery worker for async processing.
+            return self._process_document(
                doc_id=doc_id,
-                doc_name=final_doc_name,
-            )
-            self._safe_mark_run_parsed(doc_id=doc_id, run_id=run_id, parsed_document=parsed_document)
-
-            artifact_keys: dict[str, str] = {}
-            try:
-                artifact_keys = self._save_parse_artifacts(doc_id=doc_id, parsed_document=parsed_document)
-            except Exception:
-                logger.warning("Parse artifact binary persistence failed for doc_id={}", doc_id)
-            self.document_repository.update_status(
-                doc_id,
-                DocumentStatus.PARSED,
-                parser_name=parsed_document.parser_name,
-                metadata={
-                    "parser_backend": parsed_document.parser_name,
-                    "parse_task_id": parsed_document.metadata.get("task_id", ""),
-                    "layout_count": parsed_document.metadata.get("layout_count", len(parsed_document.raw_layouts)),
-                    "structure_node_count": len(parsed_document.structure_nodes),
-                    "semantic_block_count": len(parsed_document.semantic_blocks),
-                    "vector_chunk_count": len(parsed_document.vector_chunks),
-                    "artifact_keys": artifact_keys,
-                    "processing_stage": "parsed",
-                },
-            )
-            current_status = DocumentStatus.PARSED
-            current_stage = "embed"
-            self._safe_replace_processing_artifacts(doc_id=doc_id, run_id=run_id, artifact_keys=artifact_keys)
-            self._safe_append_status_event(
-                doc_id=doc_id,
-                run_id=run_id,
-                from_status=DocumentStatus.STORED.value,
-                to_status=DocumentStatus.PARSED.value,
-                stage="parse",
-                message="Document parsed",
-                metadata={"artifact_count": len(artifact_keys)},
-            )
-            if self.parse_artifact_store:
-                try:
-                    self.parse_artifact_store.save(
-                        doc_id,
-                        parsed_document.structure_nodes,
-                        parsed_document.semantic_blocks,
-                    )
-                except Exception:
-                    logger.warning("ParseArtifactStore.save failed for doc_id={}", doc_id)
-
-            chunks = self.chunk_builder.build(
-                parsed_document=parsed_document,
+                file_name=file_name,
+                final_doc_name=final_doc_name,
+                content=content,
                regulation_type=regulation_type,
                version=version,
-            )
-            if not chunks:
-                raise ValueError("解析完成但没有生成可入库的 chunks")
-
-            vectors = self.embedding_provider.embed_texts([chunk.embedding_text for chunk in chunks])
-            current_stage = "index"
-            inserted = self.vector_index.upsert(chunks, vectors)
-            if inserted != len(chunks):
-                logger.warning("Milvus upsert count mismatched: inserted={}, chunks={}", inserted, len(chunks))
-
-            health = self.vector_index.health()
-            self.document_repository.update_status(
-                doc_id,
-                DocumentStatus.INDEXED,
-                chunk_count=len(chunks),
-                summary="",
-                summary_latency_ms=0,
-                index_name=health.get("collection_name", ""),
-                metadata={
-                    "index_collection": health.get("collection_name", ""),
-                    "processing_stage": "indexed",
-                },
-            )
-            current_status = DocumentStatus.INDEXED
-            index_name = health.get("collection_name", "")
-            self._safe_mark_run_indexed(
-                doc_id=doc_id,
+                generate_summary=generate_summary,
                run_id=run_id,
-                chunk_count=len(chunks),
-                index_name=index_name,
-            )
-            self._safe_append_status_event(
-                doc_id=doc_id,
-                run_id=run_id,
-                from_status=DocumentStatus.PARSED.value,
-                to_status=DocumentStatus.INDEXED.value,
-                stage="index",
-                message="Document indexed",
-                metadata={"chunk_count": len(chunks), "index_name": index_name},
-            )
-            stored = self.document_repository.get(doc_id)
-            return DocumentProcessResult(
-                doc_id=doc_id,
-                doc_name=final_doc_name,
-                status=(stored.status.value if stored else DocumentStatus.INDEXED.value),
-                message="处理成功",
-                num_chunks=len(chunks),
-                summary=stored.summary if stored else "",
-                summary_latency_ms=stored.summary_latency_ms if stored else 0,
            )
        except Exception as exc:
-            logger.exception("文档处理失败: doc_id={}", doc_id)
+            logger.exception("文档存储失败: doc_id={}", doc_id)
            failure_stage = current_stage
            self.document_repository.update_status(
                doc_id,
@@ -439,6 +341,183 @@ class DocumentCommandService:
                status=DocumentStatus.FAILED.value,
                message=f"文档处理失败: {exc}",
            )
+
+    def store_document(
+        self,
+        *,
+        doc_id: str | None = None,
+        file_name: str,
+        content: bytes,
+        content_type: str,
+        doc_name: str | None,
+        regulation_type: str,
+        version: str,
+        generate_summary: bool,
+    ) -> tuple[str, str | None]:
+        """Store the binary file and create the Document record.
+
+        Returns (doc_id, run_id). Does NOT parse, embed, or index.
+        This is the fast synchronous first step; processing is enqueued separately.
+        The caller is responsible for enqueuing the follow-up process_document_task.
+        """
+        doc_id = doc_id or str(uuid.uuid4())[:8]
+        final_doc_name = doc_name or file_name
+        object_name = f"{doc_id}/{file_name}"
+
+        document = Document(
+            doc_id=doc_id,
+            doc_name=final_doc_name,
+            file_name=file_name,
+            object_name=object_name,
+            content_type=content_type,
+            size_bytes=len(content),
+            regulation_type=regulation_type,
+            version=version,
+            metadata={"generate_summary": generate_summary},
+        )
+        self.document_repository.create(document)
+        run_id = self._safe_create_processing_run(
+            doc_id=doc_id, trigger_type="upload", generate_summary=generate_summary
+        )
+        self.binary_store.save(
+            object_name=object_name, data=content,
+            content_type=content_type, metadata={"doc_id": doc_id},
+        )
+        self.document_repository.update_status(doc_id, DocumentStatus.STORED)
+        self._safe_mark_run_stored(doc_id=doc_id, run_id=run_id)
+        self._safe_append_status_event(
+            doc_id=doc_id, run_id=run_id,
+            from_status=DocumentStatus.PENDING.value, to_status=DocumentStatus.STORED.value,
+            stage="store", message="Source file stored",
+        )
+        return doc_id, run_id
+
+    def _process_document(
+        self,
+        *,
+        doc_id: str,
+        file_name: str,
+        final_doc_name: str,
+        content: bytes,
+        regulation_type: str,
+        version: str,
+        generate_summary: bool,
+        run_id: str | None = None,
+    ) -> DocumentProcessResult:
+        """Run parse → chunk → embed → index for a document that is already stored.
+
+        Called both synchronously (from upload_and_process) and asynchronously
+        (from the Celery process_document_task worker). All side-effects write
+        through DocumentProcessingStore so callers can poll progress.
+        """
+        current_status = DocumentStatus.STORED
+        current_stage = "parse"
+        temp_path = ""
+        try:
+            suffix = os.path.splitext(file_name)[1]
+            with tempfile.NamedTemporaryFile(delete=False, suffix=suffix) as temp_file:
+                temp_file.write(content)
+                temp_path = temp_file.name
+
+            parsed_document = self.parser.parse(
+                file_path=temp_path,
+                doc_id=doc_id,
+                doc_name=final_doc_name,
+            )
+            self._safe_mark_run_parsed(doc_id=doc_id, run_id=run_id, parsed_document=parsed_document)
+
+            artifact_keys: dict[str, str] = {}
+            try:
+                artifact_keys = self._save_parse_artifacts(doc_id=doc_id, parsed_document=parsed_document)
+            except Exception:
+                logger.warning("Parse artifact binary persistence failed for doc_id={}", doc_id)
+
+            self.document_repository.update_status(
+                doc_id,
+                DocumentStatus.PARSED,
+                parser_name=parsed_document.parser_name,
+                metadata={
+                    "parser_backend": parsed_document.parser_name,
+                    "parse_task_id": parsed_document.metadata.get("task_id", ""),
+                    "layout_count": parsed_document.metadata.get("layout_count", len(parsed_document.raw_layouts)),
+                    "structure_node_count": len(parsed_document.structure_nodes),
+                    "semantic_block_count": len(parsed_document.semantic_blocks),
+                    "vector_chunk_count": len(parsed_document.vector_chunks),
+                    "artifact_keys": artifact_keys,
+                    "processing_stage": "parsed",
+                },
+            )
+            current_status = DocumentStatus.PARSED
+            current_stage = "embed"
+            self._safe_replace_processing_artifacts(doc_id=doc_id, run_id=run_id, artifact_keys=artifact_keys)
+            self._safe_append_status_event(
+                doc_id=doc_id, run_id=run_id,
+                from_status=DocumentStatus.STORED.value, to_status=DocumentStatus.PARSED.value,
+                stage="parse", message="Document parsed", metadata={"artifact_count": len(artifact_keys)},
+            )
+            if self.parse_artifact_store:
+                try:
+                    self.parse_artifact_store.save(
+                        doc_id, parsed_document.structure_nodes, parsed_document.semantic_blocks,
+                    )
+                except Exception:
+                    logger.warning("ParseArtifactStore.save failed for doc_id={}", doc_id)
+
+            chunks = self.chunk_builder.build(
+                parsed_document=parsed_document,
+                regulation_type=regulation_type,
+                version=version,
+            )
+            if not chunks:
+                raise ValueError("解析完成但没有生成可入库的 chunks")
+
+            vectors = self.embedding_provider.embed_texts([chunk.embedding_text for chunk in chunks])
+            current_stage = "index"
+            inserted = self.vector_index.upsert(chunks, vectors)
+            if inserted != len(chunks):
+                logger.warning("Milvus upsert count mismatched: inserted={}, chunks={}", inserted, len(chunks))
+
+            health = self.vector_index.health()
+            index_name = health.get("collection_name", "")
+            self.document_repository.update_status(
+                doc_id, DocumentStatus.INDEXED,
+                chunk_count=len(chunks), summary="", summary_latency_ms=0,
+                index_name=index_name,
+                metadata={"index_collection": index_name, "processing_stage": "indexed"},
+            )
+            self._safe_mark_run_indexed(doc_id=doc_id, run_id=run_id, chunk_count=len(chunks), index_name=index_name)
+            self._safe_append_status_event(
+                doc_id=doc_id, run_id=run_id,
+                from_status=DocumentStatus.PARSED.value, to_status=DocumentStatus.INDEXED.value,
+                stage="index", message="Document indexed",
+                metadata={"chunk_count": len(chunks), "index_name": index_name},
+            )
+            stored = self.document_repository.get(doc_id)
+            return DocumentProcessResult(
+                doc_id=doc_id, doc_name=final_doc_name,
+                status=(stored.status.value if stored else DocumentStatus.INDEXED.value),
+                message="处理成功", num_chunks=len(chunks),
+                summary=stored.summary if stored else "",
+                summary_latency_ms=stored.summary_latency_ms if stored else 0,
+            )
+        except Exception as exc:
+            logger.exception("文档处理失败: doc_id={}", doc_id)
+            self.document_repository.update_status(
+                doc_id, DocumentStatus.FAILED, error_message=str(exc),
+                metadata={"failure_reason": str(exc), "processing_stage": "failed", "failure_stage": current_stage},
+            )
+            self._safe_mark_run_failed(
+                doc_id=doc_id, run_id=run_id, failure_stage=current_stage, error_message=str(exc)
+            )
+            self._safe_append_status_event(
+                doc_id=doc_id, run_id=run_id,
+                from_status=current_status.value, to_status=DocumentStatus.FAILED.value,
+                stage=current_stage, message=str(exc),
+            )
+            return DocumentProcessResult(
+                doc_id=doc_id, doc_name=final_doc_name,
+                status=DocumentStatus.FAILED.value, message=f"文档处理失败: {exc}",
+            )
        finally:
            if temp_path and os.path.exists(temp_path):
                try:
@@ -446,7 +525,6 @@ class DocumentCommandService:
                except OSError:
                    logger.warning("临时文件清理失败: {}", temp_path)

-
    def delete(self, doc_id: str) -> bool:
        """Delete document record, binary file, and vector chunks."""
        document = self.document_repository.get(doc_id)
--- a/backend/app/application/perception/crawl_service.py
+++ b/backend/app/application/perception/crawl_service.py
@@ -0,0 +1,147 @@
+"""Orchestrates regulatory source crawlers and LLM enrichment pipeline."""
+
+from __future__ import annotations
+
+import hashlib
+from typing import Any, Generator
+
+from loguru import logger
+
+from app.infrastructure.perception.base_event_store import BaseEventStore
+from app.infrastructure.perception.crawlers.base import BaseCrawler, RawEvent
+from app.infrastructure.perception.llm_pipeline import LlmPipeline
+
+
+def _event_id(source: str, standard_code: str) -> str:
+    """Deterministic 12-char ID from source + standard_code."""
+    return hashlib.sha256(f"{source}-{standard_code}".encode()).hexdigest()[:12]
+
+
+def _content_hash(raw_text: str) -> str:
+    return hashlib.sha256(raw_text.encode()).hexdigest()
+
+
+def _raw_to_dict(raw: RawEvent, event_id: str, content_hash: str) -> dict:
+    return {
+        "id": event_id,
+        "source": raw.source,
+        "source_label": raw.source_label,
+        "standard_code": raw.standard_code,
+        "title": raw.title,
+        "summary": raw.summary,
+        "full_text_url": raw.full_text_url,
+        "status": raw.status,
+        "impact_level": "medium",
+        "published_at": raw.published_at,
+        "effective_at": raw.effective_at,
+        "category": raw.category,
+        "tags": raw.tags,
+        "content_hash": content_hash,
+        "previous_hash": None,
+    }
+
+
+class CrawlService:
+    """Orchestrate crawlers, hash-based change detection, and LLM enrichment."""
+
+    def __init__(
+        self,
+        crawlers: dict[str, BaseCrawler],
+        event_store: BaseEventStore,
+        llm_pipeline: LlmPipeline,
+        retrieval_service: Any,
+    ) -> None:
+        self._crawlers = crawlers
+        self._store = event_store
+        self._pipeline = llm_pipeline
+        self._retrieval = retrieval_service
+
+    def run_crawl(
+        self, sources: list[str] | None = None
+    ) -> Generator[dict, None, None]:
+        """Run crawl for selected sources. Yields SSE-ready progress dicts."""
+        targets = sources or list(self._crawlers.keys())
+        total_new = 0
+        total_updated = 0
+
+        for source_key in targets:
+            crawler = self._crawlers.get(source_key)
+            if not crawler:
+                yield {"event": "error", "data": f"Unknown source: {source_key}"}
+                continue
+
+            yield {"event": "progress", "data": {"source": source_key, "stage": "fetching"}}
+            try:
+                raw_events = crawler.fetch(limit=100)
+            except Exception as exc:
+                logger.exception("Crawler failed source={}", source_key)
+                yield {"event": "error", "data": {"source": source_key, "message": str(exc)}}
+                continue
+
+            yield {
+                "event": "progress",
+                "data": {"source": source_key, "stage": "processing", "fetched": len(raw_events)},
+            }
+
+            new_count = 0
+            updated_count = 0
+
+            for raw in raw_events:
+                eid = _event_id(raw.source, raw.standard_code)
+                new_hash = _content_hash(raw.raw_text or raw.title)
+                existing = self._store.get(eid)
+
+                if existing and existing.get("content_hash") == new_hash:
+                    continue
+
+                is_update = existing is not None
+                old_text = existing.get("summary", "") if is_update else ""
+                previous_hash = existing.get("content_hash") if is_update else None
+
+                event_dict = _raw_to_dict(raw, eid, new_hash)
+                event_dict["previous_hash"] = previous_hash
+
+                try:
+                    structure = self._pipeline.extract_structure(event_dict)
+                    event_dict.update(structure)
+                except Exception as exc:
+                    logger.warning("Structure extraction failed id={} err={}", eid, exc)
+
+                try:
+                    affected = self._pipeline.assess_impact(event_dict, self._retrieval)
+                    event_dict["affected_docs"] = affected
+                except Exception as exc:
+                    logger.warning("Impact assessment failed id={} err={}", eid, exc)
+
+                if is_update and old_text and raw.raw_text:
+                    try:
+                        diff = self._pipeline.compute_diff(old_text, raw.raw_text)
+                        event_dict["change_summary"] = diff.get("change_summary")
+                        event_dict["changed_sections"] = diff.get("changed_sections")
+                    except Exception as exc:
+                        logger.warning("Diff failed id={} err={}", eid, exc)
+
+                self._store.upsert(event_dict)
+
+                if is_update:
+                    updated_count += 1
+                else:
+                    new_count += 1
+
+            total_new += new_count
+            total_updated += updated_count
+
+            yield {
+                "event": "progress",
+                "data": {
+                    "source": source_key,
+                    "stage": "done",
+                    "new": new_count,
+                    "updated": updated_count,
+                },
+            }
+
+        yield {
+            "event": "done",
+            "data": {"total_new": total_new, "total_updated": total_updated},
+        }
--- a/backend/app/application/perception/services.py
+++ b/backend/app/application/perception/services.py
@@ -6,7 +6,7 @@ import json
 from typing import Generator

 from app.application.knowledge.services import KnowledgeRetrievalService
-from app.infrastructure.perception.mock_event_store import MockEventStore
+from app.infrastructure.perception.base_event_store import BaseEventStore
 from app.services.llm.llm_factory import get_llm_client
 from app.config.settings import settings

@@ -22,7 +22,7 @@ class PerceptionService:

    def __init__(
        self,
-        event_store: MockEventStore,
+        event_store: BaseEventStore,
        retrieval_service: KnowledgeRetrievalService,
    ) -> None:
        self._store = event_store
--- a/backend/app/config/settings.py
+++ b/backend/app/config/settings.py
@@ -82,6 +82,22 @@ class Settings(BaseSettings):
    parser_backend: str = Field(default="aliyun", description="解析后端(local/aliyun)")
    chunk_backend: str = Field(default="aliyun", description="分块后端(local/aliyun)")
    document_repository_backend: str = Field(default="json", description="文档元数据存储后端 (json/postgres)")
+    # When True, document processing is enqueued to Celery workers via Redis.
+    # When False (default), processing runs in a FastAPI BackgroundTask in the same process —
+    # no external worker needed. Switch to True only when a Celery worker is running.
+    use_celery_worker: bool = Field(default=False, description="使用 Celery Worker 异步处理文档 (需要 Worker 运行中)")
+
+    # ── Perception crawl ──────────────────────────────────────────────────────
+    perception_crawl_timeout_seconds: int = Field(
+        default=120, description="HTTP timeout for regulatory source crawlers."
+    )
+    perception_max_events_per_source: int = Field(
+        default=100, description="Maximum events fetched per source per crawl run."
+    )
+    perception_diff_similarity_threshold: float = Field(
+        default=0.85,
+        description="Cosine similarity below which a paragraph is flagged as changed.",
+    )

    # Keep configuration setup explicit so runtime behavior is easy to reason about.
    api_host: str = Field(default="0.0.0.0", description="API服务地址")
@@ -109,6 +125,7 @@ class Settings(BaseSettings):
    rag_retrieval_top_k: int = Field(default=20, description="精排前召回候选数量（reranker 启用时生效）")
    rag_max_context_tokens: int = Field(default=2000, description="RAG最大上下文token数")
    rag_summary_max_tokens: int = Field(default=10240, description="文档摘要最大token数")
+    rag_skills_max_tokens: int = Field(default=2048, description="技能类 RAG 最大 token 数")

    reranker_enabled: bool = Field(default=False, description="是否启用 Cross-Encoder 精排")
    reranker_base_url: str = Field(default="", description="Reranker API 地址")
@@ -124,6 +141,26 @@ class Settings(BaseSettings):
    # Keep configuration setup explicit so runtime behavior is easy to reason about.
    session_max_sessions: int = Field(default=100, description="最大会话数量")
    session_timeout_minutes: int = Field(default=30, description="会话超时时间(分钟)")
+    session_backend: str = Field(
+        default="memory",
+        description="会话存储后端 (memory | redis)。redis 需要 Redis 可用。",
+    )
+
+    # ── Auth ──────────────────────────────────────────────────────────────────
+    # Generate a strong secret: python -c "import secrets; print(secrets.token_hex(32))"
+    auth_secret_key: str = Field(
+        default="change-me-in-production-must-be-32-or-more-characters-long",
+        description="JWT signing secret. MUST be changed in production.",
+    )
+    auth_algorithm: str = Field(default="HS256", description="JWT signing algorithm.")
+    auth_token_expire_minutes: int = Field(default=480, description="JWT TTL in minutes (default 8 hours).")
+    auth_enabled: bool = Field(default=True, description="Set False to bypass auth (development only).")
+
+    # ── CORS ──────────────────────────────────────────────────────────────────
+    cors_allow_origins: str = Field(
+        default="http://localhost:5173",
+        description="Comma-separated allowed CORS origins. Never use * in production.",
+    )

@lru_cache
 def get_settings() -> Settings:
--- a/backend/app/domain/auth/init.py
+++ b/backend/app/domain/auth/init.py
@@ -0,0 +1,10 @@
+"""Auth domain: role definitions and token claim models.
+
+The domain layer defines what a user identity looks like (UserClaims) and
+what roles exist (UserRole). Infrastructure details (JWT, bcrypt, PostgreSQL)
+live under infrastructure/auth and never leak into this package.
+"""
+
+from .models import UserClaims, UserRole
+
+__all__ = ["UserClaims", "UserRole"]
--- a/backend/app/domain/auth/models.py
+++ b/backend/app/domain/auth/models.py
@@ -0,0 +1,42 @@
+"""Auth domain models: roles and token claims.
+
+UserRole defines the four roles from PPT Slide 12.
+UserClaims is what the JWT decodes to — it is the identity object passed
+through FastAPI dependency injection to route handlers.
+"""
+
+from __future__ import annotations
+
+import enum
+from dataclasses import dataclass
+
+
+class UserRole(str, enum.Enum):
+    """Access roles mirroring the four-role RBAC matrix from the product spec.
+
+    ADMIN      — full platform access including system management.
+    LEGAL      — knowledge query, document review, compliance checks.
+    EHS        — knowledge query, perception/regulatory signals.
+    READONLY   — knowledge query only.
+    """
+
+    ADMIN = "admin"
+    LEGAL = "legal"
+    EHS = "ehs"
+    READONLY = "readonly"
+
+
+@dataclass
+class UserClaims:
+    """Decoded JWT payload representing an authenticated user.
+
+    Instances are created by JWTHandler.decode_token() and injected into
+    route handlers via the get_current_user FastAPI dependency.
+    """
+
+    # Unique user identifier (UUID string stored in PostgreSQL users table).
+    user_id: str
+    # Display name used for audit log entries.
+    username: str
+    # Role determines which resources the user may access.
+    role: UserRole
--- a/backend/app/domain/compliance/init.py
+++ b/backend/app/domain/compliance/init.py
--- a/backend/app/domain/compliance/ports.py
+++ b/backend/app/domain/compliance/ports.py
@@ -0,0 +1,66 @@
+"""Domain ports for compliance history persistence."""
+from __future__ import annotations
+
+from abc import ABC, abstractmethod
+from dataclasses import dataclass, field
+from datetime import datetime
+from typing import Optional
+
+
+@dataclass
+class FindingRecord:
+    """Single finding row linked to an analysis."""
+    id: str
+    analysis_id: str
+    seq: int
+    title: str
+    description: str
+    status: str          # "ok" | "warn" | "risk"
+    clause_ref: Optional[str] = None
+
+
+@dataclass
+class AnalysisRecord:
+    """Full compliance analysis record with nested findings."""
+    id: str              # UUID string; empty string means not yet persisted
+    created_at: datetime
+    created_by: Optional[str]
+    doc_name: str
+    standard_name: str
+    risk_score: int
+    conclusion: str
+    actions: list        # list[dict] — serialised action items
+    para_text: str
+    highlight_terms: list  # list[str]
+    findings: list[FindingRecord] = field(default_factory=list)
+
+
+class ComplianceRepository(ABC):
+    """Port for persisting and retrieving compliance analysis records."""
+
+    @abstractmethod
+    def save_analysis(self, record: AnalysisRecord) -> str:
+        """Persist a new analysis record and return the assigned UUID string."""
+
+    @abstractmethod
+    def list_analyses(self, limit: int = 50, offset: int = 0) -> list[AnalysisRecord]:
+        """Return analyses ordered by created_at DESC, without nested findings."""
+
+    @abstractmethod
+    def get_analysis(self, analysis_id: str) -> Optional[AnalysisRecord]:
+        """Return a single analysis with all nested findings, or None."""
+
+    @abstractmethod
+    def delete_analysis(self, analysis_id: str) -> None:
+        """Delete an analysis and all related findings and chat messages (cascade)."""
+
+    @abstractmethod
+    def save_message(self, analysis_id: str, finding_id: str, role: str, content: str) -> str:
+        """Persist a chat message and return its UUID string."""
+
+    @abstractmethod
+    def get_messages(self, finding_id: str) -> list[dict]:
+        """Return chat messages for a finding ordered by created_at ASC.
+
+        Each dict has keys: id, role, content, created_at (ISO string).
+        """
--- a/backend/app/infrastructure/auth/init.py
+++ b/backend/app/infrastructure/auth/init.py
@@ -0,0 +1,5 @@
+"""JWT token creation and validation infrastructure.
+
+JWTHandler is the only component in this package. It is wired through
+shared/bootstrap.py and injected into FastAPI dependencies.
+"""
--- a/backend/app/infrastructure/auth/jwt_handler.py
+++ b/backend/app/infrastructure/auth/jwt_handler.py
@@ -0,0 +1,82 @@
+"""JWT access token creation and decoding.
+
+Uses python-jose for HS256 token signing. Token expiry is enforced at
+decode time so expired tokens are rejected even if the signature is valid.
+"""
+
+from __future__ import annotations
+
+from datetime import UTC, datetime, timedelta
+from typing import Any
+
+from jose import JWTError, jwt
+from loguru import logger
+
+from app.domain.auth.models import UserClaims, UserRole
+
+
+class JWTHandler:
+    """Create and validate HS256 JWT access tokens.
+
+    A single shared instance is wired by bootstrap.py. Use
+    get_jwt_handler() from shared.bootstrap for all token operations.
+    """
+
+    def __init__(
+        self,
+        *,
+        secret_key: str,
+        algorithm: str = "HS256",
+        expire_minutes: int = 480,
+    ) -> None:
+        """Initialise the handler with signing credentials and token lifetime."""
+        self._secret = secret_key
+        self._algorithm = algorithm
+        self._expire_minutes = expire_minutes
+
+    def create_access_token(
+        self,
+        *,
+        user_id: str,
+        username: str,
+        role: str,
+    ) -> str:
+        """Return a signed JWT containing user identity and role claims."""
+        now = datetime.now(UTC)
+        payload: dict[str, Any] = {
+            "sub": user_id,
+            "username": username,
+            "role": role,
+            "iat": now,
+            "exp": now + timedelta(minutes=self._expire_minutes),
+        }
+        return jwt.encode(payload, self._secret, algorithm=self._algorithm)
+
+    def decode_token(self, token: str) -> UserClaims:
+        """Decode and validate a JWT, returning UserClaims.
+
+        Raises ValueError with a descriptive message on expiry, tampering,
+        or any other validation failure so callers do not need to know jose.
+        """
+        try:
+            payload = jwt.decode(token, self._secret, algorithms=[self._algorithm])
+        except JWTError as exc:
+            msg = str(exc).lower()
+            if "expired" in msg:
+                raise ValueError("Token expired") from exc
+            raise ValueError(f"Invalid token: {exc}") from exc
+
+        user_id = payload.get("sub")
+        username = payload.get("username", "")
+        role_str = payload.get("role", UserRole.READONLY.value)
+
+        if not user_id:
+            raise ValueError("Token missing subject claim")
+
+        try:
+            role = UserRole(role_str)
+        except ValueError:
+            logger.warning("Unknown role in token: {}, defaulting to readonly", role_str)
+            role = UserRole.READONLY
+
+        return UserClaims(user_id=user_id, username=username, role=role)
--- a/backend/app/infrastructure/auth/user_store.py
+++ b/backend/app/infrastructure/auth/user_store.py
@@ -0,0 +1,113 @@
+"""PostgreSQL-backed user store for authentication.
+
+Manages a `users` table with hashed passwords and roles.
+Provides lookup by username for the login flow.
+Table DDL is auto-applied on first connection.
+"""
+
+from __future__ import annotations
+
+from dataclasses import dataclass
+from typing import Optional
+
+import psycopg2
+import psycopg2.extras
+from loguru import logger
+from passlib.context import CryptContext
+
+from app.config.settings import settings
+
+
+# bcrypt context — work factor 12 is a good production default.
+_PWD_CTX = CryptContext(schemes=["bcrypt"], deprecated="auto")
+
+# DDL executed once to ensure the table exists.
+_CREATE_TABLE_SQL = """
+CREATE TABLE IF NOT EXISTS users (
+    id          UUID        PRIMARY KEY DEFAULT gen_random_uuid(),
+    username    VARCHAR(100) UNIQUE NOT NULL,
+    hashed_pw   TEXT         NOT NULL,
+    role        VARCHAR(50)  NOT NULL DEFAULT 'readonly',
+    is_active   BOOLEAN      NOT NULL DEFAULT TRUE,
+    created_at  TIMESTAMPTZ  NOT NULL DEFAULT NOW()
+);
+"""
+
+
+@dataclass
+class UserRecord:
+    """A single row from the users table."""
+
+    id: str
+    username: str
+    hashed_pw: str
+    role: str
+    is_active: bool
+
+
+class PostgresUserStore:
+    """Read and verify users stored in the PostgreSQL users table.
+
+    The connection is opened on first use and shared for the lifetime
+    of the singleton instance wired by bootstrap.
+    """
+
+    def __init__(self) -> None:
+        """Initialise the store and ensure the users table exists."""
+        self._conn = psycopg2.connect(
+            host=settings.postgres_host,
+            port=settings.postgres_port,
+            user=settings.postgres_user,
+            password=settings.postgres_password,
+            dbname=settings.postgres_db,
+            cursor_factory=psycopg2.extras.RealDictCursor,
+        )
+        self._conn.autocommit = True
+        self._ensure_table()
+
+    def _ensure_table(self) -> None:
+        """Create the users table if it does not already exist."""
+        with self._conn.cursor() as cur:
+            # Enable pgcrypto so gen_random_uuid() is available for UUID primary keys.
+            try:
+                cur.execute("CREATE EXTENSION IF NOT EXISTS pgcrypto;")
+            except Exception:
+                self._conn.rollback()
+            cur.execute(_CREATE_TABLE_SQL)
+
+    def get_by_username(self, username: str) -> Optional[UserRecord]:
+        """Return a UserRecord for the given username, or None if not found."""
+        with self._conn.cursor() as cur:
+            cur.execute(
+                "SELECT id, username, hashed_pw, role, is_active "
+                "FROM users WHERE username = %s",
+                (username,),
+            )
+            row = cur.fetchone()
+        if row is None:
+            return None
+        return UserRecord(
+            id=str(row["id"]),
+            username=row["username"],
+            hashed_pw=row["hashed_pw"],
+            role=row["role"],
+            is_active=row["is_active"],
+        )
+
+    def verify_password(self, plain: str, hashed: str) -> bool:
+        """Return True if `plain` matches the stored bcrypt hash."""
+        return _PWD_CTX.verify(plain, hashed)
+
+    def authenticate(self, username: str, password: str) -> Optional[UserRecord]:
+        """Return the UserRecord if credentials are valid, else None."""
+        user = self.get_by_username(username)
+        if user is None or not user.is_active:
+            return None
+        if not self.verify_password(password, user.hashed_pw):
+            return None
+        return user
+
+    @staticmethod
+    def hash_password(plain: str) -> str:
+        """Hash a plain-text password with bcrypt."""
+        return _PWD_CTX.hash(plain)
--- a/backend/app/infrastructure/compliance/init.py
+++ b/backend/app/infrastructure/compliance/init.py
--- a/backend/app/infrastructure/compliance/docx_export.py
+++ b/backend/app/infrastructure/compliance/docx_export.py
@@ -0,0 +1,101 @@
+"""DOCX report generator for compliance analysis results.
+
+Uses python-docx (already in requirements.txt). Returns raw bytes so the
+caller can stream the response without writing to disk.
+"""
+from __future__ import annotations
+
+from datetime import datetime, timezone
+from io import BytesIO
+
+from docx import Document
+from docx.shared import Pt, RGBColor
+from docx.enum.text import WD_ALIGN_PARAGRAPH
+
+from app.domain.compliance.ports import AnalysisRecord
+
+_STATUS_LABEL = {"ok": "Compliant", "warn": "Warning", "risk": "Non-Compliant"}
+_STATUS_COLOR = {
+    "ok": RGBColor(0x22, 0x8B, 0x22),
+    "warn": RGBColor(0xFF, 0x8C, 0x00),
+    "risk": RGBColor(0xDC, 0x14, 0x3C),
+}
+
+
+def generate_docx(record: AnalysisRecord) -> bytes:
+    """Generate a compliance report DOCX and return its raw bytes.
+
+    Structure:
+    - Cover: document name, standard, date, risk score
+    - Executive summary (conclusion)
+    - Findings table
+    - Recommended actions
+    - Footer note
+    """
+    doc = Document()
+
+    # ── Cover ──────────────────────────────────────────────────────────────────
+    title_para = doc.add_heading("Compliance Analysis Report", level=0)
+    title_para.alignment = WD_ALIGN_PARAGRAPH.CENTER
+
+    doc.add_paragraph("")
+    meta_table = doc.add_table(rows=4, cols=2)
+    meta_table.style = "Table Grid"
+    labels = ["Document", "Standard", "Date", "Risk Score"]
+    values = [
+        record.doc_name,
+        record.standard_name,
+        record.created_at.strftime("%Y-%m-%d %H:%M UTC") if record.created_at else "",
+        f"{record.risk_score} / 100",
+    ]
+    for i, (label, value) in enumerate(zip(labels, values)):
+        meta_table.cell(i, 0).text = label
+        meta_table.cell(i, 1).text = value
+
+    # ── Executive Summary ──────────────────────────────────────────────────────
+    doc.add_heading("Executive Summary", level=1)
+    doc.add_paragraph(record.conclusion)
+
+    # ── Findings ───────────────────────────────────────────────────────────────
+    doc.add_heading("Findings", level=1)
+    if record.findings:
+        table = doc.add_table(rows=1, cols=4)
+        table.style = "Table Grid"
+        hdr = table.rows[0].cells
+        for i, h in enumerate(["#", "Status", "Title", "Description / Clause"]):
+            hdr[i].text = h
+            for run in hdr[i].paragraphs[0].runs:
+                run.bold = True
+
+        for f in record.findings:
+            row = table.add_row().cells
+            row[0].text = str(f.seq + 1)
+            row[1].text = _STATUS_LABEL.get(f.status, f.status)
+            row[2].text = f.title
+            desc = f.description
+            if f.clause_ref:
+                desc += f"\n[{f.clause_ref}]"
+            row[3].text = desc
+    else:
+        doc.add_paragraph("No findings recorded.")
+
+    # ── Recommended Actions ────────────────────────────────────────────────────
+    doc.add_heading("Recommended Actions", level=1)
+    for i, action in enumerate(record.actions, start=1):
+        label = action.get("label", "Action")
+        value = action.get("value", "")
+        doc.add_paragraph(f"{i}. {label}: {value}", style="List Number")
+
+    # ── Footer note ────────────────────────────────────────────────────────────
+    doc.add_paragraph("")
+    footer = doc.add_paragraph(
+        f"Generated by AI Regulation Analysis System — {datetime.now(timezone.utc).strftime('%Y-%m-%d')}"
+    )
+    footer.alignment = WD_ALIGN_PARAGRAPH.CENTER
+    for run in footer.runs:
+        run.font.size = Pt(8)
+        run.font.color.rgb = RGBColor(0x88, 0x88, 0x88)
+
+    buf = BytesIO()
+    doc.save(buf)
+    return buf.getvalue()
--- a/backend/app/infrastructure/compliance/repository.py
+++ b/backend/app/infrastructure/compliance/repository.py
@@ -0,0 +1,280 @@
+# backend/app/infrastructure/compliance/repository.py
+"""PostgreSQL-backed compliance analysis repository.
+
+Follows the same psycopg2 pattern as PostgresDocumentRepository:
+ThreadedConnectionPool + RealDictCursor for reads, _ensure_schema on init.
+"""
+from __future__ import annotations
+
+import json
+from contextlib import contextmanager
+from datetime import datetime
+from typing import Optional
+
+import psycopg2
+import psycopg2.extras
+import psycopg2.pool
+from loguru import logger
+
+from app.domain.compliance.ports import (
+    AnalysisRecord,
+    ComplianceRepository,
+    FindingRecord,
+)
+
+
+class PostgresComplianceRepository(ComplianceRepository):
+    """Stores compliance analyses, findings, and finding chat messages in PostgreSQL."""
+
+    def __init__(
+        self,
+        host: str,
+        port: int,
+        user: str,
+        password: str,
+        dbname: str,
+        minconn: int = 1,
+        maxconn: int = 5,
+    ) -> None:
+        self._pool = psycopg2.pool.ThreadedConnectionPool(
+            minconn=minconn,
+            maxconn=maxconn,
+            host=host,
+            port=port,
+            user=user,
+            password=password,
+            dbname=dbname,
+        )
+        self._ensure_schema()
+
+    @contextmanager
+    def _conn(self):
+        conn = self._pool.getconn()
+        try:
+            yield conn
+        finally:
+            self._pool.putconn(conn)
+
+    def _ensure_schema(self) -> None:
+        """Create tables if they do not exist."""
+        with self._conn() as conn:
+            with conn.cursor() as cur:
+                cur.execute("""
+                    CREATE TABLE IF NOT EXISTS compliance_analyses (
+                        id              UUID PRIMARY KEY DEFAULT gen_random_uuid(),
+                        created_at      TIMESTAMPTZ NOT NULL DEFAULT now(),
+                        created_by      VARCHAR(255),
+                        doc_name        VARCHAR(500),
+                        standard_name   VARCHAR(500),
+                        risk_score      INTEGER,
+                        conclusion      TEXT,
+                        actions         JSONB,
+                        para_text       TEXT,
+                        highlight_terms JSONB
+                    );
+                """)
+                cur.execute("""
+                    CREATE TABLE IF NOT EXISTS compliance_findings (
+                        id          UUID PRIMARY KEY DEFAULT gen_random_uuid(),
+                        analysis_id UUID NOT NULL REFERENCES compliance_analyses(id) ON DELETE CASCADE,
+                        seq         INTEGER NOT NULL,
+                        title       VARCHAR(500),
+                        description TEXT,
+                        status      VARCHAR(50),
+                        clause_ref  VARCHAR(200)
+                    );
+                """)
+                cur.execute("""
+                    CREATE TABLE IF NOT EXISTS finding_chat_messages (
+                        id          UUID PRIMARY KEY DEFAULT gen_random_uuid(),
+                        analysis_id UUID NOT NULL REFERENCES compliance_analyses(id) ON DELETE CASCADE,
+                        finding_id  UUID NOT NULL REFERENCES compliance_findings(id) ON DELETE CASCADE,
+                        role        VARCHAR(20) NOT NULL,
+                        content     TEXT NOT NULL,
+                        created_at  TIMESTAMPTZ NOT NULL DEFAULT now()
+                    );
+                """)
+            conn.commit()
+
+    def save_analysis(self, record: AnalysisRecord) -> str:
+        """Insert analysis + findings; return the new analysis UUID."""
+        with self._conn() as conn:
+            with conn.cursor(cursor_factory=psycopg2.extras.RealDictCursor) as cur:
+                cur.execute(
+                    """
+                    INSERT INTO compliance_analyses
+                        (created_by, doc_name, standard_name, risk_score,
+                         conclusion, actions, para_text, highlight_terms)
+                    VALUES
+                        (%(created_by)s, %(doc_name)s, %(standard_name)s, %(risk_score)s,
+                         %(conclusion)s, %(actions)s, %(para_text)s, %(highlight_terms)s)
+                    RETURNING id
+                    """,
+                    {
+                        "created_by": record.created_by,
+                        "doc_name": record.doc_name,
+                        "standard_name": record.standard_name,
+                        "risk_score": record.risk_score,
+                        "conclusion": record.conclusion,
+                        "actions": json.dumps(record.actions, ensure_ascii=False),
+                        "para_text": record.para_text,
+                        "highlight_terms": json.dumps(record.highlight_terms, ensure_ascii=False),
+                    },
+                )
+                row = cur.fetchone()
+                analysis_id = str(row["id"])
+
+            if record.findings:
+                with conn.cursor() as cur:
+                    for f in record.findings:
+                        cur.execute(
+                            """
+                            INSERT INTO compliance_findings
+                                (analysis_id, seq, title, description, status, clause_ref)
+                            VALUES
+                                (%(analysis_id)s, %(seq)s, %(title)s, %(desc)s, %(status)s, %(clause_ref)s)
+                            """,
+                            {
+                                "analysis_id": analysis_id,
+                                "seq": f.seq,
+                                "title": f.title,
+                                "desc": f.description,
+                                "status": f.status,
+                                "clause_ref": f.clause_ref,
+                            },
+                        )
+            conn.commit()
+        return analysis_id
+
+    def list_analyses(self, limit: int = 50, offset: int = 0) -> list[AnalysisRecord]:
+        """Return analyses without nested findings, ordered newest first."""
+        with self._conn() as conn:
+            with conn.cursor(cursor_factory=psycopg2.extras.RealDictCursor) as cur:
+                cur.execute(
+                    """
+                    SELECT id, created_at, created_by, doc_name, standard_name,
+                           risk_score, conclusion, actions, para_text, highlight_terms
+                    FROM compliance_analyses
+                    ORDER BY created_at DESC
+                    LIMIT %(limit)s OFFSET %(offset)s
+                    """,
+                    {"limit": limit, "offset": offset},
+                )
+                rows = cur.fetchall()
+        return [self._row_to_record(dict(r)) for r in rows]
+
+    def get_analysis(self, analysis_id: str) -> Optional[AnalysisRecord]:
+        """Return analysis with nested findings list."""
+        with self._conn() as conn:
+            with conn.cursor(cursor_factory=psycopg2.extras.RealDictCursor) as cur:
+                cur.execute(
+                    "SELECT * FROM compliance_analyses WHERE id = %(id)s",
+                    {"id": analysis_id},
+                )
+                row = cur.fetchone()
+                if not row:
+                    return None
+                record = self._row_to_record(dict(row))
+
+                cur.execute(
+                    """
+                    SELECT id, analysis_id, seq, title, description, status, clause_ref
+                    FROM compliance_findings
+                    WHERE analysis_id = %(id)s
+                    ORDER BY seq
+                    """,
+                    {"id": analysis_id},
+                )
+                findings = [
+                    FindingRecord(
+                        id=str(r["id"]),
+                        analysis_id=str(r["analysis_id"]),
+                        seq=r["seq"],
+                        title=r["title"] or "",
+                        description=r["description"] or "",
+                        status=r["status"] or "ok",
+                        clause_ref=r["clause_ref"],
+                    )
+                    for r in cur.fetchall()
+                ]
+                record.findings = findings
+        return record
+
+    def delete_analysis(self, analysis_id: str) -> None:
+        """Delete analysis; findings and chat messages cascade automatically."""
+        with self._conn() as conn:
+            with conn.cursor() as cur:
+                cur.execute(
+                    "DELETE FROM compliance_analyses WHERE id = %(id)s",
+                    {"id": analysis_id},
+                )
+            conn.commit()
+
+    def save_message(self, analysis_id: str, finding_id: str, role: str, content: str) -> str:
+        """Persist a chat message; return its UUID."""
+        with self._conn() as conn:
+            with conn.cursor(cursor_factory=psycopg2.extras.RealDictCursor) as cur:
+                cur.execute(
+                    """
+                    INSERT INTO finding_chat_messages
+                        (analysis_id, finding_id, role, content)
+                    VALUES
+                        (%(analysis_id)s, %(finding_id)s, %(role)s, %(content)s)
+                    RETURNING id
+                    """,
+                    {
+                        "analysis_id": analysis_id,
+                        "finding_id": finding_id,
+                        "role": role,
+                        "content": content,
+                    },
+                )
+                row = cur.fetchone()
+            conn.commit()
+        return str(row["id"])
+
+    def get_messages(self, finding_id: str) -> list[dict]:
+        """Return messages for a finding, oldest first."""
+        with self._conn() as conn:
+            with conn.cursor(cursor_factory=psycopg2.extras.RealDictCursor) as cur:
+                cur.execute(
+                    """
+                    SELECT id, role, content, created_at
+                    FROM finding_chat_messages
+                    WHERE finding_id = %(finding_id)s
+                    ORDER BY created_at ASC
+                    """,
+                    {"finding_id": finding_id},
+                )
+                rows = cur.fetchall()
+        return [
+            {
+                "id": str(r["id"]),
+                "role": r["role"],
+                "content": r["content"],
+                "created_at": r["created_at"].isoformat() if r["created_at"] else "",
+            }
+            for r in rows
+        ]
+
+    def _row_to_record(self, row: dict) -> AnalysisRecord:
+        """Convert a RealDictCursor row to an AnalysisRecord (no findings)."""
+        actions = row.get("actions") or []
+        if isinstance(actions, str):
+            actions = json.loads(actions)
+        highlight_terms = row.get("highlight_terms") or []
+        if isinstance(highlight_terms, str):
+            highlight_terms = json.loads(highlight_terms)
+        return AnalysisRecord(
+            id=str(row["id"]),
+            created_at=row["created_at"] if isinstance(row["created_at"], datetime) else datetime.utcnow(),
+            created_by=row.get("created_by"),
+            doc_name=row.get("doc_name") or "",
+            standard_name=row.get("standard_name") or "",
+            risk_score=int(row.get("risk_score") or 0),
+            conclusion=row.get("conclusion") or "",
+            actions=actions,
+            para_text=row.get("para_text") or "",
+            highlight_terms=highlight_terms,
+            findings=[],
+        )
--- a/backend/app/infrastructure/perception/base_event_store.py
+++ b/backend/app/infrastructure/perception/base_event_store.py
@@ -0,0 +1,39 @@
+"""Abstract base class for regulatory event stores."""
+
+from __future__ import annotations
+
+from abc import ABC, abstractmethod
+
+
+class BaseEventStore(ABC):
+    """Port interface for regulatory event persistence."""
+
+    @abstractmethod
+    def all(self) -> list[dict]:
+        """Return all events, most-recent first."""
+
+    @abstractmethod
+    def get(self, event_id: str) -> dict | None:
+        """Return a single event by ID, or None."""
+
+    @abstractmethod
+    def filter(
+        self,
+        *,
+        source: str | None = None,
+        impact_level: str | None = None,
+        limit: int = 50,
+    ) -> list[dict]:
+        """Return filtered events sorted by published_at descending."""
+
+    @abstractmethod
+    def stats(self) -> dict:
+        """Return {total, high_impact, medium_impact, low_impact, recent_90d}."""
+
+    @abstractmethod
+    def upsert(self, event: dict) -> None:
+        """Insert or update an event record."""
+
+    @abstractmethod
+    def get_by_standard_code(self, standard_code: str) -> dict | None:
+        """Return the most-recent event with matching standard_code, or None."""
--- a/backend/app/infrastructure/perception/crawlers/init.py
+++ b/backend/app/infrastructure/perception/crawlers/init.py
--- a/backend/app/infrastructure/perception/crawlers/_utils.py
+++ b/backend/app/infrastructure/perception/crawlers/_utils.py
@@ -0,0 +1,43 @@
+"""Shared utility functions for crawlers."""
+
+from __future__ import annotations
+
+import re
+from datetime import date
+
+
+def parse_date(text: str) -> str:
+    """Return YYYY-MM-DD from common Chinese date formats, or today's date."""
+    text = text.strip()
+    if not text:
+        return date.today().isoformat()
+    m = re.search(r"(\d{4})[/-](\d{1,2})[/-](\d{1,2})", text)
+    if m:
+        try:
+            return date(int(m.group(1)), int(m.group(2)), int(m.group(3))).isoformat()
+        except ValueError:
+            pass
+    m2 = re.search(r"(\d{4})年(\d{1,2})月(\d{1,2})日?", text)
+    if m2:
+        try:
+            return date(int(m2.group(1)), int(m2.group(2)), int(m2.group(3))).isoformat()
+        except ValueError:
+            pass
+    return date.today().isoformat()
+
+
+def extract_tags(standard_code: str, title: str) -> list[str]:
+    """Derive simple keyword tags from standard code and title."""
+    tags: list[str] = []
+    code_upper = standard_code.upper()
+    if "GB" in code_upper:
+        tags.append("国家标准")
+    if "/T" in code_upper:
+        tags.append("推荐性")
+    else:
+        tags.append("强制性")
+    keywords = ["电动", "安全", "自动驾驶", "充电", "智能网联", "碰撞", "排放", "网络安全"]
+    for kw in keywords:
+        if kw in title:
+            tags.append(kw)
+    return tags[:5]
--- a/backend/app/infrastructure/perception/crawlers/base.py
+++ b/backend/app/infrastructure/perception/crawlers/base.py
@@ -0,0 +1,32 @@
+"""Shared contracts for regulatory source crawlers."""
+
+from __future__ import annotations
+
+from abc import ABC, abstractmethod
+from dataclasses import dataclass, field
+
+
+@dataclass
+class RawEvent:
+    """Raw regulatory event returned by a crawler before enrichment."""
+
+    source: str
+    source_label: str
+    standard_code: str
+    title: str
+    summary: str
+    full_text_url: str
+    status: str           # 'enacted' | 'draft' | 'consultation'
+    published_at: str     # YYYY-MM-DD string
+    effective_at: str | None
+    category: str
+    tags: list[str] = field(default_factory=list)
+    raw_text: str = ""    # full crawled text for hashing + LLM
+
+
+class BaseCrawler(ABC):
+    """Abstract regulatory source crawler."""
+
+    @abstractmethod
+    def fetch(self, limit: int = 50) -> list[RawEvent]:
+        """Fetch up to `limit` recent events from the data source."""
--- a/backend/app/infrastructure/perception/crawlers/catarc_crawler.py
+++ b/backend/app/infrastructure/perception/crawlers/catarc_crawler.py
@@ -0,0 +1,83 @@
+"""Crawler for CATARC automotive standard catalogue."""
+
+from __future__ import annotations
+
+from urllib.parse import urljoin
+
+import httpx
+from bs4 import BeautifulSoup
+from loguru import logger
+
+from app.infrastructure.perception.crawlers.base import BaseCrawler, RawEvent
+from ._utils import extract_tags, parse_date
+
+_BASE_URL = "https://www.catarc.org.cn/bzzxd/qcbz/index.html"
+_HOST = "https://www.catarc.org.cn"
+
+_STATUS_MAP = {
+    "现行": "enacted",
+    "即将实施": "enacted",
+    "废止": "enacted",
+    "征求意见": "consultation",
+    "报批": "draft",
+}
+
+
+class CatarcCrawler(BaseCrawler):
+    """Scrape the CATARC automotive standard list page."""
+
+    def fetch(self, limit: int = 50) -> list[RawEvent]:
+        events: list[RawEvent] = []
+        page = 1
+        max_pages = max(10, limit)
+        while len(events) < limit and page <= max_pages:
+            url = f"{_BASE_URL}?page={page}"
+            try:
+                resp = httpx.get(url, timeout=30, follow_redirects=True)
+                resp.raise_for_status()
+            except Exception as exc:
+                logger.warning("CATARC fetch failed page={} err={}", page, exc)
+                break
+
+            soup = BeautifulSoup(resp.text, "lxml")
+            rows = soup.select("table tr")
+            if not rows:
+                break
+
+            batch: list[RawEvent] = []
+            for row in rows:
+                cells = row.find_all("td")
+                if len(cells) < 3:
+                    continue
+                link = cells[0].find("a")
+                standard_code = link.get_text(strip=True) if link else cells[0].get_text(strip=True)
+                title = cells[1].get_text(strip=True) if len(cells) > 1 else standard_code
+                date_text = cells[2].get_text(strip=True) if len(cells) > 2 else ""
+                published_at = parse_date(date_text)
+                status_text = cells[3].get_text(strip=True) if len(cells) > 3 else ""
+                status = _STATUS_MAP.get(status_text, "enacted")
+                detail_url = urljoin(_HOST, link["href"]) if link and link.get("href") else url
+                raw_text = f"{standard_code} {title}"
+                batch.append(RawEvent(
+                    source="CATARC",
+                    source_label="全国汽车标准化技术委员会",
+                    standard_code=standard_code,
+                    title=title,
+                    summary=title,
+                    full_text_url=detail_url,
+                    status=status,
+                    published_at=published_at,
+                    effective_at=None,
+                    category="汽车标准",
+                    tags=extract_tags(standard_code, title),
+                    raw_text=raw_text,
+                ))
+
+            if not batch:
+                break
+            events.extend(batch)
+            page += 1
+
+        return events[:limit]
+
+
--- a/backend/app/infrastructure/perception/crawlers/eurlex_crawler.py
+++ b/backend/app/infrastructure/perception/crawlers/eurlex_crawler.py
@@ -0,0 +1,117 @@
+"""Crawler for EUR-Lex RSS feeds covering EU AI Act and automotive regulations."""
+
+from __future__ import annotations
+
+import re
+from email.utils import parsedate_to_datetime
+
+import httpx
+from bs4 import BeautifulSoup
+from loguru import logger
+
+from app.infrastructure.perception.crawlers.base import BaseCrawler, RawEvent
+from ._utils import parse_date
+
+_EURLEX_RSS_URLS = [
+    "https://eur-lex.europa.eu/rss-feed/OJ-L.rss",
+]
+
+_AUTOMOTIVE_KEYWORDS = [
+    "vehicle", "automotive", "motor", "tyre", "emission", "ADAS", "autonomous",
+    "AI Act", "artificial intelligence", "cybersecurity", "software update",
+    "R155", "R156", "汽车", "车辆",
+]
+
+
+_AUTOMOTIVE_KEYWORDS_LOWER = [kw.lower() for kw in _AUTOMOTIVE_KEYWORDS]
+
+
+def _is_automotive_relevant(title: str, description: str) -> bool:
+    combined = (title + " " + description).lower()
+    return any(kw in combined for kw in _AUTOMOTIVE_KEYWORDS_LOWER)
+
+
+def _extract_celex(url: str) -> str:
+    m = re.search(r"CELEX[:/]([0-9A-Z]+)", url)
+    return m.group(1) if m else ""
+
+
+def _parse_rss_date(rfc2822: str) -> str:
+    try:
+        dt = parsedate_to_datetime(rfc2822)
+        return dt.date().isoformat()
+    except Exception:
+        return parse_date(rfc2822)
+
+
+class EurlexCrawler(BaseCrawler):
+    """Fetch automotive-relevant EU regulations from EUR-Lex RSS feeds."""
+
+    def fetch(self, limit: int = 50) -> list[RawEvent]:
+        events: list[RawEvent] = []
+        for rss_url in _EURLEX_RSS_URLS:
+            if len(events) >= limit:
+                break
+            try:
+                resp = httpx.get(rss_url, timeout=30, follow_redirects=True)
+                resp.raise_for_status()
+            except Exception as exc:
+                logger.warning("EUR-Lex RSS fetch failed url={} err={}", rss_url, exc)
+                continue
+
+            soup = BeautifulSoup(resp.content, "lxml-xml")
+            for item in soup.find_all("item"):
+                if len(events) >= limit:
+                    break
+                title_tag = item.find("title")
+                title = title_tag.get_text(strip=True) if title_tag else ""
+                desc_tag = item.find("description")
+                description = desc_tag.get_text(strip=True) if desc_tag else ""
+                link_tag = item.find("link")
+                link = link_tag.get_text(strip=True) if link_tag else ""
+                pub_date_tag = item.find("pubDate")
+                pub_date = pub_date_tag.get_text(strip=True) if pub_date_tag else ""
+
+                if not _is_automotive_relevant(title, description):
+                    continue
+
+                celex = _extract_celex(link)
+                standard_code = celex if celex else title[:60]
+                published_at = _parse_rss_date(pub_date) if pub_date else ""
+
+                events.append(RawEvent(
+                    source="EUR-Lex",
+                    source_label="欧盟官方公报",
+                    standard_code=standard_code,
+                    title=title,
+                    summary=description[:500],
+                    full_text_url=link,
+                    status="enacted",
+                    published_at=published_at,
+                    effective_at=None,
+                    category="EU法规",
+                    tags=_extract_eurlex_tags(title, description),
+                    raw_text=f"{title}\n{description}",
+                ))
+
+        return events[:limit]
+
+
+def _extract_eurlex_tags(title: str, description: str) -> list[str]:
+    combined = title + " " + description
+    tag_map = {
+        "AI Act": "EU AI Act",
+        "artificial intelligence": "EU AI Act",
+        "R155": "UN R155",
+        "R156": "UN R156",
+        "cybersecurity": "网络安全",
+        "emission": "排放",
+        "autonomous": "自动驾驶",
+        "ADAS": "ADAS",
+    }
+    combined_lower = combined.lower()
+    tags = []
+    for kw, tag in tag_map.items():
+        if kw.lower() in combined_lower:
+            tags.append(tag)
+    return tags[:5]
--- a/backend/app/infrastructure/perception/crawlers/guobiao_crawler.py
+++ b/backend/app/infrastructure/perception/crawlers/guobiao_crawler.py
@@ -0,0 +1,92 @@
+"""Crawlers for the 国标委 (SAMR) standard information platform."""
+
+from __future__ import annotations
+
+import httpx
+from loguru import logger
+
+from app.infrastructure.perception.crawlers.base import BaseCrawler, RawEvent
+from ._utils import extract_tags, parse_date
+
+_BASE_URL = "https://openstd.samr.gov.cn/bzgk/std/std_list_type"
+_HEADERS = {"User-Agent": "Mozilla/5.0 (compatible; RegulatoryBot/1.0)"}
+
+
+def _fetch_page(std_type: int, page: int, page_size: int) -> list[dict]:
+    params = {
+        "p.p1": std_type,
+        "p.p2": "车",
+        "p.p90": "circulation_date",
+        "p.p91": "desc",
+        "p.p6": page,
+        "p.p7": page_size,
+    }
+    try:
+        resp = httpx.get(_BASE_URL, params=params, headers=_HEADERS, timeout=30)
+        resp.raise_for_status()
+        data = resp.json()
+        return data.get("rows", []) or []
+    except Exception as exc:
+        logger.warning("国标委 fetch failed type={} page={} err={}", std_type, page, exc)
+        return []
+
+
+def _row_to_raw_event(row: dict, source_label: str) -> RawEvent:
+    standard_code = row.get("std_code", "")
+    title = row.get("std_name", standard_code)
+    published_at = parse_date(row.get("release_date", ""))
+    effective_at_raw = row.get("implement_date", "")
+    effective_at = parse_date(effective_at_raw) if effective_at_raw else None
+    status_text = row.get("std_status", "")
+    if "征求意见" in status_text:
+        status = "consultation"
+    elif "报批" in status_text or "草案" in status_text:
+        status = "draft"
+    else:
+        status = "enacted"
+    return RawEvent(
+        source="国标委",
+        source_label=source_label,
+        standard_code=standard_code,
+        title=title,
+        summary=title,
+        full_text_url=f"https://openstd.samr.gov.cn/bzgk/std/detail?id={row.get('id', '')}",
+        status=status,
+        published_at=published_at,
+        effective_at=effective_at,
+        category=row.get("std_type", "国家标准"),
+        tags=extract_tags(standard_code, title),
+        raw_text=f"{standard_code} {title}",
+    )
+
+
+class GuobiaoMandatoryCrawler(BaseCrawler):
+    """Fetch mandatory national standards (强制性) related to vehicles."""
+
+    def fetch(self, limit: int = 50) -> list[RawEvent]:
+        events: list[RawEvent] = []
+        page = 1
+        max_pages = max(10, limit)
+        while len(events) < limit and page <= max_pages:
+            rows = _fetch_page(std_type=1, page=page, page_size=20)
+            if not rows:
+                break
+            events.extend(_row_to_raw_event(r, "国标委·强制性") for r in rows)
+            page += 1
+        return events[:limit]
+
+
+class GuobiaoRecommendedCrawler(BaseCrawler):
+    """Fetch recommended national standards (推荐性) related to vehicles."""
+
+    def fetch(self, limit: int = 50) -> list[RawEvent]:
+        events: list[RawEvent] = []
+        page = 1
+        max_pages = max(10, limit)
+        while len(events) < limit and page <= max_pages:
+            rows = _fetch_page(std_type=2, page=page, page_size=20)
+            if not rows:
+                break
+            events.extend(_row_to_raw_event(r, "国标委·推荐性") for r in rows)
+            page += 1
+        return events[:limit]
--- a/backend/app/infrastructure/perception/llm_pipeline.py
+++ b/backend/app/infrastructure/perception/llm_pipeline.py
@@ -0,0 +1,241 @@
+"""LLM-driven pipeline for regulatory event enrichment."""
+
+from __future__ import annotations
+
+import json
+import math
+from typing import Any
+
+from loguru import logger
+
+from app.config.settings import settings
+from app.infrastructure.embedding.openai_compatible_embedding_provider import (
+    OpenAICompatibleEmbeddingProvider,
+)
+from app.services.llm.llm_factory import get_llm_client
+
+_EXTRACT_SYSTEM = (
+    "You are a regulatory compliance expert specialising in automotive standards "
+    "(GB, UN-ECE, ISO, EU). Extract structured information from regulation text. "
+    "Return valid JSON only — no markdown fences, no extra keys."
+)
+
+_ASSESS_SYSTEM = (
+    "You are an automotive compliance analyst. Given a regulation and related document excerpts, "
+    "identify which documents are affected and what actions are required. "
+    "Return a JSON array only."
+)
+
+_DIFF_SYSTEM = (
+    "You are a regulatory change analyst. Given an old and new version of a regulation paragraph, "
+    "classify the type of change and summarise it. "
+    "Return JSON only: {\"change_type\": \"tightened|relaxed|added|removed\", \"summary\": \"...\"}"
+)
+
+_SIMILARITY_THRESHOLD = 0.85
+
+
+def _cosine(a: list[float], b: list[float]) -> float:
+    dot = sum(x * y for x, y in zip(a, b))
+    norm_a = math.sqrt(sum(x * x for x in a))
+    norm_b = math.sqrt(sum(x * x for x in b))
+    if norm_a == 0 or norm_b == 0:
+        return 0.0
+    return dot / (norm_a * norm_b)
+
+
+def _llm_json(client: Any, messages: list[dict]) -> Any:
+    """Call LLM and parse JSON response; return None on failure."""
+    try:
+        resp = client.chat(messages)
+        text = (resp.content or "").strip()
+        if text.startswith("```"):
+            text = text.split("```")[1]
+            if text.startswith("json"):
+                text = text[4:]
+        return json.loads(text)
+    except Exception as exc:
+        logger.warning("LLM JSON parse failed: {}", exc)
+        return None
+
+
+class LlmPipeline:
+    """Three-step enrichment pipeline for crawled regulatory events."""
+
+    def __init__(self) -> None:
+        self._client = get_llm_client(
+            provider=settings.llm_provider,
+            model=settings.llm_model,
+        )
+        self._embedder = OpenAICompatibleEmbeddingProvider()
+
+    # ------------------------------------------------------------------
+    # Step 1: Structure extraction
+    # ------------------------------------------------------------------
+
+    def extract_structure(self, event: dict) -> dict:
+        """Extract obligations, deadlines, scope, penalties, impact_level from event text."""
+        prompt = f"""Extract structured compliance information from this regulation:
+
+Standard: {event.get('standard_code', '')}
+Title: {event.get('title', '')}
+Source: {event.get('source_label', '')}
+Summary: {event.get('summary', '')}
+Tags: {', '.join(event.get('tags') or [])}
+
+Return JSON with exactly these keys:
+{{
+  "obligations": [{{"text": "...", "deontic": "must|shall|may|prohibited", "subject": "...", "object": "...", "condition": ""}}],
+  "deadlines": [{{"date": "YYYY-MM-DD or null", "description": "..."}}],
+  "scope": "one sentence describing who/what this applies to",
+  "penalties": "one sentence on consequences of non-compliance, or null",
+  "impact_level": "high|medium|low"
+}}"""
+
+        messages = [
+            {"role": "system", "content": _EXTRACT_SYSTEM},
+            {"role": "user", "content": prompt},
+        ]
+        result = _llm_json(self._client, messages)
+        if not isinstance(result, dict):
+            return {
+                "obligations": [],
+                "deadlines": [],
+                "scope": "",
+                "penalties": "",
+                "impact_level": "medium",
+            }
+        return result
+
+    # ------------------------------------------------------------------
+    # Step 2: Impact assessment
+    # ------------------------------------------------------------------
+
+    def assess_impact(self, event: dict, retrieval_service: Any) -> list[dict]:
+        """Use RAG to find affected documents and generate recommendations."""
+        obligations = event.get("obligations") or []
+        obligation_texts = " ".join(o.get("text", "") for o in obligations[:3])
+        query = f"{event.get('standard_code', '')} {event.get('title', '')} {obligation_texts}"
+
+        try:
+            chunks = retrieval_service.retrieve(query=query, top_k=5)
+        except Exception as exc:
+            logger.warning("RAG retrieval failed: {}", exc)
+            return []
+
+        if not chunks:
+            return []
+
+        seen: set[str] = set()
+        doc_excerpts: list[dict] = []
+        for chunk in chunks:
+            if chunk.doc_id not in seen:
+                seen.add(chunk.doc_id)
+                doc_excerpts.append({
+                    "doc_id": chunk.doc_id,
+                    "doc_name": chunk.doc_title,
+                    "score": round(float(chunk.score if chunk.score is not None else 0), 4),
+                    "snippet": (chunk.text or "")[:300],
+                    "clause": getattr(chunk, "section_title", "") or "",
+                })
+
+        context = "\n".join(
+            f"[{d['doc_name']} {d['clause']}] score={d['score']}: {d['snippet']}"
+            for d in doc_excerpts
+        )
+        prompt = f"""Regulation: {event.get('standard_code')} — {event.get('title')}
+Obligations: {obligation_texts or event.get('summary', '')}
+
+Affected documents found in knowledge base:
+{context}
+
+For each document, assess impact and recommend action. Return JSON array:
+[{{"doc_id":"...","doc_name":"...","score":0.0,"key_clauses":"...","recommendation":"one sentence action"}}]"""
+
+        messages = [
+            {"role": "system", "content": _ASSESS_SYSTEM},
+            {"role": "user", "content": prompt},
+        ]
+        result = _llm_json(self._client, messages)
+        if isinstance(result, list):
+            score_map = {d["doc_id"]: d["score"] for d in doc_excerpts}
+            for item in result:
+                if isinstance(item, dict) and item.get("doc_id") in score_map:
+                    item["score"] = score_map[item["doc_id"]]
+            return result
+        return doc_excerpts
+
+    # ------------------------------------------------------------------
+    # Step 3: Semantic diff
+    # ------------------------------------------------------------------
+
+    def compute_diff(self, old_text: str, new_text: str) -> dict:
+        """Compare old and new regulation text; return changed sections and summary."""
+        old_paras = [p.strip() for p in old_text.split("\n") if p.strip()]
+        new_paras = [p.strip() for p in new_text.split("\n") if p.strip()]
+
+        if not old_paras or not new_paras:
+            return {"changed_sections": [], "change_summary": "No comparable text."}
+
+        all_paras = old_paras + new_paras
+        try:
+            all_embeddings = self._embedder.embed_texts(all_paras)
+        except Exception as exc:
+            logger.warning("Embedding for diff failed: {}", exc)
+            return {"changed_sections": [], "change_summary": "Diff unavailable (embedding error)."}
+
+        old_embeddings = all_embeddings[: len(old_paras)]
+        new_embeddings = all_embeddings[len(old_paras):]
+
+        changed_sections: list[dict] = []
+        max_len = max(len(old_paras), len(new_paras))
+
+        for i in range(max_len):
+            if i >= len(old_paras):
+                # New paragraph added
+                changed_sections.append({
+                    "old_text": "",
+                    "new_text": new_paras[i][:300],
+                    "similarity": 0.0,
+                    "change_type": "added",
+                    "summary": "New paragraph added.",
+                })
+                continue
+            if i >= len(new_paras):
+                # Old paragraph removed
+                changed_sections.append({
+                    "old_text": old_paras[i][:300],
+                    "new_text": "",
+                    "similarity": 0.0,
+                    "change_type": "removed",
+                    "summary": "Paragraph removed.",
+                })
+                continue
+            # Both exist — compare via embeddings
+            sim = _cosine(old_embeddings[i], new_embeddings[i])
+            if sim < _SIMILARITY_THRESHOLD:
+                messages = [
+                    {"role": "system", "content": _DIFF_SYSTEM},
+                    {"role": "user", "content": f"OLD: {old_paras[i][:500]}\nNEW: {new_paras[i][:500]}"},
+                ]
+                classification = _llm_json(self._client, messages) or {}
+                changed_sections.append({
+                    "old_text": old_paras[i][:300],
+                    "new_text": new_paras[i][:300],
+                    "similarity": round(sim, 3),
+                    "change_type": classification.get("change_type", "modified"),
+                    "summary": classification.get("summary", ""),
+                })
+
+        if not changed_sections:
+            change_summary = "No substantive changes detected between versions."
+        else:
+            types = [s["change_type"] for s in changed_sections]
+            change_summary = (
+                f"{len(changed_sections)} paragraph(s) changed: "
+                + ", ".join(f"{t}" for t in set(types))
+                + ". "
+                + (changed_sections[0].get("summary", "") if changed_sections else "")
+            )
+
+        return {"changed_sections": changed_sections, "change_summary": change_summary}
--- a/backend/app/infrastructure/perception/mock_event_store.py
+++ b/backend/app/infrastructure/perception/mock_event_store.py
@@ -4,6 +4,8 @@ from __future__ import annotations

 from typing import Any

+from app.infrastructure.perception.base_event_store import BaseEventStore
+
 MOCK_EVENTS: list[dict[str, Any]] = [
    # ------------------------------------------------------------------ HIGH
    {
@@ -379,18 +381,18 @@ MOCK_EVENTS: list[dict[str, Any]] = [
    },
 ]

-# Index for fast lookup
-_EVENT_INDEX: dict[str, dict] = {e["id"]: e for e in MOCK_EVENTS}
-
-
-class MockEventStore:
+class MockEventStore(BaseEventStore):
    """In-memory mock store for regulatory events."""

+    def __init__(self) -> None:
+        self._events: list[dict] = [dict(e) for e in MOCK_EVENTS]
+        self._index: dict[str, dict] = {e["id"]: e for e in self._events}
+
    def all(self) -> list[dict]:
-        return list(MOCK_EVENTS)
+        return list(self._events)

    def get(self, event_id: str) -> dict | None:
-        return _EVENT_INDEX.get(event_id)
+        return self._index.get(event_id)

    def filter(
        self,
@@ -399,23 +401,39 @@ class MockEventStore:
        impact_level: str | None = None,
        limit: int = 50,
    ) -> list[dict]:
-        events = list(MOCK_EVENTS)
+        events = list(self._events)
        if source:
            events = [e for e in events if e["source"] == source]
        if impact_level:
            events = [e for e in events if e["impact_level"] == impact_level]
-        events.sort(key=lambda e: e["published_at"], reverse=True)
+        events.sort(key=lambda e: e.get("published_at") or "", reverse=True)
        return events[:limit]

    def stats(self) -> dict:
        from datetime import date, timedelta

-        events = MOCK_EVENTS
+        events = self._events
        cutoff = (date.today() - timedelta(days=90)).isoformat()
        return {
            "total": len(events),
            "high_impact": sum(1 for e in events if e["impact_level"] == "high"),
            "medium_impact": sum(1 for e in events if e["impact_level"] == "medium"),
            "low_impact": sum(1 for e in events if e["impact_level"] == "low"),
-            "recent_90d": sum(1 for e in events if e["published_at"] >= cutoff),
+            "recent_90d": sum(1 for e in events if (e.get("published_at") or "") >= cutoff),
        }
+
+    def upsert(self, event: dict) -> None:
+        """Insert or update event in the in-memory list (used in tests)."""
+        existing = self._index.get(event["id"])
+        if existing:
+            existing.update(event)
+        else:
+            self._events.append(event)
+            self._index[event["id"]] = event
+
+    def get_by_standard_code(self, standard_code: str) -> dict | None:
+        """Return most-recent event with matching standard_code."""
+        matches = [e for e in self._events if e.get("standard_code") == standard_code]
+        if not matches:
+            return None
+        return max(matches, key=lambda e: e.get("published_at", ""))
--- a/backend/app/infrastructure/perception/postgres_event_store.py
+++ b/backend/app/infrastructure/perception/postgres_event_store.py
@@ -0,0 +1,225 @@
+"""PostgreSQL-backed regulatory event store."""
+
+from __future__ import annotations
+
+import json
+from contextlib import contextmanager
+from datetime import UTC, date, datetime, timedelta
+from typing import Any
+
+import psycopg2
+import psycopg2.extras
+from psycopg2.pool import ThreadedConnectionPool
+
+from app.config.settings import settings
+from app.infrastructure.perception.base_event_store import BaseEventStore
+
+_CREATE_TABLE = """
+CREATE TABLE IF NOT EXISTS regulation_events (
+    id               TEXT PRIMARY KEY,
+    source           TEXT NOT NULL,
+    source_label     TEXT,
+    standard_code    TEXT NOT NULL,
+    title            TEXT NOT NULL,
+    summary          TEXT,
+    full_text_url    TEXT,
+    status           TEXT,
+    impact_level     TEXT,
+    published_at     DATE,
+    effective_at     DATE,
+    category         TEXT,
+    tags             TEXT[],
+    obligations      JSONB,
+    deadlines        JSONB,
+    scope            TEXT,
+    penalties        TEXT,
+    content_hash     TEXT,
+    previous_hash    TEXT,
+    change_summary   TEXT,
+    changed_sections JSONB,
+    affected_docs    JSONB,
+    crawled_at       TIMESTAMPTZ DEFAULT now(),
+    processed_at     TIMESTAMPTZ,
+    raw_storage_key  TEXT
+);
+CREATE INDEX IF NOT EXISTS reg_events_source_date
+    ON regulation_events (source, published_at DESC);
+CREATE INDEX IF NOT EXISTS reg_events_impact_date
+    ON regulation_events (impact_level, published_at DESC);
+"""
+
+_ALL_COLUMNS = (
+    "id", "source", "source_label", "standard_code", "title", "summary",
+    "full_text_url", "status", "impact_level", "published_at", "effective_at",
+    "category", "tags", "obligations", "deadlines", "scope", "penalties",
+    "content_hash", "previous_hash", "change_summary", "changed_sections",
+    "affected_docs", "crawled_at", "processed_at", "raw_storage_key",
+)
+
+
+def _row_to_dict(row: dict[str, Any]) -> dict:
+    """Convert a psycopg2 RealDictRow to a plain dict with serialized JSON fields."""
+    d = dict(row)
+    for field in ("obligations", "deadlines", "changed_sections", "affected_docs"):
+        val = d.get(field)
+        if isinstance(val, str):
+            d[field] = json.loads(val)
+    for date_field in ("published_at", "effective_at"):
+        val = d.get(date_field)
+        if isinstance(val, datetime):
+            d[date_field] = val.date().isoformat()
+        elif isinstance(val, date):
+            d[date_field] = val.isoformat()
+    for ts_field in ("crawled_at", "processed_at"):
+        val = d.get(ts_field)
+        if isinstance(val, datetime):
+            d[ts_field] = val.isoformat()
+    return d
+
+
+class PostgresEventStore(BaseEventStore):
+    """Regulatory event store backed by PostgreSQL."""
+
+    def __init__(self) -> None:
+        self._pool = ThreadedConnectionPool(
+            minconn=1,
+            maxconn=5,
+            host=settings.postgres_host,
+            port=settings.postgres_port,
+            user=settings.postgres_user,
+            password=settings.postgres_password,
+            dbname=settings.postgres_db,
+        )
+        self._ensure_schema()
+
+    def _ensure_schema(self) -> None:
+        with self._conn() as conn:
+            try:
+                with conn.cursor() as cur:
+                    cur.execute(_CREATE_TABLE)
+                conn.commit()
+            except Exception:
+                conn.rollback()
+                raise
+
+    @contextmanager
+    def _conn(self):
+        conn = None
+        try:
+            conn = self._pool.getconn()
+            yield conn
+        finally:
+            if conn is not None:
+                self._pool.putconn(conn)
+
+    def all(self) -> list[dict]:
+        with self._conn() as conn:
+            with conn.cursor(cursor_factory=psycopg2.extras.RealDictCursor) as cur:
+                cur.execute(
+                    "SELECT * FROM regulation_events ORDER BY published_at DESC NULLS LAST"
+                )
+                return [_row_to_dict(r) for r in cur.fetchall()]
+
+    def get(self, event_id: str) -> dict | None:
+        with self._conn() as conn:
+            with conn.cursor(cursor_factory=psycopg2.extras.RealDictCursor) as cur:
+                cur.execute(
+                    "SELECT * FROM regulation_events WHERE id = %s", (event_id,)
+                )
+                row = cur.fetchone()
+                return _row_to_dict(row) if row else None
+
+    def filter(
+        self,
+        *,
+        source: str | None = None,
+        impact_level: str | None = None,
+        limit: int = 50,
+    ) -> list[dict]:
+        conditions: list[str] = []
+        params: list[Any] = []
+        if source:
+            conditions.append("source = %s")
+            params.append(source)
+        if impact_level:
+            conditions.append("impact_level = %s")
+            params.append(impact_level)
+        where = ("WHERE " + " AND ".join(conditions)) if conditions else ""
+        params.append(limit)
+        sql = f"""
+            SELECT * FROM regulation_events
+            {where}
+            ORDER BY published_at DESC NULLS LAST
+            LIMIT %s
+        """
+        with self._conn() as conn:
+            with conn.cursor(cursor_factory=psycopg2.extras.RealDictCursor) as cur:
+                cur.execute(sql, params)
+                return [_row_to_dict(r) for r in cur.fetchall()]
+
+    def stats(self) -> dict:
+        cutoff = (date.today() - timedelta(days=90)).isoformat()
+        with self._conn() as conn:
+            with conn.cursor(cursor_factory=psycopg2.extras.RealDictCursor) as cur:
+                cur.execute("SELECT COUNT(*) AS count FROM regulation_events")
+                total = (cur.fetchone() or {}).get("count", 0)
+                cur.execute(
+                    "SELECT COUNT(*) AS count FROM regulation_events WHERE impact_level = 'high'"
+                )
+                high = (cur.fetchone() or {}).get("count", 0)
+                cur.execute(
+                    "SELECT COUNT(*) AS count FROM regulation_events WHERE impact_level = 'medium'"
+                )
+                medium = (cur.fetchone() or {}).get("count", 0)
+                cur.execute(
+                    "SELECT COUNT(*) AS count FROM regulation_events WHERE published_at >= %s",
+                    (cutoff,),
+                )
+                recent = (cur.fetchone() or {}).get("count", 0)
+        return {
+            "total": int(total),
+            "high_impact": int(high),
+            "medium_impact": int(medium),
+            "recent_90d": int(recent),
+        }
+
+    def upsert(self, event: dict) -> None:
+        """Insert or update a regulation event."""
+        cols = [c for c in _ALL_COLUMNS if c in event]
+        placeholders = ", ".join(f"%({c})s" for c in cols)
+        updates = ", ".join(f"{c} = EXCLUDED.{c}" for c in cols if c != "id")
+        sql = f"""
+            INSERT INTO regulation_events ({', '.join(cols)})
+            VALUES ({placeholders})
+            ON CONFLICT (id) DO UPDATE SET {updates}
+        """
+        row: dict[str, Any] = {}
+        for c in cols:
+            val = event.get(c)
+            if c in ("obligations", "deadlines", "changed_sections", "affected_docs") and val is not None:
+                row[c] = json.dumps(val, ensure_ascii=False)
+            elif c == "tags" and isinstance(val, list):
+                row[c] = val
+            else:
+                row[c] = val
+        with self._conn() as conn:
+            try:
+                with conn.cursor() as cur:
+                    cur.execute(sql, row)
+                conn.commit()
+            except Exception:
+                conn.rollback()
+                raise
+
+    def get_by_standard_code(self, standard_code: str) -> dict | None:
+        with self._conn() as conn:
+            with conn.cursor(cursor_factory=psycopg2.extras.RealDictCursor) as cur:
+                cur.execute(
+                    """SELECT * FROM regulation_events
+                       WHERE standard_code = %s
+                       ORDER BY published_at DESC NULLS LAST
+                       LIMIT 1""",
+                    (standard_code,),
+                )
+                row = cur.fetchone()
+                return _row_to_dict(row) if row else None
--- a/backend/app/infrastructure/session/redis_conversation_store.py
+++ b/backend/app/infrastructure/session/redis_conversation_store.py
@@ -0,0 +1,169 @@
+"""Redis-backed conversation store for persistent chat sessions.
+
+Sessions are stored as JSON strings under the key `session:{session_id}`.
+The Redis TTL is refreshed on every write so active sessions stay alive.
+On expiry, `get_session` returns None — callers should create a new session.
+"""
+
+from __future__ import annotations
+
+import json
+import time
+import uuid
+from typing import Any
+
+from loguru import logger
+
+from app.domain.conversation import ConversationMessage, ConversationSession, ConversationStore
+
+
+class RedisConversationStore(ConversationStore):
+    """Store conversation sessions in Redis with automatic TTL expiry.
+
+    Each session is serialised as a JSON object at key ``session:{session_id}``.
+    The TTL is reset on every write so sessions stay alive as long as they are active.
+    """
+
+    # Prefix for all session keys to avoid collisions with other Redis consumers.
+    _PREFIX = "session:"
+
+    def __init__(self, *, redis_client: Any, timeout_seconds: int = 1800) -> None:
+        """Initialise the store with an existing Redis client and a TTL in seconds."""
+        self._redis = redis_client
+        self._ttl = timeout_seconds
+
+    # ------------------------------------------------------------------
+    # Internal helpers
+    # ------------------------------------------------------------------
+
+    def _key(self, session_id: str) -> str:
+        """Build the Redis key for a session."""
+        return f"{self._PREFIX}{session_id}"
+
+    def _serialise(self, session: ConversationSession) -> str:
+        """Serialise a ConversationSession to a JSON string."""
+        return json.dumps(
+            {
+                "session_id": session.session_id,
+                "created_at": session.created_at,
+                "updated_at": session.updated_at,
+                "metadata": session.metadata,
+                "messages": [
+                    {
+                        "role": msg.role,
+                        "content": msg.content,
+                        "timestamp": msg.timestamp,
+                        "sources": msg.sources,
+                    }
+                    for msg in session.messages
+                ],
+            },
+            ensure_ascii=False,
+        )
+
+    def _deserialise(self, raw: bytes | str) -> ConversationSession:
+        """Deserialise a JSON string back into a ConversationSession."""
+        data = json.loads(raw)
+        messages = [
+            ConversationMessage(
+                role=m["role"],
+                content=m["content"],
+                timestamp=m["timestamp"],
+                sources=m.get("sources", []),
+            )
+            for m in data.get("messages", [])
+        ]
+        session = ConversationSession(
+            session_id=data["session_id"],
+            created_at=data.get("created_at", 0),
+            updated_at=data.get("updated_at", 0),
+            metadata=data.get("metadata", {}),
+        )
+        session.messages = messages
+        return session
+
+    def _save(self, session: ConversationSession) -> None:
+        """Persist a session to Redis and refresh its TTL."""
+        self._redis.setex(self._key(session.session_id), self._ttl, self._serialise(session))
+
+    # ------------------------------------------------------------------
+    # ConversationStore protocol
+    # ------------------------------------------------------------------
+
+    def create_session(self, metadata: dict | None = None) -> ConversationSession:
+        """Create a new empty session and persist it immediately."""
+        now = int(time.time())
+        session = ConversationSession(
+            session_id=str(uuid.uuid4())[:8],
+            created_at=now,
+            updated_at=now,
+            metadata=metadata or {},
+        )
+        self._save(session)
+        return session
+
+    def get_session(self, session_id: str) -> ConversationSession | None:
+        """Return a session by ID, or None if it does not exist or has expired."""
+        raw = self._redis.get(self._key(session_id))
+        if raw is None:
+            return None
+        try:
+            return self._deserialise(raw)
+        except Exception:
+            logger.warning("Failed to deserialise session: {}", session_id)
+            return None
+
+    def save_message(
+        self,
+        session_id: str,
+        *,
+        role: str,
+        content: str,
+        sources: list[dict] | None = None,
+    ) -> ConversationSession | None:
+        """Append a message to a session and refresh its TTL."""
+        session = self.get_session(session_id)
+        if session is None:
+            return None
+        session.messages.append(
+            ConversationMessage(
+                role=role,
+                content=content,
+                timestamp=int(time.time()),
+                sources=sources or [],
+            )
+        )
+        session.updated_at = int(time.time())
+        self._save(session)
+        return session
+
+    def delete_session(self, session_id: str) -> bool:
+        """Delete a session. Returns True if it existed, False otherwise."""
+        deleted = self._redis.delete(self._key(session_id))
+        return bool(deleted)
+
+    def list_sessions(self) -> list[dict]:
+        """Return summary dicts for all live sessions visible in this Redis DB.
+
+        Note: KEYS is used for simplicity; replace with SCAN for large deployments.
+        """
+        pattern = f"{self._PREFIX}*"
+        keys = self._redis.keys(pattern)
+        result = []
+        for key in keys:
+            raw = self._redis.get(key)
+            if raw is None:
+                continue
+            try:
+                data = json.loads(raw)
+                result.append(
+                    {
+                        "session_id": data["session_id"],
+                        "message_count": len(data.get("messages", [])),
+                        "created_at": data.get("created_at", 0),
+                        "updated_at": data.get("updated_at", 0),
+                    }
+                )
+            except Exception:
+                continue
+        return result
--- a/backend/app/infrastructure/tasks/init.py
+++ b/backend/app/infrastructure/tasks/init.py
@@ -0,0 +1,5 @@
+"""Celery task definitions for background processing.
+
+This package exposes the shared Celery application instance and all
+registered task functions used by API routes to enqueue work.
+"""
--- a/backend/app/infrastructure/tasks/celery_app.py
+++ b/backend/app/infrastructure/tasks/celery_app.py
@@ -0,0 +1,45 @@
+"""Shared Celery application instance for background task processing.
+
+All workers and enqueueing call sites import `celery_app` from this module
+so the broker/backend configuration stays in one place.
+"""
+
+from __future__ import annotations
+
+from celery import Celery
+
+from app.config.settings import settings
+
+
+def _redis_url() -> str:
+    """Return a Redis connection URL from application settings."""
+    if settings.redis_password:
+        return (
+            f"redis://:{settings.redis_password}@"
+            f"{settings.redis_host}:{settings.redis_port}/{settings.redis_db}"
+        )
+    return f"redis://{settings.redis_host}:{settings.redis_port}/{settings.redis_db}"
+
+
+_BROKER = _redis_url()
+_BACKEND = _redis_url()
+
+celery_app = Celery(
+    "compliance_hub",
+    broker=_BROKER,
+    backend=_BACKEND,
+    include=["app.infrastructure.tasks.document_tasks"],
+)
+
+celery_app.conf.update(
+    task_serializer="json",
+    result_serializer="json",
+    accept_content=["json"],
+    timezone="UTC",
+    enable_utc=True,
+    # Acknowledge task only after successful execution to avoid data loss.
+    task_acks_late=True,
+    task_reject_on_worker_lost=True,
+    # Keep results for 1 hour for status polling.
+    result_expires=3600,
+)
--- a/backend/app/infrastructure/tasks/document_tasks.py
+++ b/backend/app/infrastructure/tasks/document_tasks.py
@@ -0,0 +1,73 @@
+"""Celery tasks for document processing.
+
+Each task is a thin wrapper that retrieves the already-stored document
+binary and delegates to DocumentCommandService._process_document.
+The task does not accept raw file bytes — it reads them from the binary
+store using the doc_id, so the Celery message payload stays small.
+"""
+
+from __future__ import annotations
+
+from loguru import logger
+
+from app.infrastructure.tasks.celery_app import celery_app
+
+
+@celery_app.task(
+    name="app.infrastructure.tasks.document_tasks.process_document_task",
+    bind=True,
+    max_retries=3,
+    default_retry_delay=30,
+    acks_late=True,
+)
+def process_document_task(
+    self,
+    doc_id: str,
+    file_name: str,
+    doc_name: str,
+    regulation_type: str,
+    version: str,
+    generate_summary: bool,
+    run_id: str | None = None,
+) -> dict:
+    """Parse, embed, and index a document that has already been stored.
+
+    The task reads the file binary from MinIO using doc_id so the Celery
+    message stays small. Retries up to 3 times with a 30-second delay on
+    transient infrastructure errors.
+    """
+    # Import inside the task function to avoid pickling issues and to ensure
+    # that each worker process initialises its own bootstrap singletons.
+    from app.shared.bootstrap import get_document_command_service, get_document_query_service
+
+    logger.info("process_document_task started: doc_id={}", doc_id)
+    try:
+        svc = get_document_command_service()
+        doc = get_document_query_service().get(doc_id)
+        if not doc:
+            raise ValueError(f"Document record not found: {doc_id}")
+
+        # Read the stored binary from MinIO — avoids passing raw bytes in the task message.
+        content = svc.binary_store.read(doc.object_name)
+
+        result = svc._process_document(
+            doc_id=doc_id,
+            file_name=file_name,
+            final_doc_name=doc_name,
+            content=content,
+            regulation_type=regulation_type,
+            version=version,
+            generate_summary=generate_summary,
+            run_id=run_id,
+        )
+        logger.info(
+            "process_document_task completed: doc_id={} status={} chunks={}",
+            doc_id, result.status, result.num_chunks,
+        )
+        return {"doc_id": result.doc_id, "status": result.status, "num_chunks": result.num_chunks}
+
+    except Exception as exc:
+        logger.exception("process_document_task failed: doc_id={}", doc_id)
+        # Retry on transient errors; permanent errors (bad file, parse failure)
+        # will exhaust retries and leave the document in FAILED state.
+        raise self.retry(exc=exc)
--- a/backend/app/infrastructure/vectorstore/pass_through_reranker.py
+++ b/backend/app/infrastructure/vectorstore/pass_through_reranker.py
@@ -0,0 +1,21 @@
+"""No-op reranker stub.
+
+Returns the original candidate list sliced to top_k.
+Replace with CrossEncoderReranker when a local cross-encoder model is available.
+"""
+from __future__ import annotations
+
+from app.domain.retrieval.models import RetrievedChunk
+from app.domain.retrieval.ports import Reranker
+
+
+class PassThroughReranker(Reranker):
+    """Pass-through reranker that preserves original retrieval order.
+
+    Acts as a placeholder for future cross-encoder reranking (e.g. ms-marco-MiniLM).
+    Wire via bootstrap.get_compliance_reranker() when ready to swap.
+    """
+
+    def rerank(self, query: str, chunks: list[RetrievedChunk], top_k: int) -> list[RetrievedChunk]:
+        """Return the first top_k chunks without reordering."""
+        return chunks[:top_k]
--- a/backend/app/shared/bootstrap.py
+++ b/backend/app/shared/bootstrap.py
@@ -19,6 +19,15 @@ from app.infrastructure.parser.local_chunk_builder import LocalRegulationChunkBu
 from app.infrastructure.parser.local_document_parser import LocalDocumentParser
 from app.infrastructure.parser.vector_chunk_builder import AliyunVectorChunkBuilder
 from app.infrastructure.perception.mock_event_store import MockEventStore
+from app.application.perception.crawl_service import CrawlService
+from app.infrastructure.perception.base_event_store import BaseEventStore
+from app.infrastructure.perception.crawlers.catarc_crawler import CatarcCrawler
+from app.infrastructure.perception.crawlers.guobiao_crawler import (
+    GuobiaoMandatoryCrawler,
+    GuobiaoRecommendedCrawler,
+)
+from app.infrastructure.perception.crawlers.eurlex_crawler import EurlexCrawler
+from app.infrastructure.perception.llm_pipeline import LlmPipeline
 from app.infrastructure.session.in_memory_conversation_store import InMemoryConversationStore
 from app.infrastructure.storage.json_document_processing_store import JsonDocumentProcessingStore
 from app.infrastructure.storage.json_document_repository import JsonDocumentRepository
@@ -31,6 +40,8 @@ from app.infrastructure.vectorstore.cross_encoder_reranker import OpenAICompatib
 from app.infrastructure.vectorstore.dense_retriever import DenseRetriever
 from app.infrastructure.vectorstore.milvus_vector_index import MilvusVectorIndex
 from app.services.llm.llm_factory import LLMFactory
+from app.domain.compliance.ports import ComplianceRepository
+from app.infrastructure.compliance.repository import PostgresComplianceRepository
 # Keep shared wiring centralized so dependency construction remains consistent.


@@ -252,7 +263,31 @@ def get_document_query_service() -> DocumentQueryService:

@lru_cache
 def get_conversation_store() -> InMemoryConversationStore:
-    """Return conversation store."""
+    """Return the active conversation store based on settings.
+
+    When session_backend='redis', sessions survive backend restarts and scale
+    across multiple API worker processes. When session_backend='memory' (default),
+    sessions are process-local and lost on restart.
+    """
+    if settings.session_backend == "redis":
+        import redis as redis_lib
+        from app.infrastructure.session.redis_conversation_store import RedisConversationStore
+
+        # Build the Redis client from the same connection settings used by Celery.
+        kwargs: dict = {
+            "host": settings.redis_host,
+            "port": settings.redis_port,
+            "db": settings.redis_db,
+            "decode_responses": False,
+        }
+        if settings.redis_password:
+            kwargs["password"] = settings.redis_password
+
+        redis_client = redis_lib.Redis(**kwargs)
+        return RedisConversationStore(  # type: ignore[return-value]
+            redis_client=redis_client,
+            timeout_seconds=settings.session_timeout_minutes * 60,
+        )
    return InMemoryConversationStore(
        max_sessions=settings.session_max_sessions,
        timeout_minutes=settings.session_timeout_minutes,
@@ -269,11 +304,57 @@ def get_agent_conversation_service() -> AgentConversationService:
    )


+@lru_cache
+def get_event_store() -> BaseEventStore:
+    """Return event store selected by DOCUMENT_REPOSITORY_BACKEND setting."""
+    if settings.document_repository_backend == "postgres":
+        from app.infrastructure.perception.postgres_event_store import PostgresEventStore
+        return PostgresEventStore()
+    return MockEventStore()
+
+
+@lru_cache
+def get_compliance_repository() -> ComplianceRepository:
+    """Return the compliance analysis repository.
+
+    Requires document_repository_backend=postgres and valid postgres_* settings.
+    Raises NotImplementedError for any other backend value.
+    """
+    if settings.document_repository_backend != "postgres":
+        raise NotImplementedError(
+            f"ComplianceRepository requires document_repository_backend=postgres, "
+            f"got '{settings.document_repository_backend}'. "
+            "Set DOCUMENT_REPOSITORY_BACKEND=postgres in your .env file."
+        )
+    return PostgresComplianceRepository(
+        host=settings.postgres_host,
+        port=settings.postgres_port,
+        user=settings.postgres_user,
+        password=settings.postgres_password,
+        dbname=settings.postgres_db,
+    )
+
+
@lru_cache
 def get_perception_service() -> PerceptionService:
-    """Return perception service for regulatory intelligence."""
    return PerceptionService(
-        event_store=MockEventStore(),
+        event_store=get_event_store(),
+        retrieval_service=get_retrieval_service(),
+    )
+
+
+@lru_cache
+def get_crawl_service() -> CrawlService:
+    crawlers = {
+        "CATARC": CatarcCrawler(),
+        "国标委·强制性": GuobiaoMandatoryCrawler(),
+        "国标委·推荐性": GuobiaoRecommendedCrawler(),
+        "EUR-Lex": EurlexCrawler(),
+    }
+    return CrawlService(
+        crawlers=crawlers,
+        event_store=get_event_store(),
+        llm_pipeline=LlmPipeline(),
        retrieval_service=get_retrieval_service(),
    )

@@ -284,6 +365,35 @@ def get_agent_session_service() -> AgentSessionService:
    return AgentSessionService(conversation_store=get_conversation_store())


+@lru_cache
+def get_celery_app():
+    """Return the shared Celery application instance.
+
+    Imported lazily so Celery is not required when running without workers
+    (e.g., tests that mock bootstrap or dev without Redis).
+    """
+    from app.infrastructure.tasks.celery_app import celery_app
+    return celery_app
+
+
+@lru_cache
+def get_jwt_handler():
+    """Return the shared JWTHandler instance for token creation and validation."""
+    from app.infrastructure.auth.jwt_handler import JWTHandler
+    return JWTHandler(
+        secret_key=settings.auth_secret_key,
+        algorithm=settings.auth_algorithm,
+        expire_minutes=settings.auth_token_expire_minutes,
+    )
+
+
+@lru_cache
+def get_user_store():
+    """Return the PostgreSQL user store (lazy-connects on first call)."""
+    from app.infrastructure.auth.user_store import PostgresUserStore
+    return PostgresUserStore()
+
+
 def preload_runtime_dependencies() -> None:
    """Warm dependencies that are safe and useful to preload during startup."""
    LLMFactory.preload_clients(["qwen", "deepseek"])
--- a/backend/requirements.txt
+++ b/backend/requirements.txt
@@ -1,30 +1,48 @@
+# ── Web framework ─────────────────────────────────────────────────────────────
 fastapi>=0.110.0
 uvicorn[standard]>=0.27.0
 python-multipart>=0.0.9

+# ── Config & utilities ────────────────────────────────────────────────────────
 pydantic>=2.0.0
 pydantic-settings>=2.0.0
 python-dotenv>=1.0.0
 loguru>=0.7.0
-
 httpx>=0.25.0
+beautifulsoup4>=4.12.0
+lxml>=5.0.0
 tiktoken>=0.5.0
 tenacity>=8.2.0

+# ── Auth ──────────────────────────────────────────────────────────────────────
+python-jose[cryptography]>=3.3.0
+# passlib is incompatible with bcrypt>=4.0 (removed __about__, strict 72-byte limit).
+# Pin bcrypt to 3.x until passlib ships a fix.
+passlib[bcrypt]>=1.7.4
+bcrypt>=3.2.0,<4.0.0
+
+# ── Async task queue ──────────────────────────────────────────────────────────
+celery>=5.3.0
+redis>=4.5.0
+
+# ── Storage & databases ───────────────────────────────────────────────────────
 pymilvus>=2.4.0
 minio>=7.1.0
 psycopg2-binary>=2.9.0

+# ── Document parsing ─────────────────────────────────────────────────────────
 pymupdf>=1.24.0
 python-docx>=1.1.0
-
-numpy>=1.24.0
 alibabacloud-docmind-api20220711>=1.0.6
 alibabacloud-tea-openapi>=0.3.11
 alibabacloud-tea-util>=0.3.13

+# ── RAG / LangChain ───────────────────────────────────────────────────────────
 langchain>=0.1.0
 langchain-milvus>=0.1.0
+numpy>=1.24.0

+# ── Testing ───────────────────────────────────────────────────────────────────
 pytest>=7.4.0
 pytest-asyncio>=0.21.0
+fakeredis>=2.0.0
--- a/backend/tests/compliance/init.py
+++ b/backend/tests/compliance/init.py
--- a/backend/tests/compliance/test_pipeline.py
+++ b/backend/tests/compliance/test_pipeline.py
@@ -0,0 +1,140 @@
+import asyncio
+
+import pytest
+from unittest.mock import MagicMock, patch
+from datetime import datetime
+
+from app.infrastructure.vectorstore.pass_through_reranker import PassThroughReranker
+from app.domain.retrieval.models import RetrievedChunk
+from app.domain.compliance.ports import AnalysisRecord, FindingRecord
+
+
+# ── helpers ──────────────────────────────────────────────────────────────────
+
+def _make_chunk(score: float) -> RetrievedChunk:
+    return RetrievedChunk(
+        chunk_id="c1",
+        doc_id="d1",
+        doc_title="Test Doc",
+        section_title="S1",
+        text="some text",
+        score=score,
+        page_start=1,
+    )
+
+
+def _make_mock_client(content: str = '{"status":"ok","title":"T","desc":"D","clause_ref":"A1"}'):
+    client = MagicMock()
+    response = MagicMock()
+    response.is_success = True
+    response.content = content
+    client.chat.return_value = response
+    return client
+
+
+def _make_mock_retrieval():
+    svc = MagicMock()
+    svc.retrieve.return_value = []
+    return svc
+
+
+# ── existing tests ────────────────────────────────────────────────────────────
+
+def test_pass_through_returns_top_k():
+    reranker = PassThroughReranker()
+    chunks = [_make_chunk(0.9), _make_chunk(0.8), _make_chunk(0.7)]
+    result = reranker.rerank(query="test", chunks=chunks, top_k=2)
+    assert len(result) == 2
+    assert result[0].score == 0.9
+
+
+def test_pass_through_returns_all_when_top_k_exceeds():
+    reranker = PassThroughReranker()
+    chunks = [_make_chunk(0.5)]
+    result = reranker.rerank(query="test", chunks=chunks, top_k=10)
+    assert len(result) == 1
+
+
+# ── new tests ─────────────────────────────────────────────────────────────────
+
+def test_process_single_clause_returns_finding():
+    from app.application.compliance.pipeline import process_single_clause
+    client = _make_mock_client()
+    svc = _make_mock_retrieval()
+    result = process_single_clause("test clause", 0, svc, client)
+    assert result["finding"] is not None
+    assert result["index"] == 0
+    assert result["chunks"] == []
+
+
+def test_run_clauses_parallel_runs_all():
+    from app.application.compliance.pipeline import run_clauses_parallel
+    client = _make_mock_client()
+    svc = _make_mock_retrieval()
+    clauses = ["clause one", "clause two", "clause three"]
+    results = asyncio.run(run_clauses_parallel(clauses, svc, client))
+    assert len(results) == 3
+    assert all(r["index"] == i for i, r in enumerate(results))
+
+
+def test_run_clauses_parallel_handles_clause_failure():
+    from app.application.compliance.pipeline import run_clauses_parallel
+    svc = _make_mock_retrieval()
+    bad_client = MagicMock()
+    bad_client.chat.side_effect = RuntimeError("LLM exploded")
+    results = asyncio.run(run_clauses_parallel(
+        ["clause one", "clause two"], svc, bad_client
+    ))
+    assert len(results) == 2
+    assert all(r["finding"] is None for r in results)
+    assert all(r["chunks"] == [] for r in results)
+
+
+# ── helpers for new tests ─────────────────────────────────────────────────────
+
+def _sample_analysis() -> AnalysisRecord:
+    return AnalysisRecord(
+        id="a1", created_at=datetime(2026, 6, 8), created_by="u",
+        doc_name="doc.pdf", standard_name="EU AI Act",
+        risk_score=72, conclusion="Gaps found.", actions=[], para_text="para",
+        highlight_terms=[], findings=[],
+    )
+
+
+def _sample_finding(status: str = "risk") -> FindingRecord:
+    return FindingRecord(
+        id="f1", analysis_id="a1", seq=0,
+        title="Missing CSMS", description="No CSMS certification.",
+        status=status, clause_ref="Art.9.1",
+    )
+
+
+# ── new tests ─────────────────────────────────────────────────────────────────
+
+def test_build_finding_context_contains_required_fields():
+    from app.application.compliance.pipeline import build_finding_context
+    ctx = build_finding_context(_sample_finding(), _sample_analysis())
+    assert "doc.pdf" in ctx
+    assert "EU AI Act" in ctx
+    assert "Missing CSMS" in ctx
+    assert "Art.9.1" in ctx
+
+
+def test_generate_suggestions_returns_three_questions():
+    from app.application.compliance.pipeline import generate_suggestions
+    client = _make_mock_client(
+        '{"questions": ["Q1?", "Q2?", "Q3?"]}'
+    )
+    questions = generate_suggestions(_sample_finding("risk"), _sample_analysis(), client)
+    assert len(questions) == 3
+    assert all(isinstance(q, str) for q in questions)
+
+
+def test_generate_suggestions_falls_back_on_error():
+    from app.application.compliance.pipeline import generate_suggestions
+    bad_client = MagicMock()
+    bad_resp = MagicMock()
+    bad_resp.is_success = False
+    bad_client.chat.return_value = bad_resp
+    questions = generate_suggestions(_sample_finding(), _sample_analysis(), bad_client)
+    assert len(questions) == 3  # fallback always returns 3
--- a/backend/tests/compliance/test_repository.py
+++ b/backend/tests/compliance/test_repository.py
@@ -0,0 +1,98 @@
+from unittest.mock import MagicMock, patch
+from datetime import datetime
+from app.domain.compliance.ports import (
+    AnalysisRecord,
+    FindingRecord,
+    ComplianceRepository,
+)
+
+
+def _mock_pool():
+    """Return a mock psycopg2 ThreadedConnectionPool."""
+    conn = MagicMock()
+    cursor = MagicMock()
+    cursor.__enter__ = MagicMock(return_value=cursor)
+    cursor.__exit__ = MagicMock(return_value=False)
+    conn.cursor.return_value = cursor
+    pool = MagicMock()
+    pool.getconn.return_value = conn
+    return pool, conn, cursor
+
+
+@patch("app.infrastructure.compliance.repository.psycopg2.pool.ThreadedConnectionPool")
+def test_save_analysis_returns_uuid(mock_pool_cls):
+    from app.infrastructure.compliance.repository import PostgresComplianceRepository
+    pool, conn, cursor = _mock_pool()
+    mock_pool_cls.return_value = pool
+    cursor.fetchone.return_value = {"id": "abc-123"}
+
+    repo = PostgresComplianceRepository(
+        host="localhost", port=5432, user="u", password="p", dbname="db"
+    )
+    record = AnalysisRecord(
+        id="", created_at=datetime.utcnow(), created_by="user1",
+        doc_name="doc.pdf", standard_name="EU AI Act",
+        risk_score=50, conclusion="OK", actions=[], para_text="p",
+        highlight_terms=[], findings=[],
+    )
+    result = repo.save_analysis(record)
+    assert result == "abc-123"
+
+
+def test_analysis_record_construction():
+    record = AnalysisRecord(
+        id="",
+        created_at=datetime.utcnow(),
+        created_by="user1",
+        doc_name="test.pdf",
+        standard_name="EU AI Act",
+        risk_score=72,
+        conclusion="Several gaps found.",
+        actions=[{"label": "Fix", "value": "Update docs"}],
+        para_text="The system shall...",
+        highlight_terms=["CSMS", "ISO 21434"],
+        findings=[
+            FindingRecord(
+                id="",
+                analysis_id="",
+                seq=0,
+                title="Missing CSMS",
+                description="No CSMS certification found.",
+                status="risk",
+                clause_ref="Art.9.1",
+            )
+        ],
+    )
+    assert record.doc_name == "test.pdf"
+    assert len(record.findings) == 1
+    assert record.findings[0].status == "risk"
+
+
+def test_compliance_repository_is_abstract():
+    import inspect
+    assert inspect.isabstract(ComplianceRepository)
+
+
+def test_generate_docx_returns_bytes():
+    from app.infrastructure.compliance.docx_export import generate_docx
+    record = AnalysisRecord(
+        id="test-id", created_at=datetime(2026, 6, 8), created_by="user1",
+        doc_name="test.pdf", standard_name="EU AI Act",
+        risk_score=72, conclusion="Several gaps found.",
+        actions=[{"label": "Fix", "value": "Update CSMS docs"}],
+        para_text="The system shall implement CSMS.",
+        highlight_terms=["CSMS"],
+        findings=[
+            FindingRecord(
+                id="f1", analysis_id="test-id", seq=0,
+                title="Missing CSMS", description="No CSMS cert.",
+                status="risk", clause_ref="Art.9.1",
+            )
+        ],
+    )
+    data = generate_docx(record)
+    assert isinstance(data, bytes)
+    assert len(data) > 1000  # DOCX is at minimum a ZIP with ~1 KB overhead
+    # Verify it's a valid ZIP (DOCX = ZIP container)
+    import zipfile, io
+    assert zipfile.is_zipfile(io.BytesIO(data))
--- a/backend/tests/perception/init.py
+++ b/backend/tests/perception/init.py
--- a/backend/tests/perception/test_base_event_store.py
+++ b/backend/tests/perception/test_base_event_store.py
@@ -0,0 +1,95 @@
+"""Contract tests: any BaseEventStore implementation must pass these."""
+from app.infrastructure.perception.base_event_store import BaseEventStore
+from app.infrastructure.perception.mock_event_store import MockEventStore
+
+
+def _store() -> BaseEventStore:
+    return MockEventStore()
+
+
+def test_is_base_event_store():
+    assert isinstance(_store(), BaseEventStore)
+
+
+def test_all_returns_list():
+    result = _store().all()
+    assert isinstance(result, list)
+    assert len(result) > 0
+
+
+def test_get_known_id():
+    store = _store()
+    first = store.all()[0]
+    result = store.get(first["id"])
+    assert result is not None
+    assert result["id"] == first["id"]
+
+
+def test_get_unknown_returns_none():
+    assert _store().get("does-not-exist") is None
+
+
+def test_filter_by_impact():
+    store = _store()
+    highs = store.filter(impact_level="high", limit=100)
+    assert all(e["impact_level"] == "high" for e in highs)
+
+
+def test_filter_limit():
+    store = _store()
+    result = store.filter(limit=3)
+    assert len(result) <= 3
+
+
+def test_stats_keys():
+    stats = _store().stats()
+    for key in ("total", "high_impact", "medium_impact", "recent_90d"):
+        assert key in stats, f"missing key: {key}"
+
+
+def test_upsert_and_get():
+    store = _store()
+    event = {
+        "id": "test-upsert-001",
+        "source": "TEST",
+        "source_label": "Test Source",
+        "standard_code": "TST-001",
+        "title": "Test Event",
+        "summary": "A test event",
+        "full_text_url": "https://example.com",
+        "status": "draft",
+        "impact_level": "low",
+        "published_at": "2026-01-01",
+        "effective_at": None,
+        "category": "test",
+        "tags": ["test"],
+        "content_hash": "abc123",
+        "previous_hash": None,
+    }
+    store.upsert(event)
+    result = store.get("test-upsert-001")
+    assert result is not None
+    assert result["title"] == "Test Event"
+
+
+def test_get_by_standard_code():
+    store = _store()
+    first = store.all()[0]
+    result = store.get_by_standard_code(first["standard_code"])
+    assert result is not None
+    assert result["standard_code"] == first["standard_code"]
+
+
+def test_upsert_updates_existing():
+    store = _store()
+    first = store.all()[0]
+    original_id = first["id"]
+    store.upsert({"id": original_id, "title": "Updated Title", "impact_level": first["impact_level"],
+                  "standard_code": first.get("standard_code", ""), "source": first["source"],
+                  "source_label": first.get("source_label", ""), "summary": "Updated",
+                  "full_text_url": "", "status": first["status"], "published_at": first.get("published_at", ""),
+                  "effective_at": None, "category": first.get("category", ""), "tags": [],
+                  "content_hash": "newhash", "previous_hash": None})
+    result = store.get(original_id)
+    assert result is not None
+    assert result["title"] == "Updated Title"
--- a/backend/tests/perception/test_crawl_service.py
+++ b/backend/tests/perception/test_crawl_service.py
@@ -0,0 +1,111 @@
+"""Integration tests for CrawlService."""
+from __future__ import annotations
+from unittest.mock import MagicMock
+import hashlib
+import pytest
+
+from app.infrastructure.perception.crawlers.base import RawEvent
+from app.infrastructure.perception.mock_event_store import MockEventStore
+
+
+def _make_raw_event(code="TST-001"):
+    return RawEvent(
+        source="TEST", source_label="Test", standard_code=code,
+        title=f"Test {code}", summary="Summary", full_text_url="https://example.com",
+        status="enacted", published_at="2026-01-01", effective_at=None,
+        category="test", tags=["test"], raw_text="full text",
+    )
+
+
+def _make_service(raw_events):
+    from app.application.perception.crawl_service import CrawlService
+
+    mock_crawler = MagicMock()
+    mock_crawler.fetch.return_value = raw_events
+
+    mock_pipeline = MagicMock()
+    mock_pipeline.extract_structure.return_value = {
+        "obligations": [], "deadlines": [], "scope": "test",
+        "penalties": None, "impact_level": "low",
+    }
+    mock_pipeline.assess_impact.return_value = []
+    mock_pipeline.compute_diff.return_value = {
+        "changed_sections": [], "change_summary": "No changes.",
+    }
+
+    mock_retrieval = MagicMock()
+    store = MockEventStore()
+
+    return CrawlService(
+        crawlers={"TEST": mock_crawler},
+        event_store=store,
+        llm_pipeline=mock_pipeline,
+        retrieval_service=mock_retrieval,
+    )
+
+
+def test_crawl_yields_progress_and_done():
+    svc = _make_service([_make_raw_event("TST-001")])
+    events = list(svc.run_crawl())
+    event_types = [e.get("event") for e in events]
+    assert "done" in event_types
+
+
+def test_crawl_upserts_to_store():
+    store = MockEventStore()
+    from app.application.perception.crawl_service import CrawlService
+    mock_crawler = MagicMock()
+    mock_crawler.fetch.return_value = [_make_raw_event("NEW-001")]
+    mock_pipeline = MagicMock()
+    mock_pipeline.extract_structure.return_value = {
+        "obligations": [], "deadlines": [], "scope": "",
+        "penalties": None, "impact_level": "medium",
+    }
+    mock_pipeline.assess_impact.return_value = []
+    mock_pipeline.compute_diff.return_value = {
+        "changed_sections": [], "change_summary": "",
+    }
+    svc = CrawlService(
+        crawlers={"TEST": mock_crawler},
+        event_store=store,
+        llm_pipeline=mock_pipeline,
+        retrieval_service=MagicMock(),
+    )
+    list(svc.run_crawl())
+    result = store.get_by_standard_code("NEW-001")
+    assert result is not None
+    assert result["title"] == "Test NEW-001"
+
+
+def test_crawl_skips_unchanged_events():
+    store = MockEventStore()
+    raw = _make_raw_event("SKIP-001")
+    content_hash = hashlib.sha256(raw.raw_text.encode()).hexdigest()
+    store.upsert({
+        "id": hashlib.sha256(f"TEST-SKIP-001".encode()).hexdigest()[:12],
+        "standard_code": "SKIP-001",
+        "source": "TEST",
+        "source_label": "Test",
+        "title": "Test SKIP-001",
+        "summary": "",
+        "full_text_url": "",
+        "status": "enacted",
+        "impact_level": "low",
+        "published_at": "2026-01-01",
+        "effective_at": None,
+        "category": "test",
+        "tags": [],
+        "content_hash": content_hash,
+    })
+    mock_pipeline = MagicMock()
+    from app.application.perception.crawl_service import CrawlService
+    mock_crawler = MagicMock()
+    mock_crawler.fetch.return_value = [raw]
+    svc = CrawlService(
+        crawlers={"TEST": mock_crawler},
+        event_store=store,
+        llm_pipeline=mock_pipeline,
+        retrieval_service=MagicMock(),
+    )
+    list(svc.run_crawl())
+    mock_pipeline.extract_structure.assert_not_called()
--- a/backend/tests/perception/test_crawlers.py
+++ b/backend/tests/perception/test_crawlers.py
@@ -0,0 +1,127 @@
+"""Unit tests for crawlers — mock httpx responses."""
+from __future__ import annotations
+from unittest.mock import MagicMock, patch
+import pytest
+
+from app.infrastructure.perception.crawlers.base import RawEvent, BaseCrawler
+
+
+def test_raw_event_fields():
+    ev = RawEvent(
+        source="TEST",
+        source_label="Test",
+        standard_code="TST-001",
+        title="Test",
+        summary="Summary",
+        full_text_url="https://example.com",
+        status="enacted",
+        published_at="2026-01-01",
+        effective_at=None,
+        category="test",
+        tags=["a"],
+        raw_text="full text here",
+    )
+    assert ev.source == "TEST"
+    assert ev.tags == ["a"]
+
+
+CATARC_HTML = """
+<html><body>
+<table>
+<tr>
+  <td><a href="/std/detail/123">GB 18384-2025</a></td>
+  <td>电动汽车安全要求</td>
+  <td>2025-11-15</td>
+  <td>现行</td>
+</tr>
+<tr>
+  <td><a href="/std/detail/456">GB/T 40429-2026</a></td>
+  <td>汽车驾驶自动化分级</td>
+  <td>2026-02-01</td>
+  <td>即将实施</td>
+</tr>
+</table>
+</body></html>
+"""
+
+
+def test_catarc_crawler_parses_html():
+    from app.infrastructure.perception.crawlers.catarc_crawler import CatarcCrawler
+
+    mock_resp = MagicMock()
+    mock_resp.status_code = 200
+    mock_resp.text = CATARC_HTML
+    mock_resp.raise_for_status = MagicMock()
+
+    with patch("httpx.get", return_value=mock_resp):
+        crawler = CatarcCrawler()
+        events = crawler.fetch(limit=10)
+
+    assert isinstance(events, list)
+    assert len(events) >= 1
+    assert all(isinstance(e, RawEvent) for e in events)
+    codes = [e.standard_code for e in events]
+    assert "GB 18384-2025" in codes
+
+
+GUOBIAO_JSON = {
+    "rows": [
+        {
+            "std_code": "GB 18384-2025",
+            "std_name": "电动汽车安全要求",
+            "release_date": "2025-11-15",
+            "implement_date": "2026-07-01",
+            "std_status": "现行",
+            "std_type": "强制性",
+        },
+    ]
+}
+
+
+def test_guobiao_crawler_parses_json():
+    from app.infrastructure.perception.crawlers.guobiao_crawler import GuobiaoMandatoryCrawler
+
+    mock_resp = MagicMock()
+    mock_resp.status_code = 200
+    mock_resp.json.return_value = GUOBIAO_JSON
+    mock_resp.raise_for_status = MagicMock()
+
+    with patch("httpx.get", return_value=mock_resp):
+        crawler = GuobiaoMandatoryCrawler()
+        events = crawler.fetch(limit=10)
+
+    assert len(events) >= 1
+    assert events[0].source == "国标委"
+    assert events[0].standard_code == "GB 18384-2025"
+
+
+EURLEX_RSS = """<?xml version="1.0" encoding="UTF-8"?>
+<rss version="2.0">
+  <channel>
+    <title>EUR-Lex</title>
+    <item>
+      <title>Regulation (EU) 2024/1689 — AI Act</title>
+      <link>https://eur-lex.europa.eu/legal-content/EN/TXT/?uri=CELEX:32024R1689</link>
+      <description>The EU Artificial Intelligence Act enters into force.</description>
+      <pubDate>Fri, 12 Jul 2024 00:00:00 GMT</pubDate>
+    </item>
+  </channel>
+</rss>"""
+
+
+def test_eurlex_crawler_parses_rss():
+    from app.infrastructure.perception.crawlers.eurlex_crawler import EurlexCrawler
+
+    mock_resp = MagicMock()
+    mock_resp.status_code = 200
+    mock_resp.text = EURLEX_RSS
+    mock_resp.content = EURLEX_RSS
+    mock_resp.raise_for_status = MagicMock()
+
+    with patch("httpx.get", return_value=mock_resp):
+        crawler = EurlexCrawler()
+        events = crawler.fetch(limit=5)
+
+    assert isinstance(events, list)
+    assert len(events) >= 1
+    assert events[0].source == "EUR-Lex"
--- a/backend/tests/perception/test_llm_pipeline.py
+++ b/backend/tests/perception/test_llm_pipeline.py
@@ -0,0 +1,77 @@
+"""Unit tests for LlmPipeline — mock LLM client and embedding provider."""
+from __future__ import annotations
+from unittest.mock import MagicMock, patch
+import json
+import pytest
+
+
+def _make_pipeline():
+    with patch("app.infrastructure.perception.llm_pipeline.get_llm_client") as mock_llm_fn, \
+         patch("app.infrastructure.perception.llm_pipeline.OpenAICompatibleEmbeddingProvider") as mock_emb_cls:
+
+        mock_client = MagicMock()
+        mock_client.chat.return_value = MagicMock(content='{"obligations":[{"text":"test obligation","deontic":"must","subject":"OEM","object":"system","condition":""}],"deadlines":[{"date":"2026-07-01","description":"实施截止"}],"scope":"适用于M1类车辆","penalties":"罚款","impact_level":"high"}')
+        mock_llm_fn.return_value = mock_client
+
+        mock_emb = MagicMock()
+        mock_emb.embed_texts.return_value = [[0.1] * 1024, [0.9] * 1024]
+        mock_emb_cls.return_value = mock_emb
+
+        from app.infrastructure.perception.llm_pipeline import LlmPipeline
+        return LlmPipeline(), mock_client, mock_emb
+
+
+def test_extract_structure_returns_dict():
+    pipeline, mock_client, _ = _make_pipeline()
+    event = {
+        "id": "evt-001",
+        "standard_code": "GB 18384-2025",
+        "title": "电动汽车安全要求",
+        "summary": "新增 IP67 级别防护",
+        "source_label": "CATARC",
+        "tags": ["电池安全"],
+    }
+    result = pipeline.extract_structure(event)
+    assert isinstance(result, dict)
+    assert "obligations" in result
+    assert "impact_level" in result
+
+
+def test_assess_impact_returns_list():
+    pipeline, mock_client, _ = _make_pipeline()
+    mock_client.chat.return_value = MagicMock(content='[{"doc_id":"d1","doc_name":"Safety Manual","score":0.85,"key_clauses":"§4.2","recommendation":"更新第4章"}]')
+    mock_retrieval = MagicMock()
+    chunk = MagicMock()
+    chunk.doc_id = "d1"
+    chunk.doc_title = "Safety Manual"
+    chunk.score = 0.85
+    chunk.text = "relevant text"
+    chunk.section_title = "§4.2"
+    mock_retrieval.retrieve.return_value = [chunk]
+    event = {
+        "standard_code": "GB 18384-2025",
+        "title": "电动汽车安全要求",
+        "obligations": [{"text": "OEM shall comply"}],
+    }
+    result = pipeline.assess_impact(event, mock_retrieval)
+    assert isinstance(result, list)
+
+
+def test_compute_diff_no_change():
+    pipeline, _, mock_emb = _make_pipeline()
+    mock_emb.embed_texts.return_value = [[0.5] * 1024, [0.5] * 1024]
+    result = pipeline.compute_diff("paragraph one", "paragraph one")
+    assert isinstance(result, dict)
+    assert "changed_sections" in result
+    assert "change_summary" in result
+
+
+def test_compute_diff_detects_change():
+    pipeline, mock_client, mock_emb = _make_pipeline()
+    mock_emb.embed_texts.return_value = [
+        [1.0] + [0.0] * 1023,
+        [0.0] + [1.0] + [0.0] * 1022,
+    ]
+    mock_client.chat.return_value = MagicMock(content='{"change_type":"tightened","summary":"Requirement tightened"}')
+    result = pipeline.compute_diff("old paragraph text", "new tighter requirement text")
+    assert isinstance(result["changed_sections"], list)
--- a/backend/tests/perception/test_postgres_event_store.py
+++ b/backend/tests/perception/test_postgres_event_store.py
@@ -0,0 +1,98 @@
+"""Unit tests for PostgresEventStore using a mocked psycopg2 pool."""
+from __future__ import annotations
+import json
+from unittest.mock import MagicMock, patch
+import pytest
+
+# Patch psycopg2 before importing the module under test
+import sys
+mock_psycopg2 = MagicMock()
+mock_psycopg2.extras = MagicMock()
+sys.modules.setdefault("psycopg2", mock_psycopg2)
+sys.modules.setdefault("psycopg2.extras", mock_psycopg2.extras)
+sys.modules.setdefault("psycopg2.pool", MagicMock())
+
+from app.infrastructure.perception.base_event_store import BaseEventStore
+
+
+SAMPLE_ROW = {
+    "id": "pg-001",
+    "source": "国标委",
+    "source_label": "国家标准化管理委员会",
+    "standard_code": "GB 18384-2025",
+    "title": "电动汽车安全要求",
+    "summary": "新增要求",
+    "full_text_url": "https://openstd.samr.gov.cn",
+    "status": "enacted",
+    "impact_level": "high",
+    "published_at": "2025-11-15",
+    "effective_at": "2026-07-01",
+    "category": "电动汽车安全",
+    "tags": ["电池安全"],
+    "obligations": None,
+    "deadlines": None,
+    "scope": None,
+    "penalties": None,
+    "content_hash": "abc123",
+    "previous_hash": None,
+    "change_summary": None,
+    "changed_sections": None,
+    "affected_docs": None,
+    "crawled_at": "2026-06-05T10:00:00+00:00",
+    "processed_at": None,
+    "raw_storage_key": None,
+}
+
+
+def _make_store_with_pool(mock_pool):
+    with patch("psycopg2.pool.ThreadedConnectionPool", return_value=mock_pool):
+        with patch(
+            "app.infrastructure.perception.postgres_event_store.PostgresEventStore._ensure_schema"
+        ):
+            from app.infrastructure.perception.postgres_event_store import PostgresEventStore
+            return PostgresEventStore()
+
+
+def _cursor_returning(rows):
+    cursor = MagicMock()
+    cursor.__enter__ = lambda s: s
+    cursor.__exit__ = MagicMock(return_value=False)
+    cursor.fetchall.return_value = rows
+    cursor.fetchone.return_value = rows[0] if rows else None
+    return cursor
+
+
+def test_is_base_event_store():
+    mock_pool = MagicMock()
+    store = _make_store_with_pool(mock_pool)
+    assert isinstance(store, BaseEventStore)
+
+
+def test_filter_returns_list():
+    mock_pool = MagicMock()
+    conn = MagicMock()
+    conn.__enter__ = lambda s: s
+    conn.__exit__ = MagicMock(return_value=False)
+    cursor = _cursor_returning([SAMPLE_ROW])
+    conn.cursor.return_value = cursor
+    mock_pool.getconn.return_value = conn
+    store = _make_store_with_pool(mock_pool)
+    result = store.filter(limit=10)
+    assert isinstance(result, list)
+
+
+def test_stats_returns_correct_keys():
+    mock_pool = MagicMock()
+    conn = MagicMock()
+    conn.__enter__ = lambda s: s
+    conn.__exit__ = MagicMock(return_value=False)
+    cursor = MagicMock()
+    cursor.__enter__ = lambda s: s
+    cursor.__exit__ = MagicMock(return_value=False)
+    cursor.fetchone.return_value = {"count": 5}
+    conn.cursor.return_value = cursor
+    mock_pool.getconn.return_value = conn
+    store = _make_store_with_pool(mock_pool)
+    stats = store.stats()
+    for key in ("total", "high_impact", "medium_impact", "recent_90d"):
+        assert key in stats
--- a/dev.sh
+++ b/dev.sh
@@ -549,7 +549,7 @@ AI+合规智能中枢统一脚本
 用法:
  ./dev.sh help
  ./dev.sh setup
-  ./dev.sh start [all|api|frontend] [--foreground] [--mode dev|static]
+  ./dev.sh start [all|api|frontend|worker|beat] [--foreground] [--mode dev|static]
  ./dev.sh stop [all|api|frontend]
  ./dev.sh restart [all|api|frontend] [--mode dev|static]
  ./dev.sh status
@@ -563,6 +563,9 @@ AI+合规智能中枢统一脚本
    进行一次性的本地初始化。
    包含 Python 版本检查、.venv 虚拟环境创建、后端依赖安装、前端 npm install、
    以及 6.86.80.8 基础服务端口连通性检查。
+    初始化完成后，首次运行前还需执行:
+      PYTHONPATH=backend .venv/bin/python scripts/seed_users.py
+    以创建 admin/legal/ehs/readonly 四个演示用户。

  start
    启动服务。默认行为等同于 ./dev.sh start all。
@@ -570,6 +573,8 @@ AI+合规智能中枢统一脚本
      all       同时启动 API 和前端。
      api       只启动后端 API。
      frontend  只启动前端。
+      worker    启动 Celery 文档处理 worker（前台运行，需要 Redis）。
+      beat      启动 Celery Beat 定时调度器（前台运行，需要 Redis）。
    可选参数:
      --foreground    仅对 start api 生效，前台运行并开启 --reload，便于调试。
      --mode dev      前端使用 Vite 开发服务器，默认端口 5173。
@@ -578,6 +583,7 @@ AI+合规智能中枢统一脚本
  stop
    停止服务。默认行为等同于 ./dev.sh stop all。
    会优先读取 logs/*.pid，PID 文件失效时会回退到端口探测。
+    注意: worker 和 beat 为前台进程，直接 Ctrl+C 停止。

  restart
    先停止再启动，支持 all/api/frontend。
@@ -601,8 +607,11 @@ AI+合规智能中枢统一脚本

 常用示例:
  ./dev.sh setup
+  PYTHONPATH=backend .venv/bin/python scripts/seed_users.py
  ./dev.sh start
  ./dev.sh start api --foreground
+  ./dev.sh start worker
+  ./dev.sh start beat
  ./dev.sh start frontend --mode static
  ./dev.sh restart frontend --mode dev
  ./dev.sh status
@@ -615,7 +624,7 @@ parse_target() {
    local default_target="$1"
    local candidate="${2:-}"
    case "$candidate" in
-        all|api|frontend)
+        all|api|frontend|worker|beat)
            echo "$candidate"
            ;;
        *)
@@ -646,41 +655,64 @@ main() {
                shift || true
            fi

-            while [ $# -gt 0 ]; do
-                case "$1" in
-                    --foreground)
-                        foreground=true
-                        ;;
-                    --mode)
-                        shift || die "--mode 需要指定 dev 或 static"
-                        mode="$1"
-                        validate_frontend_mode "$mode"
-                        ;;
-                    *)
-                        die "未知参数: $1"
-                        ;;
-                esac
-                shift || true
-            done
-
+            # worker and beat are pass-through — forward remaining args to celery directly.
            case "$target" in
-                all)
-                    [ "$foreground" = false ] || die "start all 不支持 --foreground，请使用 start api --foreground"
-                    print_header "AI+合规智能中枢 - 启动服务"
-                    start_api background
-                    start_frontend "${mode:-$FRONTEND_MODE}"
+                worker)
+                    print_header "AI+合规智能中枢 - 启动 Celery Worker"
+                    require_venv
+                    export PYTHONPATH="backend${PYTHONPATH:+:$PYTHONPATH}"
+                    "$VENV_PYTHON" -m celery -A app.infrastructure.tasks.celery_app worker \
+                        --loglevel=info \
+                        --concurrency=2 \
+                        --queues=celery \
+                        "$@"
                    ;;
-                api)
-                    if [ "$foreground" = true ]; then
-                        start_api foreground
-                    else
-                        print_header "AI+合规智能中枢 - 启动 API"
-                        start_api background
-                    fi
+                beat)
+                    print_header "AI+合规智能中枢 - 启动 Celery Beat"
+                    require_venv
+                    export PYTHONPATH="backend${PYTHONPATH:+:$PYTHONPATH}"
+                    "$VENV_PYTHON" -m celery -A app.infrastructure.tasks.celery_app beat \
+                        --loglevel=info \
+                        "$@"
                    ;;
-                frontend)
-                    print_header "AI+合规智能中枢 - 启动前端"
-                    start_frontend "${mode:-$FRONTEND_MODE}"
+                *)
+                    while [ $# -gt 0 ]; do
+                        case "$1" in
+                            --foreground)
+                                foreground=true
+                                ;;
+                            --mode)
+                                shift || die "--mode 需要指定 dev 或 static"
+                                mode="$1"
+                                validate_frontend_mode "$mode"
+                                ;;
+                            *)
+                                die "未知参数: $1"
+                                ;;
+                        esac
+                        shift || true
+                    done
+
+                    case "$target" in
+                        all)
+                            [ "$foreground" = false ] || die "start all 不支持 --foreground，请使用 start api --foreground"
+                            print_header "AI+合规智能中枢 - 启动服务"
+                            start_api background
+                            start_frontend "${mode:-$FRONTEND_MODE}"
+                            ;;
+                        api)
+                            if [ "$foreground" = true ]; then
+                                start_api foreground
+                            else
+                                print_header "AI+合规智能中枢 - 启动 API"
+                                start_api background
+                            fi
+                            ;;
+                        frontend)
+                            print_header "AI+合规智能中枢 - 启动前端"
+                            start_frontend "${mode:-$FRONTEND_MODE}"
+                            ;;
+                    esac
                    ;;
            esac
            ;;
--- a/docker/docker-compose.yml
+++ b/docker/docker-compose.yml
@@ -58,7 +58,8 @@ services:
      retries: 5
    restart: unless-stopped

-  # PostgreSQL数据库 (可选，启用 DOCUMENT_REPOSITORY_BACKEND=postgres 时使用)
+  # PostgreSQL数据库 (启用 DOCUMENT_REPOSITORY_BACKEND=postgres 时使用；
+  # 合规分析历史记录 Direction B、DOCX 报告下载及 Finding Chat 持久化 Direction C 均依赖此服务)
  postgres:
    image: postgres:15-alpine
    container_name: postgres
--- a/docs/superpowers/plans/2026-06-05-perception-intelligence.md
+++ b/docs/superpowers/plans/2026-06-05-perception-intelligence.md
--- a/docs/superpowers/plans/2026-06-05-phase1-production-foundation.md
+++ b/docs/superpowers/plans/2026-06-05-phase1-production-foundation.md
--- a/docs/superpowers/plans/2026-06-08-compliance-enhancement.md
+++ b/docs/superpowers/plans/2026-06-08-compliance-enhancement.md
--- a/docs/superpowers/plans/2026-06-08-i18n.md
+++ b/docs/superpowers/plans/2026-06-08-i18n.md
--- a/docs/superpowers/specs/2026-06-05-next-steps-roadmap-design.md
+++ b/docs/superpowers/specs/2026-06-05-next-steps-roadmap-design.md
@@ -0,0 +1,289 @@
+# AI+合规智能中枢 — 下一步开发与优化路线图（设计文档）
+
+- 日期：2026-06-05
+- 定位：试点 MVP 走向生产
+- 范围：全景清单 + 异步任务化（设计①）+ 法规感知闭环（设计②）深入方案 + 三阶段实施路线图
+- 作者：AI Regulations Team（brainstorming 产出）
+
+---
+
+## 0. 背景与目的
+
+本文档基于对当前仓库前后端真实代码的逐文件探查，结合四份愿景文档（`AI_Regulations_Report.pptx`、`AI_Regulations_Architecture.docx`、`01_Architecture.html`、`02_Architecture_Detail.html`）与最新开源 AI 技术调研，给出**下一步可继续开发与优化的方向清单**，并对两个最高价值方向给出可落地的深入设计。
+
+本文档是**方向性设计（spec）**，不是实施计划（plan）。阶段一、阶段二的具体落地由后续 writing-plans 环节拆分为分步计划。
+
+### 0.1 现状一句话
+
+后端是一套结构清晰的 DDD 风格 FastAPI RAG 系统（上传 → 解析 → 分块 → BGE-M3 嵌入 → Milvus → 混合检索 → 流式问答 + 合规分析），**真实可用**。但愿景文档中的多个旗舰能力（知识图谱、法规感知闭环、RBAC、EHS、异步化）目前为 **mock 或缺失**。
+
+---
+
+## 1. 现状盘点（基于真实代码）
+
+### 1.1 已实现且真实可用
+
+- **文档处理主链路**：`application/documents/services.py::DocumentCommandService.upload_and_process` — 存储 → 解析（阿里云 DocMind / 本地）→ 分块 → BGE-M3 嵌入 → Milvus 入库，含 `DocumentProcessingStore` 全程状态事件记录。
+- **混合检索**：`application/knowledge/services.py::KnowledgeRetrievalService` — Dense（`DenseRetriever`）+ BM25（jieba）+ Reciprocal Rank Fusion + 可选 Cross-Encoder 重排。
+- **流式 RAG 问答**：`application/agent/services.py::AgentConversationService.stream_chat` + `api/routes/rag.py` — 真实检索 + 引文 + 会话历史 + SSE。
+- **合规分析管线**：`application/compliance/pipeline.py` — clause_split → retrieve → gap_check → conclusion，真实 LLM + 真实检索，SSE 流式（`api/routes/compliance.py::analyze_stream`）。
+- **状态/健康面板**：`api/routes/status.py` + 前端 `StatusPage.tsx` — Milvus/MinIO/BM25/Reranker/会话实时状态。
+- **存储后端**：PostgreSQL / MinIO 适配器齐全；JSON 与 Postgres 双后端可切换。
+- **前端**：React 19 + Vite + Tailwind，6 个页面（Overview/Status/Perception/Docs/Compliance/RagChat）。
+
+### 1.2 愿景已规划但代码缺失或为 mock
+
+| 能力 | 愿景出处 | 代码现状 |
+|------|---------|---------|
+| 知识图谱 / Neo4j 多跳推理 | 架构图 L4/L5、Slide 5 | 全代码 0 处 neo4j/graph |
+| 法规感知自动更新闭环 | 01_Architecture.html L157-193、Slide 11 | `PerceptionService` 喂 `MockEventStore`（20 条死数据） |
+| 认证 / RBAC / 审计日志 | Slide 12 四角色权限矩阵 | 全代码 0 处 auth/jwt/rbac；`main.py` CORS=`*` |
+| 异步任务 / Worker 集群 | 架构图"Worker 集群"、Slide 9 | `app/workers/` 空目录；处理全同步 |
+| EHS 隐患识别（SIF/四维根因） | Slide 7 | 未实现 |
+| 多渠道推送（Email/Teams/飞书） | Slide 8 | 未实现 |
+| 闭环整改跟踪、可观测性 | 架构图右栏 | 缺失 |
+
+### 1.3 关键发现
+
+- **`requirements.txt:28` 已有 `celery>=5.3.0` + `redis>=4.5.0`**，`docker-compose.yml` 已配 Redis 7，`settings.py` 已有 redis 配置 —— **异步化是"接线"，不是"从零搭建"**。
+- **`DocumentProcessingStore` 已能记录 run 状态/状态事件** —— 是天然的任务进度表。
+- **`PerceptionService.analyze_event` 的 LLM 影响分析与 RAG 关联检索是真的** —— 感知闭环缺的只是前半段（采集 → Diff → 入库）。
+- 后端正处于 legacy 迁移期：`services/*`、`workflows/*` 为兼容层（见 `docs/architecture/backend-project-architecture.md`）。
+
+---
+
+## 2. 全景机会清单
+
+类型标记：`[新能力]`=愿景缺口补齐，`[加固]`=已实现能力优化。价值 ★（1-5），工作量 S/M/L。
+
+### P0 — 生产地基（阻断"走向生产"的硬伤）
+
+| # | 机会点 | 类型 | 现状证据 | 价值 | 工作量 |
+|---|--------|------|---------|------|--------|
+| 1 | 异步任务化（Celery + 已配 Redis）：解析/嵌入/感知/推送下沉 worker | 加固 | `workers/` 空；`documents.py:34` 上传同步阻塞 | ★★★★★ | L |
+| 2 | 认证 + RBAC + 审计日志，收紧 CORS | 新能力 | 0 处 auth；`main.py` CORS=`*`；Slide 12 | ★★★★★ | M |
+| 3 | 会话 & 任务持久化（内存 → Redis/PG） | 加固 | `bootstrap.py:254` 内存会话；`compliance.py:25` 内存字典 | ★★★★ | M |
+| 4 | 基础可观测性（Prometheus + 结构化日志 + 追踪） | 加固 | 仅 loguru；架构图右栏全缺 | ★★★ | M |
+
+### P1 — 高价值能力补齐 + RAG 质量
+
+| # | 机会点 | 类型 | 现状证据 | 价值 | 工作量 |
+|---|--------|------|---------|------|--------|
+| 5 | 启用并升级 Reranker（`bge-reranker-v2.5-gemma2-lightweight`） | 加固 | `settings.py:113` 默认关；管线已写好 | ★★★★ | S |
+| 6 | Agentic 检索（查询改写/意图理解/多路召回） | 加固 | `agent/services.py` 直接 retrieve，无 rewrite/HyDE | ★★★★ | M |
+| 7 | 知识图谱 / GraphRAG（Neo4j + LightRAG v1.5） | 新能力 | 0 处 neo4j；LightRAG v1.5 原生支持 | ★★★★★ | L |
+| 8 | 法规感知自动更新闭环（真实采集 + 版本 Diff + 增量重索引） | 新能力 | `perception/services.py` 用 MockEventStore | ★★★★★ | L |
+| 9 | 引文置信度评分（Slide 5 承诺"置信度评分+页码溯源"） | 加固 | `rag.py` sources 无 confidence | ★★★ | S |
+| 10 | 检索评估 harness（recall@k / faithfulness） | 加固 | `tests/` 需真实服务，无离线 RAG 评估 | ★★★ | M |
+
+### P2 — 视野扩展（独立子项目）
+
+| # | 机会点 | 类型 | 价值 | 工作量 |
+|---|--------|------|------|--------|
+| 11 | EHS 隐患识别（SIF 评分 + 四维根因 + ISO 45001 扫描，Slide 7） | 新能力 | ★★★★ | L |
+| 12 | 多渠道推送 + 订阅规则引擎（Email/Teams/飞书，Slide 8） | 新能力 | ★★★ | M |
+| 13 | 闭环整改跟踪（任务派发 → 进度 → 验收归档） | 新能力 | ★★★ | M |
+| 14 | 企业系统集成（PLM/ERP/OA/MES Webhook） | 新能力 | ★★ | L |
+| 15 | MinerU 3.1 升级（已转 Apache 协议，VLM 解析）作本地兜底 | 加固 | ★★ | S |
+| 16 | 前端加固（清 mock 数据、补 error/loading 态、KG 可视化、登录态） | 加固 | ★★★ | M |
+| 17 | 收口 legacy 迁移（`services/*`、`workflows/*` 按架构文档归位） | 加固 | ★★ | M |
+
+---
+
+## 3. 深入设计 ① — 异步任务化
+
+### 3.1 问题
+
+`upload_document`（`api/routes/documents.py:34`）在单个 HTTP 请求内同步跑完 存储 → 解析（阿里云云端可达 900 秒，`settings.py:49`）→ 嵌入 → Milvus 入库。大体量 GB 标准必然超时；`compliance.py` 的 `/analyze` 为假异步（立即返回 mock）；perception 爬取闭环无执行载体。PPT Slide 9 已将"大文件性能"列为关键挑战，对策正是"流式处理 + 异步队列 + 实时进度"。
+
+### 3.2 关键前提：基建已就位
+
+- `requirements.txt:28` 已含 `celery>=5.3.0` + `redis>=4.5.0`
+- `docker-compose.yml:46` Redis 7 已配置；`settings.py:64` 已有 redis 连接配置
+- `PostgresDocumentProcessingStore` 已记录 run 状态/状态事件 —— 天然任务进度表
+- `app/workers/` 为空目录（唯一缺口）
+
+### 3.3 架构（遵循 AGENTS.md 的 `api → application → domain ports → infrastructure`）
+
+```
+api/routes/documents.py  POST /upload
+        │ 1. 存二进制 + 建 Document 记录（快，同步）
+        │ 2. enqueue task → 立即返回 {doc_id, status:"queued", run_id}
+        ▼
+infrastructure/tasks/            ← 新增
+   celery_app.py                 broker=redis, backend=redis
+   document_tasks.py             @task process_document(doc_id) → DocumentCommandService
+        │ 复用现有 upload_and_process 的 parse→embed→index 段
+        ▼
+application/documents/services.py（拆分：store 与 process 解耦）
+        │ 每阶段写 DocumentProcessingStore（已存在）→ 进度可查
+        ▼
+api/routes/documents.py  GET /status/{doc_id}  ← 已存在，读 run 状态即可
+```
+
+### 3.4 落地步骤（增量、不破坏现有同步路径）
+
+1. 新增 `infrastructure/tasks/celery_app.py` — Celery 实例，broker/backend 指向已配 Redis。
+2. 拆分 `upload_and_process` → `store_document`（同步快）+ `process_document`（可异步），复用现有逻辑，零重写解析/嵌入代码。
+3. 新增 `document_tasks.py` — `@celery_app.task` 包裹 `process_document`，失败用 `tenacity`（已在 deps）重试 + 死信。
+4. 改 `documents.py` 上传 — 默认入队（保留 `?sync=true` 同步回退便于演示）；`GET /status/{doc_id}` 读 `DocumentProcessingStore` 返回阶段进度。
+5. 前端 `DocsPage.tsx` — 上传后轮询/SSE 进度条（架构图 Worker"心跳/状态上报"已是既定设计）。
+6. `dev.sh`/`dev.bat` 加 worker 启动：`celery -A app.infrastructure.tasks.celery_app worker`。
+
+### 3.5 工作量与风险
+
+- **M（中），3-5 天。**
+- 最大风险：Celery worker 进程内 `PYTHONPATH=backend` 与 bootstrap `lru_cache` 单例需重新初始化 —— 可控，因 bootstrap 已是懒加载。
+- YAGNI 边界：本期仅异步化"文档处理"一条链；compliance/perception 复用同一 Celery 基建后续接入。
+
+---
+
+## 4. 深入设计 ② — 法规感知自动更新闭环
+
+### 4.1 问题
+
+感知闭环是愿景旗舰能力（`01_Architecture.html` L157-193、Slide 11）。现状：`PerceptionService` 喂 `MockEventStore`（`mock_event_store.py:7`，20 条手写死数据），`list_events`/`stats` 全静态，`source_url` 真实但从不访问。**LLM 影响分析与 RAG 关联检索是真的** —— 闭环缺的是前半段：真实采集 → 变更感知（Diff）→ 入库。
+
+### 4.2 六步现状对照
+
+| 步骤 | 愿景设计 | 现状 | 本期目标 |
+|------|---------|------|---------|
+| ① 法规源监控 | 定时爬国标网/MIIT/UN-ECE/EUR-Lex | ❌ 无 | ✅ 适配器+定时 |
+| ② 智能变更感知 | NLP 比对新旧版本 Diff | ❌ 无 | ✅ 内容指纹+LLM Diff |
+| ③ 自动解析入库 | MinerU→分块→BGE-M3→Milvus | ✅ 已有（复用设计①管线） | ✅ 接线 |
+| ④ 知识图谱更新 | Neo4j 关系同步 | ❌ 无 | ⏭️ 本期不做（归 GraphRAG 专项） |
+| ⑤ 差距分析&推送 | AI 比对+按角色推送 | 🟡 analyze_event 已有分析，无推送 | 🟡 分析复用，推送下期 |
+| ⑥ 触发整改闭环 | 整改任务跟踪 | ❌ 无 | ⏭️ 下期 |
+
+本期聚焦 ①②③，复用设计①异步管线与已有解析/嵌入/检索/分析能力。
+
+### 4.3 架构（端口与适配器）
+
+```
+domain/perception/ports.py        ← 新增
+   RegulationSource (Protocol)    fetch_latest() → list[RawRegulation]
+   EventStore (Protocol)          抽象掉 MockEventStore（现有 mock 成为一个实现）
+   ChangeDetector (Protocol)      diff(old, new) → ChangeSet
+
+infrastructure/perception/
+   sources/                       ← 新增，每法规源一个适配器
+     gb_openstd_source.py         国标网 (openstd.samr.gov.cn)
+     miit_source.py               工信部
+     base_html_source.py          通用 HTML 抓取基类（httpx 已在 deps）
+   postgres_event_store.py        ← 替换 MockEventStore（真实持久化）
+   content_fingerprint_detector.py  哈希指纹 + LLM 语义 Diff
+
+application/perception/services.py（扩展现有）
+   ingest_cycle()                 ← 新增：①抓取 → ②Diff → ③入队解析（设计①的 task）
+   （list_events/analyze_event 保持不变，已是真实逻辑）
+
+infrastructure/tasks/perception_tasks.py  ← 复用设计①的 Celery
+   @task perception_crawl_cycle()  Celery Beat 定时触发
+```
+
+### 4.4 关键设计决策
+
+1. **接口契约零改动**：`PostgresEventStore` 输出与 `MockEventStore` 完全相同的 dict 结构（mock_event_store.py 的 20 字段），故 `perception.ts` 前端契约、`PerceptionPage.tsx`、`analyze_event` 全部不改。Mock 退化为种子数据/演示回退，通过 `perception_event_store=mock|postgres` 开关切换（对齐现有 `document_repository_backend` 模式）。
+2. **变更感知分两层**：廉价层（内容哈希指纹判断"是否变了"）+ 智能层（变了才调 LLM 做"新增/修订/废止条款"结构化 Diff，复用 `get_llm_client`，prompt 风格照搬 `compliance/pipeline.py::_extract_json`）。
+3. **合规防滥用**：尊重 `robots.txt` + 限速 + `tenacity` 重试 + 抓取失败不污染已有数据；适配器隔离，单源故障不影响其它。
+4. **入库复用设计①**：抓到新法规 PDF → 丢进 `process_document` task → 自动走完解析/嵌入/索引。
+
+### 4.5 落地步骤
+
+1. 抽 `domain/perception/ports.py`，让现有 `MockEventStore` 实现 `EventStore` 协议（纯重构，行为不变）。
+2. `PostgresEventStore` + 建表（参照 `aliyun_parser/schema.sql` 风格）+ 20 条 mock 作 seed。
+3. 先做 1 个真实源适配器（建议国标网，结构最稳）跑通 ①→②→③，验证端到端。
+4. `content_fingerprint_detector` + LLM Diff。
+5. `perception_crawl_cycle` Celery Beat 定时（每日）；新事件落 PostgresEventStore + 新法规入队解析。
+6. 前端 `PerceptionPage` 加"最近同步时间/本次新增 N 条"（stats 已有结构，加 2 字段）。
+
+### 4.6 工作量与风险
+
+- **L（大），5-8 天**，依赖设计①先落地（共用 Celery）。
+- 最大风险：外部源站不可控（改版/反爬）。缓解：适配器隔离 + mock 永久保留为回退 + 先攻 1 个源验证（对齐 Slide 13"选取 2-3 个场景 POC 验证"）。
+- YAGNI 边界：④Neo4j 图谱、⑥整改闭环、多渠道推送本期不做，各自独立子项目。
+
+---
+
+## 5. 三阶段实施路线图
+
+### 5.1 核心主线
+
+项目不缺"能力点"，缺的是**让能力点从同步脚本变成可运营的系统**。主线是**异步化基建**：既是文档处理性能解药（设计①），又是感知闭环执行载体（设计②），也是未来 EHS/推送的统一底座。路线图以它为"第 0 块地基"，其余能力挂载其上。
+
+### 5.2 与 PPT 三阶段映射（Slide 10）
+
+```
+PPT 规划                  代码现状          本路线图补齐
+─────────────────────────────────────────────────────
+一阶段 知识库+基础问答   ✅ 大体已实现     → 加固 (P0/P1)
+二阶段 文档审查+API集成  🟡 审查真/API半   → 异步化+感知闭环
+三阶段 EHS+个性化+图谱   ❌ 基本缺失       → 子项目 (P2)
+```
+
+### 5.3 阶段一 · 生产地基（2-3 周）— "让它扛得住生产"
+
+| 顺序 | 事项 | 依据 | 估时 |
+|------|------|------|------|
+| 1 | 设计① 异步任务化 | celery/redis 已在 deps，workers/ 空 | M, 3-5d |
+| 2 | 认证 + RBAC + 审计 + 收紧 CORS | 0 处 auth；Slide 12 矩阵 | M, 3-5d |
+| 3 | 会话/任务持久化（内存 → Redis/PG） | InMemoryConversationStore 重启即丢 | M, 2-3d |
+| 4 | 快赢：启用 Reranker | settings 默认关，管线已写好 | S, 0.5d |
+
+### 5.4 阶段二 · 招牌能力（2-3 周）— "让它有亮点"
+
+建议**感知闭环优先于图谱**（前者复用阶段一异步基建，ROI 更高）。
+
+| 顺序 | 事项 | 依据 | 估时 |
+|------|------|------|------|
+| 5 | 设计② 法规感知闭环 ①②③ | MockEventStore → 真实采集 | L, 5-8d |
+| 6 | Agentic 检索（查询改写/意图理解） | Slide 5"意图理解"，代码是直检索 | M, 3-4d |
+| 7 | 引文置信度评分 + 基础可观测性 | Slide 5 承诺；架构图右栏全缺 | S+M, 3-4d |
+
+### 5.5 阶段三 · 视野扩展（按需，各为独立子项目）— "让它成体系"
+
+每项单独 brainstorm → spec → 实施，本期不细化：
+
+- 知识图谱 / GraphRAG（Neo4j + LightRAG v1.5，接感知闭环第④步）
+- EHS 隐患识别（SIF + 四维根因，Slide 7）
+- 多渠道推送 + 订阅规则引擎（Slide 8）→ 闭环整改跟踪（第⑤⑥步）
+- 持续加固：MinerU 3.1 升级、前端清 mock、legacy 收口
+
+### 5.6 决策建议
+
+1. 强烈建议按阶段顺序：地基 → 招牌 → 扩展。跳过地基直接做招牌，会在生产暴露超时/无鉴权/数据丢失。
+2. 阶段一第 4 项（Reranker）可立即做 —— 半天见效，与其它解耦，适合先尝甜头。
+3. 阶段二二选一先行：要 demo 冲击力选"感知闭环"；要问答质量选"Agentic 检索"。
+
+---
+
+## 6. 最新 AI 技术调研（支撑选型）
+
+| 技术 | 版本/状态（2026） | 对应机会点 |
+|------|------------------|-----------|
+| LightRAG | v1.5.0（2026-06），EMNLP 2025；KG-RAG，原生支持 Neo4j + MinerU/Docling，含 Web UI 图谱可视化 | #7 知识图谱 |
+| MinerU | v3.1.0（2026-04），协议转为 Apache 2.0 基础的开源协议，VLM 解析（MinerU2.5-Pro），109 语言 OCR | #15 本地解析兜底 |
+| BGE Reranker | `bge-reranker-v2.5-gemma2-lightweight`（token 压缩 + 分层轻量化，生产推荐） | #5 Reranker 升级 |
+| BGE-M3 | 100+ 语言，8192 上下文，dense+sparse+colbert 统一（现已在用） | 现有嵌入 |
+| RAGFlow | 2026 支持 DeepSeek v4 / MCP / 跨语言查询；agentic RAG 参考实现 | #6 Agentic 检索参考 |
+
+---
+
+## 7. 验收与边界
+
+### 7.1 本文档明确不做（YAGNI）
+
+- 阶段三所有子项目（图谱、EHS、推送、整改闭环、企业集成）仅列方向，不在本期展开。
+- 移动端适配（AGENTS.md 明确 desktop-first）。
+- 感知闭环的第④⑤⑥步（图谱同步、推送、整改）。
+
+### 7.2 架构约束（必须遵守）
+
+- 后端遵循 `api → application → domain ports → infrastructure`（`docs/architecture/backend-project-architecture.md` 为权威）。
+- 新业务逻辑不得落入 `services/*`、`workflows/*`（legacy 迁移区）。
+- `shared/bootstrap.py` 为依赖装配 composition root，新依赖在此接线。
+- 后端注释/docstring 全英文（AGENTS.md 规范）。
+
+### 7.3 下一步
+
+经用户审阅本 spec 后，对**阶段一**（异步任务化优先）调用 writing-plans 拆分为分步实施计划。
--- a/docs/superpowers/specs/2026-06-05-perception-intelligence-design.md
+++ b/docs/superpowers/specs/2026-06-05-perception-intelligence-design.md
@@ -0,0 +1,328 @@
+# Regulatory Signals Intelligence Enhancement — Design Spec
+
+> **For agentic workers:** REQUIRED SUB-SKILL: Use superpowers:subagent-driven-development (recommended) or superpowers:executing-plans to implement this plan task-by-task. Steps use checkbox (`- [ ]`) syntax for tracking.
+
+**Goal:** Replace the 20-item hardcoded MockEventStore with real regulatory data from Chinese and international sources, add LLM-driven structured extraction, impact assessment, and semantic change diff — all accessible through a manual-trigger crawl in the frontend.
+
+**Architecture:** Crawler Service (httpx + BeautifulSoup) → PostgreSQL EventStore → LLM Pipeline (extract → assess → diff) → existing PerceptionService interface. New code follows `api → application → domain ports → infrastructure` layering; no new files in `services/*` or `workflows/*`; `shared/bootstrap.py` is the composition root.
+
+**Tech Stack:** httpx, BeautifulSoup4, sentence-transformers (for diff), existing LLM factory (deepseek/qwen), existing KnowledgeRetrievalService (RAG), PostgreSQL (already available), existing SSE infrastructure.
+
+---
+
+## 1. Data Sources
+
+| Source | URL | Method | Coverage |
+|--------|-----|--------|----------|
+| CATARC 汽车标准 | `https://www.catarc.org.cn/bzzxd/qcbz/index.html` | httpx + BeautifulSoup (static pages) | 国家/行业汽车标准列表 |
+| 国标委强制性标准 | `https://openstd.samr.gov.cn/bzgk/std/std_list_type?p.p1=1&p.p2=车&p.p90=circulation_date&p.p91=desc` | httpx + JSON API parse | 强制性国家标准，按"车"过滤 |
+| 国标委推荐性标准 | `https://openstd.samr.gov.cn/bzgk/std/std_list_type?p.p1=2&p.p2=车&p.p90=circulation_date&p.p91=desc` | httpx + JSON API parse | 推荐性国家标准，按"车"过滤 |
+| EUR-Lex | RSS + CELLAR REST API | pyeurlex / httpx | EU AI Act, automotive directives |
+| UN R155/R156 | CELLAR REST API (CELEX lookup) | httpx | UN-ECE cybersecurity/OTA regulations |
+
+Crawl is **manual-trigger only** — no cron/Celery Beat. Admin clicks "刷新数据源" in the frontend UI.
+
+---
+
+## 2. Database Schema
+
+### New table: `regulation_events`
+
+```sql
+CREATE TABLE IF NOT EXISTS regulation_events (
+    id              TEXT PRIMARY KEY,          -- sha256(source + standard_code)[:12]
+    source          TEXT NOT NULL,             -- 'CATARC' | '国标委' | 'EUR-Lex' | 'UN-ECE'
+    source_label    TEXT,                      -- Human-readable source label
+    standard_code   TEXT NOT NULL,             -- e.g. "GB 18384-2025", "EU/2024/1689"
+    title           TEXT NOT NULL,
+    summary         TEXT,                      -- Crawled abstract or first paragraph
+    full_text_url   TEXT,                      -- Original page URL
+    status          TEXT,                      -- 'enacted' | 'draft' | 'consultation'
+    impact_level    TEXT,                      -- 'high' | 'medium' | 'low' (LLM-assigned)
+    published_at    DATE,
+    effective_at    DATE,
+    category        TEXT,
+    tags            TEXT[],
+    -- LLM structured extraction
+    obligations     JSONB,       -- [{text, deontic, subject, object, condition}]
+    deadlines       JSONB,       -- [{date, description}]
+    scope           TEXT,        -- Applicability scope summary
+    penalties       TEXT,        -- Penalty / consequence summary
+    -- Change tracking
+    content_hash    TEXT,        -- SHA256 of crawled full text
+    previous_hash   TEXT,        -- Hash from prior crawl (NULL on first crawl)
+    change_summary  TEXT,        -- LLM-generated description of changes
+    changed_sections JSONB,      -- [{old_text, new_text, change_type}] where cosine<0.85
+    -- Impact assessment
+    affected_docs   JSONB,       -- [{doc_id, doc_name, score, key_clauses, recommendation}]
+    -- Metadata
+    crawled_at      TIMESTAMPTZ DEFAULT now(),
+    processed_at    TIMESTAMPTZ,
+    raw_storage_key TEXT         -- MinIO path for raw HTML/PDF (optional)
+);
+
+CREATE INDEX IF NOT EXISTS regulation_events_source_date
+    ON regulation_events (source, published_at DESC);
+CREATE INDEX IF NOT EXISTS regulation_events_impact_date
+    ON regulation_events (impact_level, published_at DESC);
+CREATE INDEX IF NOT EXISTS regulation_events_tags
+    ON regulation_events USING gin(tags);
+```
+
+---
+
+## 3. Backend Architecture
+
+### 3.1 File Map
+
+**New files (infrastructure layer):**
+- `backend/app/infrastructure/perception/crawlers/catarc_crawler.py` — CATARC scraper
+- `backend/app/infrastructure/perception/crawlers/guobiao_crawler.py` — 国标委 JSON API crawler
+- `backend/app/infrastructure/perception/crawlers/eurlex_crawler.py` — EUR-Lex RSS + CELLAR
+- `backend/app/infrastructure/perception/crawlers/base.py` — Abstract base class
+- `backend/app/infrastructure/perception/postgres_event_store.py` — PostgresEventStore (replaces MockEventStore)
+- `backend/app/infrastructure/perception/llm_pipeline.py` — Extract / assess / diff pipeline
+
+**New files (application layer):**
+- `backend/app/application/perception/crawl_service.py` — Orchestrates crawlers + LLM pipeline, exposes `run_crawl(sources)` + progress generator
+
+**Modified files:**
+- `backend/app/api/routes/perception.py` — Add `POST /crawl`, `GET /crawl/status` (SSE), `POST /events/{id}/process`, `GET /events/{id}/diff`
+- `backend/app/shared/bootstrap.py` — Wire `PostgresEventStore` + `CrawlService` + `LlmPipeline` when `DOCUMENT_REPOSITORY_BACKEND=postgres`; fallback to `MockEventStore` when `json`
+- `backend/app/config/settings.py` — Add `perception_crawl_timeout_seconds`, `perception_max_events_per_source`
+
+**Unchanged files:**
+- `backend/app/application/perception/services.py` — `PerceptionService` interface unchanged; only `_store` swap
+- `backend/app/infrastructure/perception/mock_event_store.py` — Kept for `json` backend mode
+
+### 3.2 Domain Port (Abstract Interface)
+
+```python
+# backend/app/infrastructure/perception/base_event_store.py
+from abc import ABC, abstractmethod
+
+class BaseEventStore(ABC):
+    @abstractmethod
+    def all(self) -> list[dict]: ...
+    @abstractmethod
+    def get(self, event_id: str) -> dict | None: ...
+    @abstractmethod
+    def filter(self, source=None, impact_level=None, limit=50) -> list[dict]: ...
+    @abstractmethod
+    def stats(self) -> dict: ...
+    @abstractmethod
+    def upsert(self, event: dict) -> None: ...      # new — needed for crawl writes
+    @abstractmethod
+    def get_by_standard_code(self, code: str) -> dict | None: ...  # for change detection
+```
+
+`MockEventStore` and `PostgresEventStore` both implement this interface.
+
+### 3.3 Crawler Base Contract
+
+```python
+# backend/app/infrastructure/perception/crawlers/base.py
+from abc import ABC, abstractmethod
+from dataclasses import dataclass
+
+@dataclass
+class RawEvent:
+    source: str
+    source_label: str
+    standard_code: str
+    title: str
+    summary: str
+    full_text_url: str
+    status: str           # 'enacted' | 'draft' | 'consultation'
+    published_at: str     # YYYY-MM-DD string
+    effective_at: str | None
+    category: str
+    tags: list[str]
+    raw_text: str         # full crawled text for hashing + LLM
+
+class BaseCrawler(ABC):
+    @abstractmethod
+    def fetch(self, limit: int = 50) -> list[RawEvent]: ...
+```
+
+### 3.4 LLM Pipeline
+
+```python
+# backend/app/infrastructure/perception/llm_pipeline.py
+
+class LlmPipeline:
+    """Runs three sequential LLM steps on a regulation event."""
+
+    def extract_structure(self, event: dict) -> dict:
+        """Step 1: Extract obligations, deadlines, scope, penalties, impact_level.
+        
+        Returns dict with keys: obligations, deadlines, scope, penalties, impact_level.
+        Uses JSON-mode or structured prompt; model retries once on parse failure.
+        """
+
+    def assess_impact(self, event: dict, retrieval_service) -> list[dict]:
+        """Step 2: RAG-based impact on existing knowledge base documents.
+        
+        Query = standard_code + title + first obligation texts.
+        Returns list of {doc_id, doc_name, score, key_clauses, recommendation}.
+        """
+
+    def compute_diff(self, old_text: str, new_text: str) -> dict:
+        """Step 3: Semantic diff between old and new regulation text.
+        
+        Splits both texts by paragraph. Calls existing EmbeddingService (text-embedding-v3
+        via EMBEDDING_BASE_URL) to embed each paragraph, then computes cosine similarity.
+        Changed paragraphs (cosine < 0.85) sent to LLM for change_type classification:
+          'tightened' | 'relaxed' | 'added' | 'removed'
+        Returns {changed_sections: [...], change_summary: str}.
+        Only called when content_hash differs from previous_hash.
+        """
+```
+
+### 3.5 CrawlService
+
+```python
+# backend/app/application/perception/crawl_service.py
+
+class CrawlService:
+    def __init__(self, crawlers, event_store, llm_pipeline, retrieval_service): ...
+
+    def run_crawl(self, sources: list[str] | None = None) -> Generator[dict, None, None]:
+        """Manual-trigger crawl. Yields progress SSE dicts:
+          {event: 'progress', data: {source, fetched, new, updated, stage}}
+          {event: 'done', data: {total_new, total_updated, duration_ms}}
+          {event: 'error', data: {source, message}}
+        
+        For each crawler:
+          1. fetch() RawEvents
+          2. hash check vs stored event → skip if unchanged
+          3. upsert raw event to DB
+          4. run LLM pipeline (extract → assess → diff)
+          5. upsert enriched event to DB
+          6. yield progress
+        """
+```
+
+---
+
+## 4. API Endpoints
+
+### Existing (unchanged interface, new store backend)
+- `GET /api/v1/perception/stats`
+- `GET /api/v1/perception/events`
+- `GET /api/v1/perception/events/{id}`
+- `POST /api/v1/perception/events/{id}/analyze` (streaming)
+
+### New endpoints
+
+```
+POST /api/v1/perception/crawl
+  Body: { sources?: ["CATARC", "国标委", "EUR-Lex", "UN-ECE"] }
+  Response: text/event-stream (SSE)
+  Auth: requires current_user (admin/legal role)
+  Streams progress events until done or error.
+
+POST /api/v1/perception/events/{id}/process
+  Trigger LLM pipeline for a single already-crawled event.
+  Response: { status: "ok", processed_at: "..." }
+  Auth: requires current_user
+
+GET /api/v1/perception/events/{id}/diff
+  Returns: { changed_sections: [...], change_summary: str, previous_hash: str }
+  Returns 404 if no diff available (first crawl or no change detected).
+```
+
+---
+
+## 5. Frontend Changes
+
+### 5.1 New: Crawl Control Bar (top of PerceptionPage)
+
+Above the stats-bar, add a `<CrawlBar>` component:
+- "刷新数据源" button — triggers `POST /crawl` (all sources)
+- Inline progress display: shows SSE progress events as a mini status line
+  - e.g. "CATARC: 抓取中… | 国标委: 12 条新增 | EUR-Lex: 等待中"
+- On completion: shows "更新完成 — 新增 N 条，更新 M 条"
+- Disabled while crawl is in progress (prevents double-trigger)
+
+### 5.2 Signal Card Enhancement
+
+Existing cards get two new indicators:
+- **NEW badge** — shown when `crawled_at` is within last 24h (green dot)
+- **CHANGED badge** — shown when `previous_hash != content_hash` and `change_summary` exists
+
+### 5.3 Right Panel — Structured Tab
+
+Right detail panel adds a tab bar: **概览 | 义务条款 | 影响评估 | 变更对比**
+
+**义务条款 tab:**
+- Table: 义务描述 | 主体 | 对象 | 截止日期
+- Tags for deontic type: 强制 / 禁止 / 允许
+- Shows `obligations[]` + `deadlines[]` from DB
+
+**影响评估 tab:**
+- Replaces hardcoded MOCK_DOCS with real `affected_docs[]` from DB
+- Each row: document name, similarity score (%), key clause excerpt, LLM recommendation
+- "Run fresh assessment" button → triggers `POST /events/{id}/process`
+
+**变更对比 tab:**
+- Only visible when `change_summary` is non-null
+- Top: `change_summary` text (LLM prose)
+- Below: diff table with old/new paragraph pairs, change_type badge per row
+- Hidden (tab disabled) on first-crawl events with no prior version
+
+### 5.4 Existing behavior preserved
+- `analyze` streaming (AI analysis) unchanged
+- Search/filter (source, impact) unchanged — now hits real DB data
+- Stats bar — now reflects real counts from PostgreSQL
+
+---
+
+## 6. Settings Additions
+
+```python
+# backend/app/config/settings.py additions
+perception_crawl_timeout_seconds: int = Field(default=120, ...)
+perception_max_events_per_source: int = Field(default=100, ...)
+perception_diff_similarity_threshold: float = Field(default=0.85, ...)
+```
+
+```env
+# .env additions
+PERCEPTION_CRAWL_TIMEOUT_SECONDS=120
+PERCEPTION_MAX_EVENTS_PER_SOURCE=100
+PERCEPTION_DIFF_SIMILARITY_THRESHOLD=0.85
+```
+
+---
+
+## 7. Dependencies
+
+```
+# requirements.txt additions
+httpx>=0.27.0              # already likely present; confirm
+beautifulsoup4>=4.12.0     # HTML parsing for CATARC
+lxml>=5.0.0                # BeautifulSoup parser backend
+# sentence-transformers NOT added — diff uses existing text-embedding-v3 API (EMBEDDING_BASE_URL)
+```
+
+No new infrastructure required (PostgreSQL + MinIO + Milvus already available).
+
+---
+
+## 8. Backward Compatibility
+
+- `DOCUMENT_REPOSITORY_BACKEND=json` → `bootstrap.py` uses `MockEventStore` (unchanged behavior)
+- `DOCUMENT_REPOSITORY_BACKEND=postgres` → uses `PostgresEventStore`
+- Migration: run `CREATE TABLE` SQL on first startup (idempotent `CREATE TABLE IF NOT EXISTS`)
+- Existing 20 mock events are not seeded to PostgreSQL; PostgreSQL starts empty until first crawl
+
+---
+
+## 9. Out of Scope (this phase)
+
+- Automatic/scheduled crawling (Celery Beat) — manual trigger only
+- Playwright-based JS-rendered pages — all target sites work with httpx
+- Knowledge Graph (Neo4j / LightRAG) — future phase
+- Email/Slack webhook notifications — future phase
+- User-facing diff history (versioning beyond one prior snapshot) — future phase
--- a/docs/superpowers/specs/2026-06-08-compliance-enhancement-design.md
+++ b/docs/superpowers/specs/2026-06-08-compliance-enhancement-design.md
@@ -0,0 +1,459 @@
+# Compliance Analysis Enhancement Design
+
+**Date:** 2026-06-08
+**Directions:** A (Analysis Quality) + B (History & Reports) + C (Deep Chat)
+**Approach:** Three independent but coordinated feature sets sharing one DB schema (method one / structured tables).
+
+---
+
+## Goals
+
+1. **A — Analysis Quality:** Parallel clause processing (3-5× speed), fix `highlight_terms` bug (always returns empty), add LLM retry with tenacity, reserve `PassThroughReranker` for future cross-encoder work.
+2. **B — Analysis History & Reports:** Auto-save every completed analysis to PostgreSQL, history rail in UI, per-record DOCX export, delete with confirmation.
+3. **C — Deep Chat:** Per-finding persistent chat threads grounded in real retrieved text, LLM-generated suggestion questions, multi-turn memory.
+
+---
+
+## Architecture Overview
+
+### Layering Rules (must not be violated)
+
+```
+api/routes/         →  thin HTTP handlers, SSE generators only
+application/        →  orchestration logic (pipeline.py)
+domain/ports/       →  ABCs, no implementation
+infrastructure/     →  DB, docx, external calls
+shared/bootstrap.py →  composition root, wires everything
+```
+
+New business logic goes in `application/compliance/pipeline.py` and domain ports. Never in `services/*` or `workflows/*`.
+
+### Shared Database Schema (B + C)
+
+Three tables, created together so C's FK references are valid from day one:
+
+```sql
+CREATE TABLE compliance_analyses (
+    id              UUID PRIMARY KEY DEFAULT gen_random_uuid(),
+    created_at      TIMESTAMPTZ NOT NULL DEFAULT now(),
+    created_by      VARCHAR(255),
+    doc_name        VARCHAR(500),
+    standard_name   VARCHAR(500),
+    risk_score      INTEGER,
+    conclusion      TEXT,
+    actions         JSONB,
+    para_text       TEXT,
+    highlight_terms JSONB
+);
+
+CREATE TABLE compliance_findings (
+    id          UUID PRIMARY KEY DEFAULT gen_random_uuid(),
+    analysis_id UUID NOT NULL REFERENCES compliance_analyses(id) ON DELETE CASCADE,
+    seq         INTEGER NOT NULL,
+    title       VARCHAR(500),
+    description TEXT,
+    status      VARCHAR(50),
+    clause_ref  VARCHAR(200)
+);
+
+CREATE TABLE finding_chat_messages (
+    id          UUID PRIMARY KEY DEFAULT gen_random_uuid(),
+    analysis_id UUID NOT NULL REFERENCES compliance_analyses(id) ON DELETE CASCADE,
+    finding_id  UUID NOT NULL REFERENCES compliance_findings(id) ON DELETE CASCADE,
+    role        VARCHAR(20) NOT NULL,  -- 'user' | 'assistant'
+    content     TEXT NOT NULL,
+    created_at  TIMESTAMPTZ NOT NULL DEFAULT now()
+);
+```
+
+---
+
+## Direction A — Analysis Quality
+
+### A1: Parallel Clause Processing
+
+**Current:** Route handler has a sequential `for i, clause in enumerate(clauses)` loop. Each iteration calls `retrieve_for_clause()` then `check_clause_compliance()` synchronously via `asyncio.to_thread`.
+
+**Change:** Extract a `process_single_clause(clause, idx, ...) -> dict` function in `pipeline.py`, then replace the loop with `asyncio.gather`:
+
+```python
+async def run_clauses_parallel(clauses, retrieval_svc, llm_client, standard_name, para_text):
+    tasks = [
+        asyncio.to_thread(process_single_clause, clause, i, retrieval_svc, llm_client, standard_name, para_text)
+        for i, clause in enumerate(clauses)
+    ]
+    return await asyncio.gather(*tasks, return_exceptions=True)
+```
+
+Results are yielded to the SSE stream in original order. Exceptions from individual clauses are caught and emitted as `{type: "error", clause_index: i}` events rather than crashing the whole stream.
+
+### A2: Fix highlight_terms
+
+**Root cause:** `synthesize_conclusion()` passes the LLM response through `json.loads()` but the LLM often wraps output in markdown fences (` ```json ... ``` `), causing a parse failure and silent fallback to `[]`.
+
+**Fix in `pipeline.py`:**
+
+```python
+import re
+
+def _extract_json(text: str) -> dict:
+    """Strip markdown fences then parse JSON. Raises ValueError on failure."""
+    cleaned = re.sub(r"^```(?:json)?\s*|\s*```$", "", text.strip(), flags=re.MULTILINE)
+    return json.loads(cleaned)
+```
+
+Apply `_extract_json` in `synthesize_conclusion()` instead of bare `json.loads`. Wrap with `@retry` (see A3) so transient parse failures get a second attempt.
+
+### A3: LLM Retry with tenacity
+
+`tenacity` is already in `requirements.txt` but unused. Add to all LLM calls in `pipeline.py`:
+
+```python
+from tenacity import retry, stop_after_attempt, wait_exponential, retry_if_exception_type
+
+@retry(
+    stop=stop_after_attempt(3),
+    wait=wait_exponential(multiplier=1, min=1, max=4),
+    retry=retry_if_exception_type((httpx.HTTPError, ValueError)),
+    reraise=True,
+)
+def _call_llm_with_retry(client, prompt: str) -> str:
+    """Call LLM and return raw text. Retries on HTTP errors and JSON parse failures."""
+    ...
+```
+
+On final failure, the calling function catches and emits `{type: "error", text: "LLM call failed after 3 attempts"}` to the SSE stream.
+
+### A4: PassThroughReranker (future-ready stub)
+
+`domain/retrieval/ports.py` already defines a `Reranker` ABC. Add the no-op implementation:
+
+**New file:** `backend/app/infrastructure/retrieval/reranker.py`
+
+```python
+from app.domain.retrieval.ports import Reranker, RetrievedChunk
+
+class PassThroughReranker(Reranker):
+    """No-op reranker. Replace with CrossEncoderReranker when a local model is available."""
+
+    def rerank(self, query: str, chunks: list[RetrievedChunk], top_k: int) -> list[RetrievedChunk]:
+        return chunks[:top_k]
+```
+
+Register in `shared/bootstrap.py` as the default `Reranker` implementation.
+
+### A — Files Changed
+
+| File | Action |
+|------|--------|
+| `backend/app/application/compliance/pipeline.py` | Add `process_single_clause`, `run_clauses_parallel`, `_extract_json`, `_call_llm_with_retry` |
+| `backend/app/api/routes/compliance.py` | Replace sequential loop with `await run_clauses_parallel(...)` |
+| `backend/app/infrastructure/retrieval/reranker.py` | New — `PassThroughReranker` |
+| `backend/app/shared/bootstrap.py` | Register `PassThroughReranker` |
+
+---
+
+## Direction B — History & Reports
+
+### B1: Domain Port
+
+**New file:** `backend/app/domain/compliance/ports.py`
+
+```python
+from abc import ABC, abstractmethod
+from dataclasses import dataclass, field
+from datetime import datetime
+from typing import Optional
+
+@dataclass
+class FindingRecord:
+    id: str
+    analysis_id: str
+    seq: int
+    title: str
+    description: str
+    status: str
+    clause_ref: Optional[str] = None
+
+@dataclass
+class AnalysisRecord:
+    id: str
+    created_at: datetime
+    created_by: Optional[str]
+    doc_name: str
+    standard_name: str
+    risk_score: int
+    conclusion: str
+    actions: list
+    para_text: str
+    highlight_terms: list
+    findings: list[FindingRecord] = field(default_factory=list)
+
+class ComplianceRepository(ABC):
+    @abstractmethod
+    def save_analysis(self, record: AnalysisRecord) -> str: ...
+    @abstractmethod
+    def list_analyses(self, limit: int = 50, offset: int = 0) -> list[AnalysisRecord]: ...
+    @abstractmethod
+    def get_analysis(self, analysis_id: str) -> Optional[AnalysisRecord]: ...
+    @abstractmethod
+    def delete_analysis(self, analysis_id: str) -> None: ...
+    @abstractmethod
+    def save_message(self, analysis_id: str, finding_id: str, role: str, content: str) -> str: ...
+    @abstractmethod
+    def get_messages(self, finding_id: str) -> list[dict]: ...
+```
+
+### B2: PostgresComplianceRepository
+
+**New file:** `backend/app/infrastructure/compliance/repository.py`
+
+Implements `ComplianceRepository` using `psycopg2` (already in requirements). Connection string from `settings.DATABASE_URL`. Key methods:
+
+- `save_analysis`: INSERT into `compliance_analyses`, then bulk INSERT findings into `compliance_findings`, return `analysis_id` (UUID string).
+- `list_analyses`: SELECT with JOIN on findings count, ORDER BY `created_at DESC`, supports limit/offset.
+- `get_analysis`: SELECT analysis + all findings by `analysis_id`.
+- `delete_analysis`: DELETE cascades to findings and chat messages via FK.
+- `save_message` / `get_messages`: INSERT/SELECT on `finding_chat_messages`.
+
+Uses a connection pool (simple `psycopg2.pool.ThreadedConnectionPool`, min=1, max=5).
+
+### B3: Auto-save Hook
+
+In the SSE generator in `compliance.py`, after the `done` event is assembled:
+
+```python
+# After yielding the done event
+if repo is not None:
+    record = AnalysisRecord(
+        id="",  # will be assigned by DB
+        created_at=datetime.utcnow(),
+        created_by=current_user,
+        doc_name=doc_name,
+        standard_name=standard_name,
+        risk_score=done_payload["risk_score"],
+        conclusion=done_payload["conclusion"],
+        actions=done_payload["actions"],
+        para_text=done_payload["para_text"],
+        highlight_terms=done_payload["highlight_terms"],
+        findings=[FindingRecord(...) for f in accumulated_findings],
+    )
+    analysis_id = await asyncio.to_thread(repo.save_analysis, record)
+    # Emit an extra SSE event so frontend receives the analysis_id
+    yield f"data: {json.dumps({'type': 'saved', 'analysis_id': analysis_id})}\n\n"
+```
+
+### B4: New API Endpoints
+
+Added to `backend/app/api/routes/compliance.py`:
+
+```
+GET    /api/v1/compliance/history
+       Query params: limit=20&offset=0
+       Response: [{id, created_at, doc_name, standard_name, risk_score, finding_count}]
+
+GET    /api/v1/compliance/history/{analysis_id}
+       Response: full AnalysisRecord including findings list
+
+DELETE /api/v1/compliance/history/{analysis_id}
+       Response: 204 No Content
+
+GET    /api/v1/compliance/history/{analysis_id}/download
+       Response: DOCX file (application/vnd.openxmlformats-officedocument.wordprocessingml.document)
+```
+
+### B5: DOCX Export
+
+**New file:** `backend/app/infrastructure/compliance/docx_export.py`
+
+Uses `python-docx` (already in requirements). Generates a structured report:
+
+- Cover: document name, standard, date, risk score badge
+- Executive summary: conclusion paragraph
+- Findings table: seq / title / status / clause_ref / description
+- Action items: numbered list
+- Footer: generated by AI Regulation Analysis System
+
+```python
+def generate_docx(record: AnalysisRecord) -> bytes:
+    """Generate a DOCX compliance report and return as bytes."""
+    doc = Document()
+    # ... build document ...
+    buf = BytesIO()
+    doc.save(buf)
+    return buf.getvalue()
+```
+
+### B6: Frontend — History Rail
+
+`CompliancePage.tsx` gains a left rail (same layout pattern as RagChat's `history-pane`):
+
+```
+┌──────────────┬─────────────────────────────────┐
+│ History      │  Main Analysis Area              │
+│ ──────────   │                                  │
+│ 2026-06-08   │  (current analysis or loaded     │
+│ doc.pdf      │   read-only historical record)   │
+│ ⚠ 72  [↓][×]│                                  │
+│ ──────────   │                                  │
+│ 2026-06-07   │                                  │
+│ csms.pdf     │                                  │
+│ ✓ 15  [↓][×]│                                  │
+└──────────────┴─────────────────────────────────┘
+```
+
+- `[↓]` triggers `GET /history/{id}/download` and saves the DOCX file
+- `[×]` shows a confirmation dialog, then calls `DELETE /history/{id}`
+- Clicking a row loads that analysis into the main area in read-only mode
+- `PageStateContext.ComplianceState` gains `analysisId: string | null` and `isReadOnly: boolean`
+
+On mount, the rail calls `GET /history?limit=20` to populate the list. The list re-fetches after delete or after a new analysis completes (triggered by the `saved` SSE event).
+
+### B — Files Changed
+
+| File | Action |
+|------|--------|
+| `backend/app/domain/compliance/ports.py` | New — `ComplianceRepository` ABC + data classes |
+| `backend/app/infrastructure/compliance/repository.py` | New — `PostgresComplianceRepository` |
+| `backend/app/infrastructure/compliance/docx_export.py` | New — `generate_docx()` |
+| `backend/app/api/routes/compliance.py` | Add history endpoints + auto-save hook |
+| `backend/app/shared/bootstrap.py` | Register `PostgresComplianceRepository` |
+| `frontend/src/pages/Compliance/CompliancePage.tsx` | Add History Rail |
+| `frontend/src/contexts/PageStateContext.tsx` | Add `analysisId`, `isReadOnly` to `ComplianceState` |
+
+---
+
+## Direction C — Deep Chat
+
+### C1: New Chat Endpoints
+
+Replace the existing `/compliance/chat/{segment_id}` (kept for backward compatibility but deprecated) with finding-scoped endpoints:
+
+```
+POST /api/v1/compliance/analyses/{analysis_id}/findings/{finding_id}/chat
+     Body: {query: string}
+     Response: SSE stream — chunk / done / error events
+
+GET  /api/v1/compliance/analyses/{analysis_id}/findings/{finding_id}/chat
+     Response: [{id, role, content, created_at}]
+
+POST /api/v1/compliance/analyses/{analysis_id}/findings/{finding_id}/suggestions
+     Response: {questions: [string, string, string]}
+```
+
+### C2: Grounded Context Construction
+
+New function in `pipeline.py`:
+
+```python
+def build_finding_context(finding: FindingRecord, analysis: AnalysisRecord) -> str:
+    """
+    Build a grounded system context string for a finding chat thread.
+    Combines finding details with analysis metadata for LLM grounding.
+    """
+    return (
+        f"Document: {analysis.doc_name}\n"
+        f"Standard: {analysis.standard_name}\n"
+        f"Finding [{finding.seq}]: {finding.title}\n"
+        f"Status: {finding.status}\n"
+        f"Clause reference: {finding.clause_ref or 'N/A'}\n"
+        f"Description: {finding.description}\n"
+        f"Overall conclusion: {analysis.conclusion}\n"
+    )
+```
+
+This string is prepended to the system prompt for every chat call — replacing the fragile `segment_context` approach.
+
+### C3: Multi-turn Context
+
+Chat handler fetches existing messages from `finding_chat_messages` via `repo.get_messages(finding_id)` and prepends them to the LLM call as `[{"role": "user"/"assistant", "content": "..."}]` message history. Max history: 10 most recent messages (5 turns) to avoid token overflow.
+
+After each LLM response, both the user message and assistant message are saved via `repo.save_message()`.
+
+### C4: Suggestion Generation
+
+New function in `pipeline.py`:
+
+```python
+SUGGESTION_PROMPTS = {
+    "non_compliant": "Generate 3 questions focused on remediation steps and timeline.",
+    "partial": "Generate 3 questions focused on identifying the compliance gap.",
+    "compliant": "Generate 3 questions focused on maintaining and evidencing compliance.",
+}
+
+def generate_suggestions(finding: FindingRecord, analysis: AnalysisRecord, llm_client) -> list[str]:
+    """
+    Generate 3 context-aware follow-up questions for a finding chat thread.
+    Returns a list of 3 question strings. Falls back to generic questions on error.
+    """
+    focus = SUGGESTION_PROMPTS.get(finding.status, SUGGESTION_PROMPTS["partial"])
+    context = build_finding_context(finding, analysis)
+    prompt = f"{context}\n\n{focus}\nReturn JSON: {{\"questions\": [\"...\", \"...\", \"...\"]}}"
+    # ... call LLM, parse JSON, return list ...
+    # Fallback on error:
+    return ["What are the specific requirements?", "What is the remediation timeline?", "Which regulation clause applies?"]
+```
+
+### C5: Frontend — Finding Chat Drawer
+
+New component: `frontend/src/pages/Compliance/FindingChatDrawer.tsx`
+
+Drawer slides in from the right (CSS: `position: fixed; right: 0; width: 420px`), reusing existing CSS variables (`--surface`, `--border`, `--accent`).
+
+Structure:
+- Header: finding title + close button
+- Suggestions section: 3 chip buttons (only shown before first user message; hidden after)
+- Message list: scrollable, same bubble style as RagChat
+- Composer: textarea + send button, same pattern as RagChat composer
+
+State managed in `PageStateContext.ComplianceState`:
+- `activeFindingId: string | null` — which finding's drawer is open
+- Drawer open/close controlled by `activeFindingId !== null`
+
+On open:
+1. `GET /analyses/{id}/findings/{fid}/chat` → restore history
+2. If history is empty: `POST /findings/{fid}/suggestions` → show chips
+
+Each finding card in `CompliancePage.tsx` gains a `💬 Chat` button that sets `activeFindingId`.
+
+### C — Files Changed
+
+| File | Action |
+|------|--------|
+| `backend/app/api/routes/compliance.py` | Add 3 new finding-chat endpoints |
+| `backend/app/application/compliance/pipeline.py` | Add `build_finding_context`, `generate_suggestions` |
+| `backend/app/infrastructure/compliance/repository.py` | Add `save_message`, `get_messages` (already in port) |
+| `frontend/src/pages/Compliance/FindingChatDrawer.tsx` | New component |
+| `frontend/src/pages/Compliance/CompliancePage.tsx` | Add Chat button to finding cards, render drawer |
+| `frontend/src/contexts/PageStateContext.tsx` | Add `activeFindingId` to `ComplianceState` |
+
+---
+
+## Implementation Order
+
+Direction A must be completed first (parallel processing changes the route handler that B's auto-save hook attaches to). B must be completed before C (C's FK references require B's tables and repository).
+
+```
+A (parallel + bug fixes + reranker stub)
+  └→ B (schema migration + history + DOCX)
+       └→ C (finding chat + suggestions)
+```
+
+---
+
+## Non-Goals
+
+- PDF export (DOCX only; users convert via Word/WPS)
+- Cross-encoder reranking (stub reserved, not implemented)
+- Scheduled/automatic crawling
+- User-level history isolation (all users share history — global visibility)
+- Prompt version management or A/B testing
+
+---
+
+## Constraints
+
+- Backend comments and docstrings: English only
+- No new top-level libraries beyond those already in `requirements.txt` (`tenacity`, `python-docx`, `psycopg2-binary` are all present)
+- `DOCUMENT_REPOSITORY_BACKEND=postgres` → `PostgresComplianceRepository`; any other value → raise `NotImplementedError` with a clear message (no mock fallback for compliance history)
+- Git commits are made by the user, never automated
--- a/docs/superpowers/specs/2026-06-08-i18n-design.md
+++ b/docs/superpowers/specs/2026-06-08-i18n-design.md
@@ -0,0 +1,421 @@
+# Internationalisation (i18n) Design — Frontend Chinese/English Toggle
+
+**Date:** 2026-06-08
+**Scope:** UI framework strings only (nav labels, button labels, status messages, placeholders). Mock data, API-returned content, and domain regulation text are explicitly excluded.
+
+---
+
+## Goals
+
+Add a language toggle button (EN ↔ 中) in the Sidebar footer, immediately left of the existing theme-toggle button, so users can switch the UI between English and Simplified Chinese. Default language is English on every page load; preference is not persisted across sessions.
+
+---
+
+## Architecture
+
+### Approach
+
+Custom `LanguageContext` following the same pattern as the existing `ThemeContext`. No external library dependencies. Translation strings live in two TypeScript modules (`locales/en.ts` and `locales/zh.ts`) that export identical-shape objects.
+
+### Layering
+
+```
+src/
+├── contexts/
+│   └── LanguageContext.tsx    # type Lang, LanguageProvider, useLanguage()
+└── locales/
+    ├── en.ts                  # English translations (default)
+    └── zh.ts                  # Simplified Chinese translations
+```
+
+`LanguageProvider` wraps the entire app in `App.tsx` — outermost provider so every component can consume it.
+
+### Context interface
+
+```ts
+type Lang = 'en' | 'zh';
+
+interface LanguageContextValue {
+  lang: Lang;
+  t: Translations;       // typed translation object
+  toggleLang: () => void;
+}
+```
+
+`useState<Lang>('en')` — hardcoded default, no localStorage read on mount.
+
+### Translation object shape (both files export `Translations`)
+
+```ts
+export interface Translations {
+  nav: {
+    groupMain: string;
+    groupWorkbench: string;
+    groupChat: string;
+    overview: string;
+    signals: string;
+    status: string;
+    documents: string;
+    compliance: string;
+    chat: string;
+  };
+  sidebar: {
+    toggleTheme: string;
+    toggleLang: string;
+    signOut: string;
+  };
+  overview: {
+    eyebrow: string;
+    heroTitle: string;
+    heroDesc: string;
+    openDashboard: string;
+    jumpToChat: string;
+    sectionHowItWorks: string;
+    sectionScreens: string;
+    stepUpload: string; stepUploadDesc: string;
+    stepProcess: string; stepProcessDesc: string;
+    stepMonitor: string; stepMonitorDesc: string;
+    stepAnalyze: string; stepAnalyzeDesc: string;
+    stepReview: string; stepReviewDesc: string;
+    stepChat: string; stepChatDesc: string;
+    statScreens: string;
+    statFlows: string;
+    statReviewPosture: string;
+    navLiveHealth: string;
+    navRegulatoryChanges: string;
+    navUploadDocs: string;
+    navComplianceWorkspace: string;
+    navChatCited: string;
+    navKPIs: string;
+  };
+  signals: {
+    topbarTitle: string;
+    topbarSub: string;
+    searchPlaceholder: string;
+    refreshBtn: string;
+    crawlingBtn: string;
+    statTotal: string;
+    statHigh: string;
+    statMedium: string;
+    statLast90: string;
+    badgeFinal: string;
+    badgeDraft: string;
+    badgeUrgent: string;
+    badgePublished: string;
+    emptySelectSignal: string;
+    runAnalysis: string;
+    stopBtn: string;
+    sourceLink: string;
+    tabOverview: string;
+    tabObligations: string;
+    tabImpact: string;
+    tabChanges: string;
+    cardScopeHeader: string;
+    cardObligationsHeader: string;
+    obligationsEmpty: string;
+    colObligationDesc: string;
+    colSubject: string;
+    colType: string;
+    colDeadline: string;
+    deadlinePending: string;
+    cardAffectedDocs: string;
+    noAffectedDocs: string;
+    cardAIImpact: string;
+    footerText: string;
+    statusConnecting: string;
+    statusNoStream: string;
+    statusCrawling: string;
+    statusProcessing: string;
+    statusComplete: string;
+    statusUpdateComplete: string;
+    statusError: string;
+    statusConnFailed: string;
+  };
+  status: {
+    topbarTitle: string;
+    searchPlaceholder: string;
+    exportBtn: string;
+    refreshBtn: string;
+    newUploadBtn: string;
+    statTotal: string;
+    statIndexed: string;
+    statFailed: string;
+    statChunks: string;
+    statCoverage: string;
+    cardHealth: string;
+    badgeOnline: string;
+    badgeError: string;
+    badgeDegraded: string;
+    badgeUnknown: string;
+    healthEndpointError: string;
+    serviceEnabled: string;
+    serviceDisabled: string;
+    serviceNotLoaded: string;
+    cardConfig: string;
+    labelLLMProvider: string;
+    labelLLMModel: string;
+    labelEmbeddingModel: string;
+    labelEmbeddingDim: string;
+    labelMilvusCollection: string;
+    labelParserBackend: string;
+    labelChunkBackend: string;
+    labelParserFailureMode: string;
+    configLoadError: string;
+    cardBreakdown: string;
+    breakdownIndexed: string;
+    breakdownProcessing: string;
+    breakdownFailed: string;
+    cardRuntime: string;
+    labelActiveSessions: string;
+    labelSessionCapacity: string;
+    labelReranker: string;
+    labelBM25: string;
+    statusActive: string;
+    statusUnavailable: string;
+    footerAllOk: string;
+    footerDegraded: string;
+    footerChecking: string;
+  };
+  docs: {
+    topbarTitle: string;
+    searchPlaceholder: string;
+    refreshBtn: string;
+    uploadBtn: string;
+    confirmDeleteTitle: string;
+    cancelBtn: string;
+    deleteBtn: string;
+    filterAll: string;
+    filterReady: string;
+    filterProcessing: string;
+    filterFailed: string;
+    filterPending: string;
+    filterAllTypes: string;
+    selectedCount: string;   // '{n} document(s) selected' — use {n} placeholder
+    deleteSelected: string;
+    colName: string;
+    colStatus: string;
+    colUploaded: string;
+    colChunks: string;
+    colSize: string;
+    colType: string;
+    colActions: string;
+    loading: string;
+    emptyNoDocuments: string;
+    emptyNoMatch: string;
+    footerCount: string;     // '{n} of {m} document(s)'
+    titleDownload: string;
+    titleRetry: string;
+    titleDelete: string;
+    confirmSingle: string;   // '{name}' placeholder
+    confirmBatch: string;    // '{n}' placeholder
+  };
+  compliance: {
+    topbarTitle: string;
+    searchPlaceholder: string;
+    clearBtn: string;
+    exportBtn: string;
+    exportJSON: string;
+    exportText: string;
+    newAnalysisBtn: string;
+    statusAnalyzing: string;
+    statusComplete: string;
+    statusError: string;
+    emptyTitle: string;
+    emptyDesc: string;
+    colRetrieved: string;    // 'Retrieved Regulations {count}'
+    retrievingMsg: string;
+    defaultRegulation: string;
+    matchSuffix: string;
+    colParagraph: string;
+    extractingMsg: string;
+    noTextExtracted: string;
+    stagesHeader: string;
+    stageExtraction: string;
+    stageClauseSplit: string;
+    stageRetrieval: string;
+    stageSynthesis: string;
+    colFindings: string;     // 'Findings {count}'
+    gapInProgress: string;
+    askAIBtn: string;
+    chatBtn: string;
+    conclusionHeader: string;
+    riskScoreTooltip: string;
+    statusCovered: string;
+    statusGap: string;
+    statusCritical: string;
+    statusInfo: string;
+    sourceTypePasted: string;
+    sourceTypeIndexed: string;
+    sourceTypeUploaded: string;
+    chatSidebarHeader: string;
+    chatThinking: string;
+    quickQ1: string;
+    quickQ2: string;
+    quickQ3: string;
+    chatPlaceholder: string;
+    sendBtn: string;
+    analysisFailed: string;
+    exportReportHeader: string;
+    exportSectionParagraph: string;
+    exportSectionFindings: string;
+    exportSectionConclusion: string;
+    exportSectionActions: string;
+    historyHeader: string;
+    downloadReport: string;
+    historyEmpty: string;
+    historyDeleteConfirm: string;
+    drawerClose: string;
+    drawerChatEmpty: string;
+    drawerSuggestionsHeader: string;
+  };
+  ragchat: {
+    topbarTitle: string;
+    exportBtn: string;
+    quickPromptsHeader: string;
+    inputPlaceholder: string;
+    citationsHeader: string;    // 'Sources {count}'
+    citationsEmpty: string;
+    jumpToSource: string;       // 'Jump to source [N]'
+    apiError: string;
+    quickPrompt1: string;
+    quickPrompt2: string;
+    quickPrompt3: string;
+    quickPrompt4: string;
+  };
+}
+```
+
+---
+
+## Language Toggle Button
+
+Location: `Sidebar.tsx` footer `<div style={{ display: 'flex', gap: 4 }}>`.
+
+Inserted **left of** the existing theme button:
+
+```tsx
+<button className="theme-btn" onClick={toggleLang} title={t.sidebar.toggleLang}>
+  {lang === 'en' ? 'EN' : '中'}
+</button>
+```
+
+- Reuses existing `theme-btn` CSS class — no new styles needed.
+- Displays two-character label: `EN` or `中`.
+- `title` attribute (tooltip) translates with the rest of the UI.
+
+---
+
+## Translation Files (complete values)
+
+### `locales/en.ts` (English — default)
+
+Key values (representative; full file contains all keys above):
+
+```ts
+nav: { groupMain: 'Main', groupWorkbench: 'Workbench', groupChat: 'Chat',
+       overview: 'Overview', signals: 'Regulatory Signals', status: 'System Status',
+       documents: 'Documents', compliance: 'Compliance Analysis', chat: 'Regulation Q&A' },
+sidebar: { toggleTheme: 'Toggle theme', toggleLang: 'Switch language', signOut: 'Sign out' },
+signals: { refreshBtn: 'Refresh Sources', crawlingBtn: 'Crawling...', ... },
+docs: { uploadBtn: 'Upload document', deleteBtn: 'Delete', cancelBtn: 'Cancel', ... },
+compliance: { newAnalysisBtn: 'New analysis', analyzeBtn: 'Analyze', sendBtn: 'Send', ... },
+ragchat: { exportBtn: 'Export chat', inputPlaceholder: 'Ask about your regulations…', ... },
+```
+
+### `locales/zh.ts` (Simplified Chinese)
+
+Key values:
+
+```ts
+nav: { groupMain: '主菜单', groupWorkbench: '工作台', groupChat: '对话',
+       overview: '概览', signals: '法规信号', status: '系统状态',
+       documents: '文档管理', compliance: '合规分析', chat: '法规问答' },
+sidebar: { toggleTheme: '切换主题', toggleLang: '切换语言', signOut: '退出' },
+signals: { refreshBtn: '刷新数据源', crawlingBtn: '抓取中...', ... },
+docs: { uploadBtn: '上传文档', deleteBtn: '删除', cancelBtn: '取消', ... },
+compliance: { newAnalysisBtn: '新建分析', analyzeBtn: '开始分析', sendBtn: '发送', ... },
+ragchat: { exportBtn: '导出对话', inputPlaceholder: '请输入关于法规的问题…', ... },
+```
+
+---
+
+## App.tsx Provider Wrapping
+
+```tsx
+// Before
+<ThemeProvider>
+  <AuthProvider>
+    <PageStateProvider>
+      <AppRouter />
+    </PageStateProvider>
+  </AuthProvider>
+</ThemeProvider>
+
+// After
+<LanguageProvider>
+  <ThemeProvider>
+    <AuthProvider>
+      <PageStateProvider>
+        <AppRouter />
+      </PageStateProvider>
+    </AuthProvider>
+  </ThemeProvider>
+</LanguageProvider>
+```
+
+`LanguageProvider` is outermost so it is available to all components including the theme toggle itself.
+
+---
+
+## Usage in Components
+
+```tsx
+import { useLanguage } from '../../contexts/LanguageContext';
+
+function MyComponent() {
+  const { t } = useLanguage();
+  return <button>{t.docs.uploadBtn}</button>;
+}
+```
+
+No wrapping needed — `t` is always the correct object for the current language.
+
+---
+
+## Files Changed
+
+| File | Action |
+|------|--------|
+| `src/contexts/LanguageContext.tsx` | New — `LanguageProvider`, `useLanguage()`, `Lang` type |
+| `src/locales/en.ts` | New — complete English `Translations` object |
+| `src/locales/zh.ts` | New — complete Chinese `Translations` object |
+| `src/App.tsx` | Add `<LanguageProvider>` wrapper |
+| `src/components/layout/Sidebar.tsx` | Add language toggle button; replace nav group titles and labels with `t.nav.*` |
+| `src/pages/Overview/OverviewPage.tsx` | Replace all UI strings with `t.overview.*` |
+| `src/pages/Perception/PerceptionPage.tsx` | Replace all UI strings with `t.signals.*` |
+| `src/pages/Status/StatusPage.tsx` | Replace all UI strings with `t.status.*` |
+| `src/pages/Docs/DocsPage.tsx` | Replace all UI strings with `t.docs.*` |
+| `src/pages/Compliance/CompliancePage.tsx` | Replace all UI strings with `t.compliance.*` |
+| `src/pages/RagChat/RagChatPage.tsx` | Replace all UI strings with `t.ragchat.*` |
+| `src/pages/Compliance/HistoryRail.tsx` | Replace UI strings with `t.compliance.*` |
+| `src/pages/Compliance/FindingChatDrawer.tsx` | Replace UI strings with `t.compliance.*` |
+
+---
+
+## Non-Goals
+
+- Persistence across sessions (no localStorage for language preference)
+- More than two languages
+- RTL layout support
+- Pluralisation helpers (simple string substitution with `{n}` placeholders is sufficient — callers replace via `t.docs.selectedCount.replace('{n}', String(count))`)
+- Translation of API-returned content, mock data, regulation names, or document file names
+- Date/number formatting localisation
+
+---
+
+## Constraints
+
+- Zero new npm dependencies
+- Follow existing `ThemeContext` pattern exactly
+- Backend comments/docstrings: English only (no backend changes in this feature)
+- Git commits made by the user, never automated
--- a/docs_dump.txt
+++ b/docs_dump.txt
@@ -0,0 +1,108 @@
+===== PPTX =====
+--- Slide 1 ---: AI + 法律法规 | 合规智能中枢 | 面向车企与工厂的 AI 驱动合规解决方案 | 2026年4月  |  EMS & EHS Compliance Intelligence Hub | AI Compliance
+Intelligence Hub | Internal  |  AI 合规智能中枢  |  2026.04
+--- Slide 2 ---: 背景与挑战 | 车企和工厂面临的合规困境 | 法规来源复杂 | 国标GB · MIIT · UN-ECE
+IATF 16949 · ISO 45001
+多轨并行，难以统管 | 更新频率高 | 新能源 · 数据安全 · 碳排放
+PIPL · NEV积分 · CCER
+政策持续迭代 | 跨语言需求 | 中英文法规混存
+跨国工厂多语言
+合规场景并存 | 文档高度分散 | 分散于 Confluence
+SharePoint · ERP · PLM
+无法联通查询 | 隐患识别被动 | EHS 安全依赖人工
+隐患发现滞后
+缺乏预防性机制 | 覆盖核心法规域 | 🚗 车辆安全  GB 7258 · GB 18384 · UN-ECE R155/156 | 🔒 数据安全  PIPL · DSL · GB/T 35273 | 🏭 工厂EHS  GB 6441 · AQ/T系列 · ISO 45001 | ♻️ 碳排放    NEV积分 · CCER · 欧盟碳边境税 | ✅ 质量管理  IATF 16949 · GB/T 19001 | AI 合规智能中枢  |  面向车企与工厂  |  2026.04 | 2 / 13
+--- Slide 3 ---: 产品定位与整体架构 | AI 驱动的全链路合规智能平台 | AI 合规智能中枢 | 📚  知识库构建 | 内外部法规 · 历史案例
+统一知识图谱 · 自动更新 | 💬  智能问答 | 混合检索 · 语义+关键词
+中英双语 · 引文溯源 | 📄  合规审查 | PDF/Word上传
+自动比对法规 · 风险标注 | 🔌  API集成 | 对接PLM · ERP · OA · MES | 🎯  个性化推荐 | 角色画像 · 上下文感知 | 📢  定制推送 | Email · Teams
+飞书 · 钉钉
+法规变更
+实时通知 | 🦺  EHS 隐患识别 & 管理体系审计（C-SG专项） | 事故报告 NLP | SIF潜力识别 | 四维根因分析 | ISO 45001 要素扫描 | 自动生成审计报告 | 趋势分析仪表板 | AI 合规智能中枢  |  面向车企与工厂  |  2026.04 | 3 / 13
+--- Slide 4 ---: 功能一：合规知识库构建与动态更新 | 统一接入内外部法规，构建可检索的结构化知识库 | 📥  数据来源 | 内部文档 | Confluence · SharePoint
+飞书 · 历史合规报告 · 审计记录 | ↓ | 外部法规 | 国标全文库 · 工标网
+MIIT政策 · UN-ECE · EUR-Lex | ↓ | 历史案例 | 处罚案例库 · 整改记录
+行业事故通报 | ⚙️  处理流程 | 1 | ① 文档解析 | 版面感知OCR，扫描件 · PDF表格 · 多栏 · Word/Excel | ↓ | 2 | ② 智能分块 | 章节级 / 条款级双粒度切割，保留语义完整性 | ↓ | 3 | ③ 向量化存储 | 多语言嵌入（中英双语），向量库 + 关键词索引双轨 | ↓ | 4 | ④ 知识图谱 | 法规实体 → 条款 → 义务 → 适用范围关系图谱 | ↓ | 5 | ⑤ 自动更新 | 定时监控法规变更，触发增量重索引 + 版本管理 | ✨  核心价值 | 数据不出厂 | 私有化本地部署
+满足PIPL/DSL数据主权 | 权限分级管理 | 研发/生产/采购/法务
+差异化访问控制 | 实时保鲜 | 法规修订自动触发重索引
+确保知识时效性 | 多格式支持 | 扫描件 · PDF · Word
+Excel · 标准文件全覆盖 | AI 合规智能中枢  |  面向车企与工厂  |  2026.04 | 4 / 13
+--- Slide 5 ---: 功能二：混合检索智能问答引擎 | 语义检索 + 关键词检索 + 知识图谱，生成可溯源的合规决策建议 | 用户提问 | 中 / 英 / 混合
+自然语言输入 | ▶ | 意图理解 | 识别法规实体
+适用场景 · 地域 | ▶ | 混合检索 | BM25关键词
+ 语义向量
+本地+网络双路 | ▶ | 重排序 | Cross-Encoder
+精排召回结果 | ▶ | 生成回答 | 引文锚定输出
+置信度评分
+页码溯源 | 典型问答场景 | 法规解读 | "我们的纯电SUV需满足哪些GB强制认证要求？" | 政策查询 | "2025年NEV积分核算方式有哪些最新变化？" | 合规判断 | "供应商A的REACH声明是否满足我司采购合规要求？" | 多跳推理 | "ISO 45001变更管理要求，对应哪些内部流程需更新？" | 对比分析 | "GB 18384与欧盟ECE R100在电池安全上有哪些差异？" | 📎 引文溯源 | 答案标注原文出处
+页码精确定位 | 🌐 多语言支持 | 中英混合检索
+无需切换语言 | ⚖️ 决策辅助 | 结合内部制度
+输出综合建议 | 🔄 图谱增强 | 关联上下游条款
+多跳推理支持 | AI 合规智能中枢  |  面向车企与工厂  |  2026.04 | 5 / 13
+--- Slide 6 ---: 功能三：智能文档合规审查 | 上传 PDF/Word，自动比对法规库，标注风险并给出整改建议 | ⚙️  审查流程 | 1 | ① 文件上传 | PDF · Word · Excel · 扫描件，支持批量 | ↓ | 2 | ② 文档解析 | 版面感知OCR，段落/条款级分块 | ↓ | 3 | ③ 法规域匹配 | 根据文档类型+内容自动识别适用法规域 | ↓ | 4 | ④ 合规比对 | 条款级语义对比，缺项检测 · 风险评分 | ↓ | 5 | ⑤ 报告输出 | 非合规位置标注，整改建议 · 风险等级 | 📋  报告输出内容 | 📍 | 非合规位置标注 | 页码 + 段落高亮，一键跳转原文 | ⚠️ | 风险等级分级 | 红（高危）/ 橙（中）/ 黄（低）三级 | 📖 | 法规条款引用 | 精确关联对应法规原文条款编号 | 🔧 | 整改建议 | 基于历史合规案例，给出可执行方案 | 📂  适用文档类型 | 供应商合规声明 | REACH/RoHS · 碳足迹申报 | 新产品EHS评估 | GB安全标准覆盖完整性核查 | 工厂安全作业规程 | AQ/T符合性 · 许可条款 | 劳动合同/协议 | 劳动法 · 工时 · 竞业条款 | 数据处理协议 | PIPL/GDPR 数据主体权利 | 供应链碳申报 | CCER/CBAM 核算方法验证 | AI 合规智能中枢  |  面向车企与工厂  |  2026.04 | 6 / 13
+--- Slide 7 ---: EHS 隐患识别 & 管理体系审计（C-SG专项） | AI驱动的主动安全预防：从被动响应到预测性干预 | 📥  数据输入 | 📝  事故/事件报告文本 · 巡检记录 · 安全观察卡 | 📊  设备运行数据 · 工伤统计 · 隐患整改台账 | 📷  现场照片（目标检测）· 视频（行为分析，可选） | 🤖  AI隐患识别引擎 | NLP文本分析 | 从叙述性文本中提取隐患实体
+触发因素 · 伤害类型 · 位置信息 | SIF风险评分 | 高严重性事件潜力预测
+优先处置最高风险隐患 | 四维根因分析 | 人因/设备/管理/环境
+系统性根因挖掘 | 法规自动关联 | 与GB 6441/AQ系列/ISO 45001
+自动映射对应条款 | 📋  体系审计功能 | ✓  ISO 45001要素覆盖度扫描（PDCA完整性） | ✓  历史案例相似度匹配与经验复用 | ✓  整改优先级排序（风险×紧迫×可行性） | ✓  审计报告自动生成（条款级评分） | ⚠️  典型隐患场景 | ▸  高处坠落 | AQ/T 3049 | ▸  有限空间 | AQ 3028 | ▸  化学品管理 | GB 13690 | ▸  设备点检 | IATF §8.5 | ▸  应急演练 | ISO 45001 §8.2 | 📤  输出成果 | 隐患清单 | 位置 · 类型
+风险等级
+法规依据
+整改建议 | 体系审计
+报告 | 条款级符合
+性评分
+整改优先级 | 趋势分析
+仪表板 | 隐患热图
+月度趋势
+部门对比 | AI 合规智能中枢  |  面向车企与工厂  |  2026.04 | 7 / 13
+--- Slide 8 ---: 系统集成 · 个性化推荐 · 定制推送 | 合规能力 API 化，主动触达用户，融入业务流程 | 🔌  合规审查 API 化 | POST | /compliance/check | 大文本分片合规检查 | POST | /compliance/upload | PDF/Word文件上传审查 | GET | /compliance/query | 法规知识库问答 | POST | /compliance/subscribe | 法规变更Webhook订阅 | 🔗  企业系统集成 | PLM | 新产品立项/BOM变更 | →  自动触发法规适用性检查 | ERP | 供应商准入/合同签署 | →  供应商自动合规评分 | OA | 合同/协议提交审批 | →  高风险自动抄送法务 | MES | 生产工艺变更 | →  触发EHS合规影响评估 | 🎯  个性化推荐 | 👤  角色画像：EHS · 法务 · 采购 · 研发 | 💡  上下文感知：对话主题 → 关联法规推荐 | 🔔  到期提醒：认证到期 · 法规更新预警 | 📈  行为学习：历史查询 → 智能问题推荐 | 📢  定制化法规推送 | 📧  Email | HTML富文本，含变更对比 | 💬  Teams | 企业Bot，实时推送 | 📱  飞书/钉钉 | 企业机器人，移动端 | 🔔  站内消息 | 系统内通知中心 | ⚙️  推送规则引擎 | ▸  订阅维度： | 按法规域 / 业务场景 / 地域灵活订阅 | ▸  优先级： | 🔴 强制  🟠 推荐  🔵 参考  三级分类 | ▸  免打扰： | 工作时间推送 · 摘要合并 · 频率上限 | ▸  内容生成： | LLM自动生成变更摘要 + 影响分析 + 行动项 | AI 合规智能中枢  |  面向车企与工厂  |  2026.04 | 8 / 13
+--- Slide 9 ---: 关键挑战与应对策略 | 确保合规建议的准确性、时效性与数据安全 | LLM幻觉风险 | 问题 | 合规建议失真
+可能导致法律责任 | 应对 | 引文锚定 + 输出验证
+高风险强制人工审核 | 数据主权 | 问题 | 敏感文件不能
+上传公有云 | 应对 | 全链路私有化部署
+数据不出厂 | 法规时效性 | 问题 | 知识库滞后
+导致错误建议 | 应对 | 自动更新机制
+时间戳标注 + 提醒 | 跨语言质量 | 问题 | 中英混合场景
+检索精度下降 | 应对 | 多语言嵌入模型
+语言标签过滤策略 | 大文件性能 | 问题 | GB标准数百页
+处理超时风险 | 应对 | 流式处理 + 分层索引
+异步队列实时进度 | 权限管控 | 问题 | 不同角色需
+不同密级访问 | 应对 | RBAC权限体系
+知识库分区 + 审计日志 | AI 合规智能中枢  |  面向车企与工厂  |  2026.04 | 9 / 13
+--- Slide 10 ---: 分阶段实施路线 | 从核心知识库到全链路合规智能，稳步落地 | 第一阶段 | 0 - 3 个月 | 知识库 + 基础问答 | 1 | 部署合规知识库平台，接入内部文档 | 2 | 接入 GB 标准 · AQ 系列 · IATF 16949 | 3 | 上线中英双语混合检索问答界面 | 4 | 完成权限分级与数据安全配置 | 第二阶段 | 3 - 6 个月 | 文档审查 + API 集成 | 1 | 构建文档合规审查引擎（PDF/Word） | 2 | 完成合规 API 封装，对接PLM/ERP/OA | 3 | 上线法规变更监控与推送服务 | 4 | 接入 Teams / 飞书 Bot 推送渠道 | 第三阶段 | 6 - 12 个月 | EHS隐患识别 + 个性化 | 1 | 构建 EHS 隐患识别与体系审计模块 | 2 | 引入知识图谱，支持多跳推理 | 3 | 上线个性化推荐引擎（角色画像） | 4 | 全链路合规智能体系正式上线 | ▶ | ▶ | AI 合规智能中枢  |  面向车企与工厂  |  2026.04 | 10 / 13
+--- Slide 11 ---: 三类合规闭环场景 | 从「发现问题」到「关闭归档」的完整业务闭环 | 📡  法规变更合规闭环 | 1 | ①  | 法规监控 |  ( | 扩展功能 | ) | 国内外法规数据库实时监控
+自动检测条款变更与新法发布 | ↓ | 2 | ② 知识库更新 | 变更内容自动解析入库
+版本管理 + 影响范围标注 | ↓ | 3 | ③ 精准推送 | 按角色/业务域推送变更摘要
+Email · Teams · 飞书多渠道 | ↓ | 4 | ④ 差距分析 | AI对比新旧法规差异
+识别企业现行制度缺口 | ↓ | 5 | ⑤  | 整改执行 |  ( | 扩展功能 | ) | 生成整改任务清单
+关联责任人与完成时限 | ↓ | 6 | ⑥  | 闭环归档 |  ( | 扩展功能 | ) | 整改完成后验收确认 | 
+ | 合规证据归档留存 | 归档的文档放在 | share point  | 同步更新知识库 | ↺  持续监控 → 知识库保鲜 → 合规常态化 | 📄  文档审查合规闭环 | 1 | ① 文件上传 | PDF · Word · Excel · 扫描件
+支持批量上传与拖拽 | ↓ | 2 | ② AI解析 | 版面感知OCR，条款级分块
+自动识别文档类型与法规域 | ↓ | 3 | ③ 合规比对 | 条款级语义对比法规库
+缺项检测 · 风险评分 | ↓ | 4 | ④ 风险标注 | 页码+段落精确定位
+红/橙/黄三级风险可视化 | ↓ | 5 | ⑤ 整改建议 | AI生成具体整改方案
+关联历史合规最佳实践 | ↓ | 6 | ⑥ 复审归档 | 整改后重新提交复核 | 
+ | 通过后合规证明自动归档 | 归档的文档放在 | share point  | 同步更新知识库 | ↺  上传即审查 → 整改即跟踪 → 归档即留证 | 🦺   | EHS安全管理闭环 |  ( | 扩展功能 | ) | 1 | ① 隐患发现 | NLP解析巡检/事故报告文本
+图像识别 · 传感器数据接入 | ↓ | 2 | ② 风险评级 | SIF潜力评分 + 四维根因分析
+高/中/低三级优先级排序 | ↓ | 3 | ③ 任务派发 | 自动生成整改工单
+关联责任人 · 截止时间 · 法规依据 | ↓ | 4 | ④ 过程跟踪 | 整改进度实时可视化
+超期自动升级提醒 | ↓ | 5 | ⑤ 验收关闭 | 整改完成后现场复查
+AI辅助验收确认 | ↓ | 6 | ⑥ 体系优化 | 根因数据回流知识库
+优化隐患模型与预防策略 | ↺  发现即评级 → 整改即跟踪 → 关闭即优化 | AI 合规智能中枢  |  面向车企与工厂  |  2026.04 | 11 / 13
+--- Slide 12 ---: 组织架构与 |  RBAC  | 权限体系 | 按角色分级授权，确保数据安全与合规责任落实到人 | 🏢  组织架构层级 | 集团 / 总部 | 合规委员会 · 法务部 · EHS总监 | ▼ | 事业部 / 工厂 | EHS部门 · 质量部 · 采购部 · 研发部 | ▼ | 业务线 / 车间 | 安全员 · 质检员 · 工艺工程师 | ▼ | 外部协作方 | 供应商 · 第三方审计 · 监管机构 | 🔐  角色权限矩阵（RBAC） | 知识库
+查询 | 文档
+审查 | EHS
+审计 | 法规
+推送 | 系统
+管理 | 合规管理员 | ● | ● | ● | ★ | ★ | 法务专员 | ● | ● | ◑ | ◑ | ○ | EHS工程师 | ● | ◑ | ● | ◑ | ○ | 采购专员 | ◑ | ● | ○ | ◑ | ○ | 研发工程师 | ◑ | ◑ | ○ | ◑ | ○ | 工厂安全员 | ◑ | ○ | ● | ◑ | ○ | 供应商（外部） | ○ | ◑ | ○ | ○ | ○ | ● 完全权限 | ◑ 只读/有限 | ○ 无权限 | ★ 管理权限 | AI 合规智能中枢  |  面向车企与工厂  |  2026.04 | 12 / 13
+--- Slide 13 ---: 总结与下一步行动 | 构建面向车企与工厂的 AI 驱动全链路合规智能体系 | 📚 | 知识统一 | 内外部法规 + 历史案例
+一库统管，自动更新 | 💬 | 智能问答 | 混合检索 + 知识图谱
+可溯源的决策建议 | 📄 | 合规审查 | AI自动比对标注
+风险等级 + 整改建议 | 🦺 | EHS防控 | SIF预测 + 体系审计
+被动响应到主动预防 | 🔌 | 无缝集成 | API化能力嵌入
+PLM · ERP · OA · MES | 建议下一步行动 | 01 | 需求确认 | 与EHS · 法务 · 采购
+核心用户开展访谈 | 02 | POC验证 | 选取2-3个场景快速
+搭建原型验证可行性 | 03 | 数据准备 | 梳理内部文档，确认
+数据分级与权限策略 | 04 | 架构评审 | 与IT安全团队确认
+私有化部署与集成规范 | AI 合规智能中枢  |  面向车企与工厂  |  2026.04 | 13 / 13
+
+===== DOCX =====
--- a/frontend/src/App.tsx
+++ b/frontend/src/App.tsx
@@ -1,12 +1,18 @@
 import './styles/globals.css';
-import { ThemeProvider } from './contexts';
+import { ThemeProvider, AuthProvider, PageStateProvider, LanguageProvider } from './contexts';
 import { AppRouter } from './router/AppRouter';

 function App() {
  return (
-    <ThemeProvider>
-      <AppRouter />
-    </ThemeProvider>
+    <LanguageProvider>
+      <ThemeProvider>
+        <AuthProvider>
+          <PageStateProvider>
+            <AppRouter />
+          </PageStateProvider>
+        </AuthProvider>
+      </ThemeProvider>
+    </LanguageProvider>
  );
 }

--- a/frontend/src/api/auth.ts
+++ b/frontend/src/api/auth.ts
@@ -0,0 +1,43 @@
+const AUTH_API_BASE = '/api/v1';
+
+export interface TokenResponse {
+  access_token: string;
+  token_type: string;
+  expires_in: number;
+}
+
+export interface MeResponse {
+  user_id: string;
+  username: string;
+  role: string;
+}
+
+export async function loginRequest(
+  username: string,
+  password: string,
+): Promise<TokenResponse> {
+  const body = new URLSearchParams();
+  body.set('username', username);
+  body.set('password', password);
+
+  const res = await fetch(`${AUTH_API_BASE}/auth/token`, {
+    method: 'POST',
+    headers: { 'Content-Type': 'application/x-www-form-urlencoded' },
+    body: body.toString(),
+  });
+
+  if (!res.ok) {
+    const payload = await res.json().catch(() => ({})) as { detail?: string };
+    throw new Error(payload.detail ?? `Login failed (${res.status})`);
+  }
+
+  return res.json() as Promise<TokenResponse>;
+}
+
+export async function getMeRequest(token: string): Promise<MeResponse> {
+  const res = await fetch(`${AUTH_API_BASE}/auth/me`, {
+    headers: { Authorization: `Bearer ${token}` },
+  });
+  if (!res.ok) throw new Error(`Unauthorised (${res.status})`);
+  return res.json() as Promise<MeResponse>;
+}
--- a/frontend/src/api/docs.ts
+++ b/frontend/src/api/docs.ts
@@ -1,6 +1,12 @@
 import type { DocInfo, DocListResponse, DocUploadResponse } from './index';
 import { API_BASE_URL } from './index';

+const TOKEN_KEY = 'auth_token';
+function authHeaders(extra?: Record<string, string>): Record<string, string> {
+  const token = localStorage.getItem(TOKEN_KEY);
+  return token ? { Authorization: `Bearer ${token}`, ...extra } : { ...extra };
+}
+
 interface BackendDocumentItem {
  doc_id: string;
  doc_name: string;
@@ -76,6 +82,7 @@ export async function uploadDocument(

  const response = await fetch(`${API_BASE_URL}/documents/upload`, {
    method: 'POST',
+    headers: authHeaders(),
    body: formData,
  });

@@ -95,7 +102,9 @@ export async function uploadDocument(
 }

 export async function getDocumentList(): Promise<DocListResponse> {
-  const response = await fetch(`${API_BASE_URL}/documents/management-list`);
+  const response = await fetch(`${API_BASE_URL}/documents/management-list`, {
+    headers: authHeaders(),
+  });
  if (!response.ok) {
    throw new Error(`List failed: ${response.status}`);
  }
@@ -107,7 +116,9 @@ export async function getDocumentList(): Promise<DocListResponse> {
 }

 export async function getDocumentStatus(docId: string): Promise<DocUploadResponse> {
-  const response = await fetch(`${API_BASE_URL}/documents/status/${docId}`);
+  const response = await fetch(`${API_BASE_URL}/documents/status/${docId}`, {
+    headers: authHeaders(),
+  });
  if (!response.ok) {
    throw new Error(`Status check failed: ${response.status}`);
  }
@@ -115,14 +126,20 @@ export async function getDocumentStatus(docId: string): Promise<DocUploadRespons
 }

 export async function deleteDocument(docId: string): Promise<void> {
-  const response = await fetch(`${API_BASE_URL}/documents/${docId}`, { method: 'DELETE' });
+  const response = await fetch(`${API_BASE_URL}/documents/${docId}`, {
+    method: 'DELETE',
+    headers: authHeaders(),
+  });
  if (!response.ok) {
    throw new Error(`Delete failed: ${response.status}`);
  }
 }

 export async function retryDocument(docId: string): Promise<DocUploadResponse> {
-  const response = await fetch(`${API_BASE_URL}/documents/${docId}/retry`, { method: 'POST' });
+  const response = await fetch(`${API_BASE_URL}/documents/${docId}/retry`, {
+    method: 'POST',
+    headers: authHeaders(),
+  });
  if (!response.ok) {
    throw new Error(`Retry failed: ${response.status}`);
  }
@@ -132,10 +149,10 @@ export async function retryDocument(docId: string): Promise<DocUploadResponse> {
 export async function searchRegulations(query: string, topK: number = 8): Promise<RegulationSearchResponse> {
  const response = await fetch(`${API_BASE_URL}/knowledge/retrieval`, {
    method: 'POST',
-    headers: {
+    headers: authHeaders({
      Accept: 'application/json',
      'Content-Type': 'application/json',
-    },
+    }),
    body: JSON.stringify({ query, top_k: topK }),
  });

--- a/frontend/src/api/index.ts
+++ b/frontend/src/api/index.ts
@@ -1,5 +1,12 @@
 const API_BASE_URL = '/api/v1';

+const TOKEN_KEY = 'auth_token';
+
+/** Read the stored JWT without importing AuthContext (avoids circular deps). */
+function getStoredToken(): string | null {
+  return localStorage.getItem(TOKEN_KEY);
+}
+
 interface ApiErrorPayload {
  detail?: string;
  message?: string;
@@ -19,8 +26,24 @@ async function readErrorMessage(response: Response): Promise<string> {
  }
 }

+/** Inject Authorization header when a token is available. */
+function withAuth(headers: Headers): Headers {
+  const token = getStoredToken();
+  if (token && !headers.has('Authorization')) {
+    headers.set('Authorization', `Bearer ${token}`);
+  }
+  return headers;
+}
+
+/** Handle 401 by clearing the stored token so the app redirects to login. */
+function handle401() {
+  localStorage.removeItem(TOKEN_KEY);
+  // Emit a custom event so AuthContext / router can react without a direct import.
+  window.dispatchEvent(new CustomEvent('auth:unauthorized'));
+}
+
 export async function fetchAPI<T>(endpoint: string, options?: RequestInit): Promise<T> {
-  const headers = new Headers(options?.headers);
+  const headers = withAuth(new Headers(options?.headers));
  if (!headers.has('Accept')) {
    headers.set('Accept', 'application/json');
  }
@@ -33,6 +56,11 @@ export async function fetchAPI<T>(endpoint: string, options?: RequestInit): Prom
    headers,
  });

+  if (response.status === 401) {
+    handle401();
+    throw new Error('Session expired, please log in again.');
+  }
+
  if (!response.ok) {
    throw new Error(`API Error: ${await readErrorMessage(response)}`);
  }
@@ -54,15 +82,25 @@ export async function streamSSE<TMessage extends SSEMessage>(
  onError?: (error: Error) => void,
  onComplete?: () => void
 ): Promise<void> {
+  const headers: Record<string, string> = {
+    Accept: 'text/event-stream',
+    'Content-Type': 'application/json',
+  };
+  const token = getStoredToken();
+  if (token) headers['Authorization'] = `Bearer ${token}`;
+
  const response = await fetch(buildUrl(endpoint), {
    method: 'POST',
-    headers: {
-      Accept: 'text/event-stream',
-      'Content-Type': 'application/json',
-    },
+    headers,
    body: JSON.stringify(body),
  });

+  if (response.status === 401) {
+    handle401();
+    onError?.(new Error('Session expired, please log in again.'));
+    return;
+  }
+
  if (!response.ok) {
    onError?.(new Error(`HTTP error! status: ${await readErrorMessage(response)}`));
    return;
--- a/frontend/src/api/perception.ts
+++ b/frontend/src/api/perception.ts
@@ -1,4 +1,9 @@
 const PERCEPTION_API_BASE = '/api/v1';
+const TOKEN_KEY = 'auth_token';
+function authHeader(): Record<string, string> {
+  const t = localStorage.getItem(TOKEN_KEY);
+  return t ? { Authorization: `Bearer ${t}` } : {};
+}

 export type ImpactLevel = 'high' | 'medium' | 'low';
 export type EventStatus = 'enacted' | 'draft' | 'consultation';
@@ -48,7 +53,7 @@ export interface AnalysisSSEMessage {
 }

 export async function getPerceptionStats(): Promise<PerceptionStats> {
-  const res = await fetch(`${PERCEPTION_API_BASE}/perception/stats`);
+  const res = await fetch(`${PERCEPTION_API_BASE}/perception/stats`, { headers: authHeader() });
  if (!res.ok) throw new Error(`stats failed: ${res.status}`);
  return res.json() as Promise<PerceptionStats>;
 }
@@ -62,7 +67,7 @@ export async function listEvents(params?: {
  if (params?.source) query.set('source', params.source);
  if (params?.impact_level) query.set('impact_level', params.impact_level);
  if (params?.limit) query.set('limit', String(params.limit));
-  const res = await fetch(`${PERCEPTION_API_BASE}/perception/events?${query.toString()}`);
+  const res = await fetch(`${PERCEPTION_API_BASE}/perception/events?${query.toString()}`, { headers: authHeader() });
  if (!res.ok) throw new Error(`list events failed: ${res.status}`);
  return res.json() as Promise<EventListResponse>;
 }
@@ -76,7 +81,7 @@ export async function analyzeEvent(
  try {
    const res = await fetch(`${PERCEPTION_API_BASE}/perception/events/${eventId}/analyze`, {
      method: 'POST',
-      headers: { Accept: 'text/event-stream' },
+      headers: { Accept: 'text/event-stream', ...authHeader() },
      signal,
    });
    if (!res.ok || !res.body) throw new Error(`analyze failed: ${res.status}`);
--- a/frontend/src/api/rag.ts
+++ b/frontend/src/api/rag.ts
@@ -1,6 +1,8 @@
 import type { QuickQuestionsResponse, SSEMessage } from './index';

 const AGENT_API_BASE = '/api/v1';
+const TOKEN_KEY = 'auth_token';
+function getToken(): string | null { return localStorage.getItem(TOKEN_KEY); }

 const _FALLBACK_QUESTIONS = [
  { id: '1', question: '请总结最新入库法规对电池安全的核心要求', category: '法规解读' },
@@ -100,6 +102,7 @@ export async function ragChat(
      headers: {
        'Content-Type': 'application/json',
        Accept: 'text/event-stream',
+        ...(getToken() ? { Authorization: `Bearer ${getToken()}` } : {}),
      },
      body: JSON.stringify({
        query,
--- a/frontend/src/components/layout/Sidebar.tsx
+++ b/frontend/src/components/layout/Sidebar.tsx
@@ -1,9 +1,11 @@
 import { NavLink } from 'react-router-dom';
 import {
  LayoutDashboard, Radio, Monitor, FileText,
-  Shield, MessageSquare, Sun, Moon
+  Shield, MessageSquare, Sun, Moon, LogOut
 } from 'lucide-react';
 import { useTheme } from '../../contexts/ThemeContext';
+import { useAuth } from '../../contexts/AuthContext';
+import { useLanguage } from '../../contexts/LanguageContext';

 interface NavItem {
  to: string;
@@ -12,21 +14,6 @@ interface NavItem {
  badge?: number;
 }

-const mainNav: NavItem[] = [
-  { to: '/', icon: <LayoutDashboard size={16} />, label: 'Overview' },
-  { to: '/signals', icon: <Radio size={16} />, label: 'Regulatory Signals' },
-  { to: '/status', icon: <Monitor size={16} />, label: 'System Status' },
-];
-
-const workbenchNav: NavItem[] = [
-  { to: '/documents', icon: <FileText size={16} />, label: 'Documents' },
-  { to: '/compliance', icon: <Shield size={16} />, label: 'Compliance Analysis' },
-];
-
-const chatNav: NavItem[] = [
-  { to: '/chat', icon: <MessageSquare size={16} />, label: 'Regulation Q&A' },
-];
-
 function NavGroup({ title, items }: { title: string; items: NavItem[] }) {
  return (
    <div className="nav-group">
@@ -49,8 +36,33 @@ function NavGroup({ title, items }: { title: string; items: NavItem[] }) {
  );
 }

+/** Avatar initials from username (up to 2 chars). */
+function initials(name: string): string {
+  const parts = name.trim().split(/[\s_-]+/);
+  if (parts.length >= 2) return (parts[0][0] + parts[1][0]).toUpperCase();
+  return name.slice(0, 2).toUpperCase();
+}
+
 export function Sidebar() {
  const { theme, toggleTheme } = useTheme();
+  const { user, logout } = useAuth();
+  const { lang, t, toggleLang } = useLanguage();
+
+  const mainNav: NavItem[] = [
+    { to: '/', icon: <LayoutDashboard size={16} />, label: t.nav.overview },
+    { to: '/signals', icon: <Radio size={16} />, label: t.nav.signals },
+    { to: '/status', icon: <Monitor size={16} />, label: t.nav.status },
+  ];
+
+  const workbenchNav: NavItem[] = [
+    { to: '/documents', icon: <FileText size={16} />, label: t.nav.documents },
+    { to: '/compliance', icon: <Shield size={16} />, label: t.nav.compliance },
+  ];
+
+  const chatNav: NavItem[] = [
+    { to: '/chat', icon: <MessageSquare size={16} />, label: t.nav.chat },
+  ];
+
  return (
    <aside className="sidebar">
      <div className="sidebar-brand">
@@ -62,22 +74,43 @@ export function Sidebar() {
      </div>

      <nav className="sidebar-nav">
-        <NavGroup title="Main" items={mainNav} />
-        <NavGroup title="Workbench" items={workbenchNav} />
-        <NavGroup title="Chat" items={chatNav} />
+        <NavGroup title={t.nav.groupMain} items={mainNav} />
+        <NavGroup title={t.nav.groupWorkbench} items={workbenchNav} />
+        <NavGroup title={t.nav.groupChat} items={chatNav} />
      </nav>

      <div className="sidebar-footer">
        <div className="sidebar-user">
-          <div className="user-avatar">TS</div>
+          <div className="user-avatar">{user ? initials(user.username) : 'TS'}</div>
          <div className="user-info">
-            <div className="user-name">Analyst</div>
-            <div className="user-role">T-Systems</div>
+            <div className="user-name">{user?.username ?? 'Analyst'}</div>
+            <div className="user-role">
+              {user ? (
+                <span className="user-badge">{user.role}</span>
+              ) : (
+                'T-Systems'
+              )}
+            </div>
          </div>
        </div>
-        <button className="theme-btn" onClick={toggleTheme} title="Toggle theme">
-          {theme === 'dark' ? <Sun size={14} /> : <Moon size={14} />}
-        </button>
+        <div style={{ display: 'flex', gap: 4 }}>
+          <button
+            className="theme-btn"
+            onClick={toggleLang}
+            title={t.sidebar.toggleLang}
+            style={{ fontSize: 12, fontWeight: 600 }}
+          >
+            {lang === 'en' ? 'EN' : '中'}
+          </button>
+          <button className="theme-btn" onClick={toggleTheme} title={t.sidebar.toggleTheme}>
+            {theme === 'dark' ? <Sun size={14} /> : <Moon size={14} />}
+          </button>
+          {user && (
+            <button className="logout-btn" onClick={logout} title={t.sidebar.signOut}>
+              <LogOut size={14} />
+            </button>
+          )}
+        </div>
      </div>
    </aside>
  );
--- a/frontend/src/contexts/AuthContext.tsx
+++ b/frontend/src/contexts/AuthContext.tsx
@@ -0,0 +1,72 @@
+import React, { createContext, useCallback, useContext, useEffect, useState } from 'react';
+import { loginRequest, getMeRequest } from '../api/auth';
+
+const TOKEN_KEY = 'auth_token';
+
+export interface AuthUser {
+  user_id: string;
+  username: string;
+  role: string;
+}
+
+interface AuthContextValue {
+  token: string | null;
+  user: AuthUser | null;
+  loading: boolean;
+  login: (username: string, password: string) => Promise<void>;
+  logout: () => void;
+}
+
+const AuthContext = createContext<AuthContextValue>({
+  token: null,
+  user: null,
+  loading: true,
+  login: async () => {},
+  logout: () => {},
+});
+
+export function AuthProvider({ children }: { children: React.ReactNode }) {
+  const [token, setToken] = useState<string | null>(() => localStorage.getItem(TOKEN_KEY));
+  const [user, setUser] = useState<AuthUser | null>(null);
+  const [loading, setLoading] = useState(true);
+
+  // Validate the stored token on mount by calling /auth/me.
+  useEffect(() => {
+    if (!token) {
+      setLoading(false);
+      return;
+    }
+    getMeRequest(token)
+      .then(setUser)
+      .catch(() => {
+        // Token is expired or invalid — force re-login.
+        localStorage.removeItem(TOKEN_KEY);
+        setToken(null);
+      })
+      .finally(() => setLoading(false));
+  }, []); // eslint-disable-line react-hooks/exhaustive-deps
+
+  const login = useCallback(async (username: string, password: string) => {
+    const resp = await loginRequest(username, password);
+    const me = await getMeRequest(resp.access_token);
+    localStorage.setItem(TOKEN_KEY, resp.access_token);
+    setToken(resp.access_token);
+    setUser(me);
+  }, []);
+
+  const logout = useCallback(() => {
+    localStorage.removeItem(TOKEN_KEY);
+    setToken(null);
+    setUser(null);
+  }, []);
+
+  return (
+    <AuthContext.Provider value={{ token, user, loading, login, logout }}>
+      {children}
+    </AuthContext.Provider>
+  );
+}
+
+export function useAuth() {
+  return useContext(AuthContext);
+}
--- a/frontend/src/contexts/LanguageContext.tsx
+++ b/frontend/src/contexts/LanguageContext.tsx
@@ -0,0 +1,36 @@
+import React, { createContext, useContext, useState } from 'react';
+import { en } from '../locales/en';
+import type { Translations } from '../locales/en';
+import { zh } from '../locales/zh';
+
+export type Lang = 'en' | 'zh';
+
+interface LanguageContextValue {
+  lang: Lang;
+  t: Translations;
+  toggleLang: () => void;
+}
+
+const LanguageContext = createContext<LanguageContextValue>({
+  lang: 'en',
+  t: en,
+  toggleLang: () => {},
+});
+
+export function LanguageProvider({ children }: { children: React.ReactNode }) {
+  const [lang, setLang] = useState<Lang>('en');
+
+  const toggleLang = () => setLang(l => (l === 'en' ? 'zh' : 'en'));
+
+  const t = lang === 'en' ? en : zh;
+
+  return (
+    <LanguageContext.Provider value={{ lang, t, toggleLang }}>
+      {children}
+    </LanguageContext.Provider>
+  );
+}
+
+export function useLanguage() {
+  return useContext(LanguageContext);
+}
--- a/frontend/src/contexts/PageStateContext.tsx
+++ b/frontend/src/contexts/PageStateContext.tsx
@@ -0,0 +1,218 @@
+/**
+ * PageStateContext — preserves page-level session state across route changes.
+ *
+ * When React Router unmounts a page component, all its useState values are lost.
+ * This context lives above the router and holds the state that must survive
+ * navigation so users can switch modules and return without losing their work.
+ *
+ * Covered pages:
+ *  - RagChat:    message history, citation rail, sessionId, input draft
+ *  - Compliance: analysis result (sources, findings, conclusion, meta)
+ *  - Perception: selected signal, filter state, AI analysis output
+ */
+
+import React, { createContext, useContext, useState, useCallback, useRef } from 'react';
+
+// ── RagChat types ─────────────────────────────────────────────────────────────
+
+export interface RagMessage {
+  id: string;
+  role: 'user' | 'assistant';
+  text: string;
+  citationRefs?: number[];
+}
+
+export interface RagCitation {
+  index: number;
+  score: number;
+  name: string;
+  clause: string;
+  snippet: string;
+  docId?: string;
+}
+
+export interface RagChatState {
+  messages: RagMessage[];
+  citations: RagCitation[];
+  sessionId: string | null;
+  inputDraft: string;
+}
+
+const RAG_INIT: RagChatState = {
+  messages: [
+    {
+      id: 'init',
+      role: 'assistant',
+      text: 'Hello! I can answer questions about your indexed regulations and compliance documents. Try asking about EU AI Act requirements, MIIT rules, or ISO/SAE 21434 scope.',
+    },
+  ],
+  citations: [],
+  sessionId: null,
+  inputDraft: '',
+};
+
+// ── Compliance types ──────────────────────────────────────────────────────────
+
+export interface ComplianceSourceEvent {
+  standard: string;
+  clause: string;
+  score: number;
+  status: string;
+  full_content: string;
+}
+
+export interface ComplianceFindingEvent {
+  title: string;
+  desc: string;
+  status: 'ok' | 'warn' | 'risk';
+  clause_ref?: string;
+}
+
+export interface ComplianceActionItem {
+  label: string;
+  value: string;
+  risk?: boolean;
+}
+
+export interface ComplianceDonePayload {
+  conclusion: string;
+  actions: ComplianceActionItem[];
+  risk_score: number;
+  highlight_terms: string[];
+  para_text: string;
+}
+
+export interface ComplianceMeta {
+  title: string;
+  sourceType: 'text' | 'doc' | 'upload';
+  startedAt: string;
+}
+
+export type ComplianceStatus = 'idle' | 'streaming' | 'done' | 'error';
+
+export interface ComplianceState {
+  status: ComplianceStatus;
+  stageLabel: string;
+  stageKey: string;
+  meta: ComplianceMeta | null;
+  sources: ComplianceSourceEvent[];
+  findings: ComplianceFindingEvent[];
+  done: ComplianceDonePayload | null;
+  errorText: string;
+  // Direction B additions:
+  analysisId: string | null;
+  isReadOnly: boolean;
+  activeFindingId: string | null;
+}
+
+const COMPLIANCE_INIT: ComplianceState = {
+  status: 'idle',
+  stageLabel: '',
+  stageKey: '',
+  meta: null,
+  sources: [],
+  findings: [],
+  done: null,
+  errorText: '',
+  analysisId: null,
+  isReadOnly: false,
+  activeFindingId: null,
+};
+
+// ── Perception types ──────────────────────────────────────────────────────────
+
+export interface PerceptionSignal {
+  id: string;
+  source: string;
+  standard: string;
+  status: 'ok' | 'warn' | 'risk' | 'info';
+  title: string;
+  summary: string;
+  date: string;
+  tags: string[];
+  impact: 'High' | 'Medium' | 'Low';
+}
+
+export interface PerceptionPageState {
+  signals: PerceptionSignal[];
+  searchQuery: string;
+  sourceFilter: string;
+  impactFilter: string;
+  selectedId: string | null;
+  aiOutput: string;
+  detailTab: 'overview' | 'obligations' | 'assessment' | 'diff';
+  crawlStatus: string;
+}
+
+const PERCEPTION_INIT: PerceptionPageState = {
+  signals: [],
+  searchQuery: '',
+  sourceFilter: 'All',
+  impactFilter: 'All',
+  selectedId: null,
+  aiOutput: '',
+  detailTab: 'overview',
+  crawlStatus: '',
+};
+
+// ── Context value ─────────────────────────────────────────────────────────────
+
+interface PageStateContextValue {
+  // RagChat
+  ragState: RagChatState;
+  setRagState: React.Dispatch<React.SetStateAction<RagChatState>>;
+  ragStreamingRef: React.MutableRefObject<boolean>;
+  ragAbortRef: React.MutableRefObject<AbortController | null>;
+
+  // Compliance
+  complianceState: ComplianceState;
+  setComplianceState: React.Dispatch<React.SetStateAction<ComplianceState>>;
+  complianceAbortRef: React.MutableRefObject<AbortController | null>;
+  resetCompliance: () => void;
+
+  // Perception
+  perceptionState: PerceptionPageState;
+  setPerceptionState: React.Dispatch<React.SetStateAction<PerceptionPageState>>;
+  perceptionAbortRef: React.MutableRefObject<AbortController | null>;
+  perceptionCrawlAbortRef: React.MutableRefObject<AbortController | null>;
+}
+
+const PageStateContext = createContext<PageStateContextValue | null>(null);
+
+// ── Provider ──────────────────────────────────────────────────────────────────
+
+export function PageStateProvider({ children }: { children: React.ReactNode }) {
+  const [ragState, setRagState] = useState<RagChatState>(RAG_INIT);
+  const ragStreamingRef = useRef(false);
+  const ragAbortRef = useRef<AbortController | null>(null);
+
+  const [complianceState, setComplianceState] = useState<ComplianceState>(COMPLIANCE_INIT);
+  const complianceAbortRef = useRef<AbortController | null>(null);
+
+  const resetCompliance = useCallback(() => {
+    complianceAbortRef.current?.abort();
+    setComplianceState(COMPLIANCE_INIT);
+  }, []);
+
+  const [perceptionState, setPerceptionState] = useState<PerceptionPageState>(PERCEPTION_INIT);
+  const perceptionAbortRef = useRef<AbortController | null>(null);
+  const perceptionCrawlAbortRef = useRef<AbortController | null>(null);
+
+  return (
+    <PageStateContext.Provider value={{
+      ragState, setRagState, ragStreamingRef, ragAbortRef,
+      complianceState, setComplianceState, complianceAbortRef, resetCompliance,
+      perceptionState, setPerceptionState, perceptionAbortRef, perceptionCrawlAbortRef,
+    }}>
+      {children}
+    </PageStateContext.Provider>
+  );
+}
+
+// ── Hook ──────────────────────────────────────────────────────────────────────
+
+export function usePageState() {
+  const ctx = useContext(PageStateContext);
+  if (!ctx) throw new Error('usePageState must be used inside PageStateProvider');
+  return ctx;
+}
--- a/frontend/src/contexts/index.ts
+++ b/frontend/src/contexts/index.ts
@@ -1 +1,20 @@
 export { ThemeProvider, useTheme } from './ThemeContext';
+export { AuthProvider, useAuth } from './AuthContext';
+export type { AuthUser } from './AuthContext';
+export { PageStateProvider, usePageState } from './PageStateContext';
+export { LanguageProvider, useLanguage } from './LanguageContext';
+export type { Lang } from './LanguageContext';
+export type {
+  RagChatState,
+  RagMessage,
+  RagCitation,
+  ComplianceState,
+  ComplianceStatus,
+  ComplianceSourceEvent,
+  ComplianceFindingEvent,
+  ComplianceDonePayload,
+  ComplianceMeta,
+  ComplianceActionItem,
+  PerceptionPageState,
+  PerceptionSignal,
+} from './PageStateContext';
--- a/frontend/src/locales/en.ts
+++ b/frontend/src/locales/en.ts
@@ -0,0 +1,460 @@
+// English translations — default language
+export interface Translations {
+  nav: {
+    groupMain: string;
+    groupWorkbench: string;
+    groupChat: string;
+    overview: string;
+    signals: string;
+    status: string;
+    documents: string;
+    compliance: string;
+    chat: string;
+  };
+  sidebar: {
+    toggleTheme: string;
+    toggleLang: string;
+    signOut: string;
+  };
+  overview: {
+    eyebrow: string;
+    heroTitle: string;
+    heroDesc: string;
+    openDashboard: string;
+    jumpToChat: string;
+    sectionHowItWorks: string;
+    sectionScreens: string;
+    statScreens: string;
+    statFlows: string;
+    statReviewPosture: string;
+    stepUpload: string; stepUploadDesc: string;
+    stepProcess: string; stepProcessDesc: string;
+    stepMonitor: string; stepMonitorDesc: string;
+    stepAnalyze: string; stepAnalyzeDesc: string;
+    stepReview: string; stepReviewDesc: string;
+    stepChat: string; stepChatDesc: string;
+    screenStatus: string; screenStatusDesc: string;
+    screenSignals: string; screenSignalsDesc: string;
+    screenDocuments: string; screenDocumentsDesc: string;
+    screenCompliance: string; screenComplianceDesc: string;
+    screenChat: string; screenChatDesc: string;
+    screenAnalytics: string; screenAnalyticsDesc: string;
+  };
+  signals: {
+    topbarTitle: string;
+    topbarSub: string;
+    searchPlaceholder: string;
+    refreshBtn: string;
+    crawlingBtn: string;
+    statTotal: string;
+    statHigh: string;
+    statMedium: string;
+    statLast90: string;
+    badgeFinal: string;
+    badgeDraft: string;
+    badgeUrgent: string;
+    badgePublished: string;
+    emptySelectSignal: string;
+    runAnalysis: string;
+    stopBtn: string;
+    sourceLink: string;
+    tabOverview: string;
+    tabObligations: string;
+    tabImpact: string;
+    tabChanges: string;
+    cardScopeHeader: string;
+    cardObligationsHeader: string;
+    obligationsEmpty: string;
+    colObligationDesc: string;
+    colSubject: string;
+    colType: string;
+    colDeadline: string;
+    deadlinePending: string;
+    cardAffectedDocs: string;
+    noAffectedDocs: string;
+    cardAIImpact: string;
+    footerText: string;
+    statusConnecting: string;
+    statusNoStream: string;
+    statusCrawling: string;
+    statusProcessing: string;
+    statusComplete: string;
+    statusUpdateComplete: string;
+    statusError: string;
+    statusConnFailed: string;
+    diffOld: string;
+    diffNew: string;
+    diffCardHeader: string;
+  };
+  status: {
+    topbarTitle: string;
+    searchPlaceholder: string;
+    exportBtn: string;
+    refreshBtn: string;
+    newUploadBtn: string;
+    statTotal: string;
+    statIndexed: string;
+    statFailed: string;
+    statChunks: string;
+    statCoverage: string;
+    cardHealth: string;
+    badgeOnline: string;
+    badgeError: string;
+    badgeDegraded: string;
+    badgeUnknown: string;
+    healthEndpointError: string;
+    serviceEnabled: string;
+    serviceDisabled: string;
+    serviceNotLoaded: string;
+    cardConfig: string;
+    labelLLMProvider: string;
+    labelLLMModel: string;
+    labelEmbeddingModel: string;
+    labelEmbeddingDim: string;
+    labelMilvusCollection: string;
+    labelParserBackend: string;
+    labelChunkBackend: string;
+    labelParserFailureMode: string;
+    configLoadError: string;
+    cardBreakdown: string;
+    breakdownIndexed: string;
+    breakdownProcessing: string;
+    breakdownFailed: string;
+    cardRuntime: string;
+    labelActiveSessions: string;
+    labelSessionCapacity: string;
+    labelReranker: string;
+    labelBM25: string;
+    statusActive: string;
+    statusUnavailable: string;
+    footerAllOk: string;
+    footerDegraded: string;
+    footerChecking: string;
+    totalChunks: string;
+  };
+  docs: {
+    topbarTitle: string;
+    searchPlaceholder: string;
+    refreshBtn: string;
+    uploadBtn: string;
+    confirmDeleteTitle: string;
+    cancelBtn: string;
+    deleteBtn: string;
+    filterAll: string;
+    filterReady: string;
+    filterProcessing: string;
+    filterFailed: string;
+    filterPending: string;
+    filterAllTypes: string;
+    deleteSelected: string;
+    colName: string;
+    colStatus: string;
+    colUploaded: string;
+    colChunks: string;
+    colSize: string;
+    colType: string;
+    colActions: string;
+    loading: string;
+    emptyNoDocuments: string;
+    emptyNoMatch: string;
+    titleDownload: string;
+    titleRetry: string;
+    titleDelete: string;
+  };
+  compliance: {
+    topbarTitle: string;
+    searchPlaceholder: string;
+    clearBtn: string;
+    exportBtn: string;
+    exportJSON: string;
+    exportText: string;
+    newAnalysisBtn: string;
+    statusAnalyzing: string;
+    statusComplete: string;
+    statusError: string;
+    emptyTitle: string;
+    emptyDesc: string;
+    retrievingMsg: string;
+    defaultRegulation: string;
+    matchSuffix: string;
+    colParagraph: string;
+    extractingMsg: string;
+    noTextExtracted: string;
+    stagesHeader: string;
+    stageExtraction: string;
+    stageClauseSplit: string;
+    stageRetrieval: string;
+    stageSynthesis: string;
+    gapInProgress: string;
+    askAIBtn: string;
+    chatBtn: string;
+    conclusionHeader: string;
+    riskScoreTooltip: string;
+    statusCovered: string;
+    statusGap: string;
+    statusCritical: string;
+    statusInfo: string;
+    sourceTypePasted: string;
+    sourceTypeIndexed: string;
+    sourceTypeUploaded: string;
+    chatSidebarHeader: string;
+    chatThinking: string;
+    quickQ1: string;
+    quickQ2: string;
+    quickQ3: string;
+    chatPlaceholder: string;
+    sendBtn: string;
+    analysisFailed: string;
+    exportReportHeader: string;
+    exportSectionParagraph: string;
+    exportSectionFindings: string;
+    exportSectionConclusion: string;
+    exportSectionActions: string;
+    historyHeader: string;
+    downloadReport: string;
+    historyEmpty: string;
+    historyDeleteConfirm: string;
+    drawerClose: string;
+    drawerChatEmpty: string;
+    drawerSuggestionsHeader: string;
+  };
+  ragchat: {
+    topbarTitle: string;
+    exportBtn: string;
+    quickPromptsHeader: string;
+    inputPlaceholder: string;
+    citationsHeader: string;
+    citationsEmpty: string;
+    apiError: string;
+  };
+}
+
+export const en: Translations = {
+  nav: {
+    groupMain: 'Main',
+    groupWorkbench: 'Workbench',
+    groupChat: 'Chat',
+    overview: 'Overview',
+    signals: 'Regulatory Signals',
+    status: 'System Status',
+    documents: 'Documents',
+    compliance: 'Compliance Analysis',
+    chat: 'Regulation Q&A',
+  },
+  sidebar: {
+    toggleTheme: 'Toggle theme',
+    toggleLang: 'Switch language',
+    signOut: 'Sign out',
+  },
+  overview: {
+    eyebrow: 'T-Systems · AI Regulation Hub',
+    heroTitle: 'AI Compliance,\nAutomated end-to-end',
+    heroDesc: 'Monitor global AI regulations, analyze document compliance gaps, and get cited answers — all in one platform.',
+    openDashboard: 'Open dashboard',
+    jumpToChat: 'Jump to regulation chat',
+    sectionHowItWorks: 'How it works',
+    sectionScreens: 'Screens',
+    statScreens: 'Screens',
+    statFlows: 'Backend-aware flows',
+    statReviewPosture: 'Review posture',
+    stepUpload: 'Upload', stepUploadDesc: 'Ingest regulation documents',
+    stepProcess: 'Process', stepProcessDesc: 'Embed and chunk via vector DB',
+    stepMonitor: 'Monitor', stepMonitorDesc: 'Watch regulatory signal feed',
+    stepAnalyze: 'Analyze', stepAnalyzeDesc: 'Run compliance gap analysis',
+    stepReview: 'Review', stepReviewDesc: 'Inspect findings with AI assist',
+    stepChat: 'Chat', stepChatDesc: 'Ask questions with cited answers',
+    screenStatus: 'System Status', screenStatusDesc: 'Live health and workflow queue',
+    screenSignals: 'Regulatory Signals', screenSignalsDesc: 'AI-detected regulatory changes',
+    screenDocuments: 'Document Management', screenDocumentsDesc: 'Upload and inspect documents',
+    screenCompliance: 'Compliance Analysis', screenComplianceDesc: 'Three-column compliance workspace',
+    screenChat: 'Regulation Q&A', screenChatDesc: 'Chat with cited regulation sources',
+    screenAnalytics: 'Analytics', screenAnalyticsDesc: 'KPIs and coverage metrics',
+  },
+  signals: {
+    topbarTitle: 'Regulatory Signals',
+    topbarSub: 'ai-powered · live feed',
+    searchPlaceholder: 'Search signals...',
+    refreshBtn: 'Refresh Sources',
+    crawlingBtn: 'Crawling...',
+    statTotal: 'Total signals',
+    statHigh: 'High impact',
+    statMedium: 'Medium impact',
+    statLast90: 'Last 90 days',
+    badgeFinal: 'Final',
+    badgeDraft: 'Draft',
+    badgeUrgent: 'Urgent',
+    badgePublished: 'Published',
+    emptySelectSignal: 'Select a signal to run impact analysis',
+    runAnalysis: 'Run impact analysis',
+    stopBtn: 'Stop',
+    sourceLink: 'Source',
+    tabOverview: 'Overview',
+    tabObligations: 'Obligations',
+    tabImpact: 'Impact Assessment',
+    tabChanges: 'Change Comparison',
+    cardScopeHeader: 'Scope & Summary',
+    cardObligationsHeader: 'Obligations',
+    obligationsEmpty: 'No structured data yet. Click "Run impact analysis" to extract.',
+    colObligationDesc: 'Obligation',
+    colSubject: 'Subject',
+    colType: 'Type',
+    colDeadline: 'Deadlines',
+    deadlinePending: 'Pending',
+    cardAffectedDocs: 'Affected documents',
+    noAffectedDocs: 'No affected documents found.',
+    cardAIImpact: 'AI Impact Analysis',
+    footerText: 'Live feed · Regulation Hub',
+    statusConnecting: 'Connecting to data sources...',
+    statusNoStream: 'No stream',
+    statusCrawling: 'Crawling...',
+    statusProcessing: 'Processing {count} items...',
+    statusComplete: 'Done +{count} items',
+    statusUpdateComplete: 'Update complete — {new} added, {updated} updated',
+    statusError: 'Error: {message}',
+    statusConnFailed: 'Connection failed: {message}',
+    diffOld: 'Previous',
+    diffNew: 'Current',
+    diffCardHeader: 'Change Comparison',
+  },
+  status: {
+    topbarTitle: 'System Status',
+    searchPlaceholder: 'Search...',
+    exportBtn: 'Export',
+    refreshBtn: 'Refresh',
+    newUploadBtn: 'New upload',
+    statTotal: 'Documents total',
+    statIndexed: 'Indexed',
+    statFailed: 'Failed',
+    statChunks: 'Vector chunks',
+    statCoverage: 'Index coverage',
+    cardHealth: 'System health',
+    badgeOnline: 'Online',
+    badgeError: 'Error',
+    badgeDegraded: 'Degraded',
+    badgeUnknown: 'Unknown',
+    healthEndpointError: 'Could not reach health endpoint',
+    serviceEnabled: 'Enabled',
+    serviceDisabled: 'Disabled',
+    serviceNotLoaded: 'Not loaded',
+    cardConfig: 'System configuration',
+    labelLLMProvider: 'LLM provider',
+    labelLLMModel: 'LLM model',
+    labelEmbeddingModel: 'Embedding model',
+    labelEmbeddingDim: 'Embedding dim',
+    labelMilvusCollection: 'Milvus collection',
+    labelParserBackend: 'Parser backend',
+    labelChunkBackend: 'Chunk backend',
+    labelParserFailureMode: 'Parser failure mode',
+    configLoadError: 'Could not load config',
+    cardBreakdown: 'Document breakdown',
+    breakdownIndexed: 'Indexed',
+    breakdownProcessing: 'Processing / Parsed',
+    breakdownFailed: 'Failed',
+    cardRuntime: 'Runtime info',
+    labelActiveSessions: 'Active chat sessions',
+    labelSessionCapacity: 'Session capacity',
+    labelReranker: 'Cross-encoder reranker',
+    labelBM25: 'BM25 hybrid retrieval',
+    statusActive: 'Active',
+    statusUnavailable: 'Unavailable',
+    footerAllOk: 'All systems operational',
+    footerDegraded: 'Degraded',
+    footerChecking: 'Checking…',
+    totalChunks: 'Total vector chunks',
+  },
+  docs: {
+    topbarTitle: 'Document Management',
+    searchPlaceholder: 'Search documents...',
+    refreshBtn: 'Refresh',
+    uploadBtn: 'Upload document',
+    confirmDeleteTitle: 'Confirm deletion',
+    cancelBtn: 'Cancel',
+    deleteBtn: 'Delete',
+    filterAll: 'All',
+    filterReady: 'Ready',
+    filterProcessing: 'Processing',
+    filterFailed: 'Failed',
+    filterPending: 'Pending',
+    filterAllTypes: 'All types',
+    deleteSelected: 'Delete selected',
+    colName: 'Document name',
+    colStatus: 'Status',
+    colUploaded: 'Uploaded',
+    colChunks: 'Chunks',
+    colSize: 'Size',
+    colType: 'Type',
+    colActions: 'Actions',
+    loading: 'Loading documents…',
+    emptyNoDocuments: 'No documents yet. Upload a document to get started.',
+    emptyNoMatch: 'No documents match the current filters.',
+    titleDownload: 'Download original file',
+    titleRetry: 'Retry processing',
+    titleDelete: 'Delete document',
+  },
+  compliance: {
+    topbarTitle: 'Compliance Analysis',
+    searchPlaceholder: 'Search analyses...',
+    clearBtn: 'Clear',
+    exportBtn: 'Export',
+    exportJSON: 'Export JSON',
+    exportText: 'Export Text',
+    newAnalysisBtn: 'New analysis',
+    statusAnalyzing: 'Analyzing…',
+    statusComplete: 'Analysis complete',
+    statusError: 'Error',
+    emptyTitle: 'No analysis running',
+    emptyDesc: 'Click New analysis to start a compliance gap review against your indexed regulations.',
+    retrievingMsg: 'Retrieving relevant regulations…',
+    defaultRegulation: 'Regulation',
+    matchSuffix: '% match',
+    colParagraph: 'Paragraph Under Review',
+    extractingMsg: 'Extracting and analyzing text…',
+    noTextExtracted: 'No text extracted',
+    stagesHeader: 'Analysis stages',
+    stageExtraction: 'Text extraction',
+    stageClauseSplit: 'Clause splitting',
+    stageRetrieval: 'Regulation retrieval',
+    stageSynthesis: 'Conclusion synthesis',
+    gapInProgress: 'Gap analysis in progress…',
+    askAIBtn: 'Ask AI',
+    chatBtn: 'Chat',
+    conclusionHeader: 'Conclusion',
+    riskScoreTooltip: 'Risk score (0=safe, 100=critical)',
+    statusCovered: 'Covered',
+    statusGap: 'Gap',
+    statusCritical: 'Critical',
+    statusInfo: 'Info',
+    sourceTypePasted: 'Pasted Text',
+    sourceTypeIndexed: 'Indexed Document',
+    sourceTypeUploaded: 'Uploaded File',
+    chatSidebarHeader: 'AI Compliance Q&A',
+    chatThinking: 'Thinking▋',
+    quickQ1: 'What regulation applies?',
+    quickQ2: 'How to remediate?',
+    quickQ3: 'What is the risk?',
+    chatPlaceholder: 'Ask about this finding…',
+    sendBtn: 'Send',
+    analysisFailed: 'Analysis failed',
+    exportReportHeader: 'COMPLIANCE ANALYSIS REPORT',
+    exportSectionParagraph: '── PARAGRAPH UNDER REVIEW ──',
+    exportSectionFindings: '── FINDINGS ──',
+    exportSectionConclusion: '── CONCLUSION ──',
+    exportSectionActions: '── RECOMMENDED ACTIONS ──',
+    historyHeader: 'History',
+    downloadReport: 'Download report',
+    historyEmpty: 'No analyses yet.',
+    historyDeleteConfirm: 'Delete this analysis record? This cannot be undone.',
+    drawerClose: 'Close',
+    drawerChatEmpty: 'No messages yet. Ask a question below.',
+    drawerSuggestionsHeader: 'Suggested questions',
+  },
+  ragchat: {
+    topbarTitle: 'Regulation Q&A',
+    exportBtn: 'Export chat',
+    quickPromptsHeader: 'Quick prompts',
+    inputPlaceholder: 'Ask about your regulations…',
+    citationsHeader: 'Sources',
+    citationsEmpty: 'Citations will appear here after a response is generated.',
+    apiError: 'Could not reach the RAG API. Please check the backend.',
+  },
+};
--- a/frontend/src/locales/zh.ts
+++ b/frontend/src/locales/zh.ts
@@ -0,0 +1,231 @@
+import type { Translations } from './en';
+
+export const zh: Translations = {
+  nav: {
+    groupMain: '主菜单',
+    groupWorkbench: '工作台',
+    groupChat: '对话',
+    overview: '概览',
+    signals: '法规信号',
+    status: '系统状态',
+    documents: '文档管理',
+    compliance: '合规分析',
+    chat: '法规问答',
+  },
+  sidebar: {
+    toggleTheme: '切换主题',
+    toggleLang: '切换语言',
+    signOut: '退出',
+  },
+  overview: {
+    eyebrow: 'T-Systems · AI 法规中心',
+    heroTitle: 'AI 合规，\n端到端自动化',
+    heroDesc: '监控全球 AI 法规，分析文档合规差距，获取有引用来源的回答——一站式平台。',
+    openDashboard: '打开仪表盘',
+    jumpToChat: '跳转到法规对话',
+    sectionHowItWorks: '工作流程',
+    sectionScreens: '功能页面',
+    statScreens: '功能页面',
+    statFlows: '后端感知流程',
+    statReviewPosture: '审查状态',
+    stepUpload: '上传', stepUploadDesc: '导入法规文档',
+    stepProcess: '处理', stepProcessDesc: '向量化与分块',
+    stepMonitor: '监控', stepMonitorDesc: '监控法规信号流',
+    stepAnalyze: '分析', stepAnalyzeDesc: '运行合规差距分析',
+    stepReview: '审查', stepReviewDesc: 'AI 辅助审查发现',
+    stepChat: '对话', stepChatDesc: '带引用来源的问答',
+    screenStatus: '系统状态', screenStatusDesc: '实时健康与任务队列',
+    screenSignals: '法规信号', screenSignalsDesc: 'AI 检测法规变更',
+    screenDocuments: '文档管理', screenDocumentsDesc: '上传与查阅文档',
+    screenCompliance: '合规分析', screenComplianceDesc: '三栏合规工作台',
+    screenChat: '法规问答', screenChatDesc: '带引用来源的法规对话',
+    screenAnalytics: '数据分析', screenAnalyticsDesc: 'KPI 与覆盖指标',
+  },
+  signals: {
+    topbarTitle: '法规信号',
+    topbarSub: 'AI 驱动 · 实时订阅',
+    searchPlaceholder: '搜索信号...',
+    refreshBtn: '刷新数据源',
+    crawlingBtn: '抓取中...',
+    statTotal: '信号总数',
+    statHigh: '高影响',
+    statMedium: '中影响',
+    statLast90: '近 90 天',
+    badgeFinal: '已发布',
+    badgeDraft: '草案',
+    badgeUrgent: '紧急',
+    badgePublished: '已发布',
+    emptySelectSignal: '选择信号以运行影响分析',
+    runAnalysis: '运行影响分析',
+    stopBtn: '停止',
+    sourceLink: '来源',
+    tabOverview: '概览',
+    tabObligations: '义务条款',
+    tabImpact: '影响评估',
+    tabChanges: '变更对比',
+    cardScopeHeader: '范围与摘要',
+    cardObligationsHeader: '义务条款',
+    obligationsEmpty: '暂无结构化数据。点击"运行影响分析"触发提取。',
+    colObligationDesc: '义务描述',
+    colSubject: '主体',
+    colType: '类型',
+    colDeadline: '截止日期',
+    deadlinePending: '待定',
+    cardAffectedDocs: '受影响文档',
+    noAffectedDocs: '未找到受影响文档。',
+    cardAIImpact: 'AI 影响分析',
+    footerText: '实时订阅 · 法规中心',
+    statusConnecting: '正在连接数据源...',
+    statusNoStream: '无数据流',
+    statusCrawling: '抓取中...',
+    statusProcessing: '处理 {count} 条...',
+    statusComplete: '完成 +{count} 条',
+    statusUpdateComplete: '更新完成 — 新增 {new} 条，更新 {updated} 条',
+    statusError: '错误: {message}',
+    statusConnFailed: '连接失败: {message}',
+    diffOld: '旧版',
+    diffNew: '新版',
+    diffCardHeader: '变更对比',
+  },
+  status: {
+    topbarTitle: '系统状态',
+    searchPlaceholder: '搜索...',
+    exportBtn: '导出',
+    refreshBtn: '刷新',
+    newUploadBtn: '上传文档',
+    statTotal: '文档总数',
+    statIndexed: '已索引',
+    statFailed: '失败',
+    statChunks: '向量分块数',
+    statCoverage: '索引覆盖率',
+    cardHealth: '系统健康',
+    badgeOnline: '在线',
+    badgeError: '错误',
+    badgeDegraded: '降级',
+    badgeUnknown: '未知',
+    healthEndpointError: '无法访问健康检查端点',
+    serviceEnabled: '已启用',
+    serviceDisabled: '已禁用',
+    serviceNotLoaded: '未加载',
+    cardConfig: '系统配置',
+    labelLLMProvider: 'LLM 提供商',
+    labelLLMModel: 'LLM 模型',
+    labelEmbeddingModel: '向量模型',
+    labelEmbeddingDim: '向量维度',
+    labelMilvusCollection: 'Milvus 集合',
+    labelParserBackend: '解析后端',
+    labelChunkBackend: '分块后端',
+    labelParserFailureMode: '解析失败模式',
+    configLoadError: '无法加载配置',
+    cardBreakdown: '文档分布',
+    breakdownIndexed: '已索引',
+    breakdownProcessing: '处理中 / 已解析',
+    breakdownFailed: '失败',
+    cardRuntime: '运行时信息',
+    labelActiveSessions: '活跃对话会话',
+    labelSessionCapacity: '会话容量',
+    labelReranker: '交叉编码器重排序',
+    labelBM25: 'BM25 混合检索',
+    statusActive: '活跃',
+    statusUnavailable: '不可用',
+    footerAllOk: '所有系统正常',
+    footerDegraded: '降级运行',
+    footerChecking: '检查中…',
+    totalChunks: '向量分块总数',
+  },
+  docs: {
+    topbarTitle: '文档管理',
+    searchPlaceholder: '搜索文档...',
+    refreshBtn: '刷新',
+    uploadBtn: '上传文档',
+    confirmDeleteTitle: '确认删除',
+    cancelBtn: '取消',
+    deleteBtn: '删除',
+    filterAll: '全部',
+    filterReady: '就绪',
+    filterProcessing: '处理中',
+    filterFailed: '失败',
+    filterPending: '待处理',
+    filterAllTypes: '所有类型',
+    deleteSelected: '删除所选',
+    colName: '文档名称',
+    colStatus: '状态',
+    colUploaded: '上传时间',
+    colChunks: '分块数',
+    colSize: '大小',
+    colType: '类型',
+    colActions: '操作',
+    loading: '加载文档中…',
+    emptyNoDocuments: '暂无文档。请上传文档以开始使用。',
+    emptyNoMatch: '没有文档符合当前筛选条件。',
+    titleDownload: '下载原始文件',
+    titleRetry: '重试处理',
+    titleDelete: '删除文档',
+  },
+  compliance: {
+    topbarTitle: '合规分析',
+    searchPlaceholder: '搜索分析记录...',
+    clearBtn: '清除',
+    exportBtn: '导出',
+    exportJSON: '导出 JSON',
+    exportText: '导出文本',
+    newAnalysisBtn: '新建分析',
+    statusAnalyzing: '分析中…',
+    statusComplete: '分析完成',
+    statusError: '错误',
+    emptyTitle: '暂无分析任务',
+    emptyDesc: '点击"新建分析"对已索引法规进行合规差距审查。',
+    retrievingMsg: '正在检索相关法规…',
+    defaultRegulation: '法规',
+    matchSuffix: '% 匹配',
+    colParagraph: '待审查段落',
+    extractingMsg: '正在提取并分析文本…',
+    noTextExtracted: '未提取到文本',
+    stagesHeader: '分析阶段',
+    stageExtraction: '文本提取',
+    stageClauseSplit: '条款分割',
+    stageRetrieval: '法规检索',
+    stageSynthesis: '结论综合',
+    gapInProgress: '差距分析进行中…',
+    askAIBtn: '问 AI',
+    chatBtn: '对话',
+    conclusionHeader: '结论',
+    riskScoreTooltip: '风险评分（0=安全，100=严重）',
+    statusCovered: '已覆盖',
+    statusGap: '存在差距',
+    statusCritical: '严重',
+    statusInfo: '信息',
+    sourceTypePasted: '粘贴文本',
+    sourceTypeIndexed: '已索引文档',
+    sourceTypeUploaded: '上传文件',
+    chatSidebarHeader: 'AI 合规问答',
+    chatThinking: '思考中▋',
+    quickQ1: '适用哪条法规？',
+    quickQ2: '如何整改？',
+    quickQ3: '风险等级如何？',
+    chatPlaceholder: '针对此发现提问…',
+    sendBtn: '发送',
+    analysisFailed: '分析失败',
+    exportReportHeader: '合规分析报告',
+    exportSectionParagraph: '── 待审查段落 ──',
+    exportSectionFindings: '── 发现 ──',
+    exportSectionConclusion: '── 结论 ──',
+    exportSectionActions: '── 建议行动 ──',
+    historyHeader: '历史记录',
+    downloadReport: '下载报告',
+    historyEmpty: '暂无分析记录。',
+    historyDeleteConfirm: '删除此分析记录？此操作不可撤销。',
+    drawerClose: '关闭',
+    drawerChatEmpty: '暂无消息。请在下方提问。',
+    drawerSuggestionsHeader: '建议问题',
+  },
+  ragchat: {
+    topbarTitle: '法规问答',
+    exportBtn: '导出对话',
+    quickPromptsHeader: '快捷问题',
+    inputPlaceholder: '请输入关于法规的问题…',
+    citationsHeader: '引用来源',
+    citationsEmpty: '生成回答后，引用来源将显示在此处。',
+    apiError: '无法连接到 RAG API，请检查后端服务。',
+  },
+};
--- a/frontend/src/pages/Compliance/CompliancePage.tsx
+++ b/frontend/src/pages/Compliance/CompliancePage.tsx
@@ -1,12 +1,19 @@
-import { useState, useRef } from 'react';
+import { useState, useRef, useEffect } from 'react';
+import { useLanguage } from '../../contexts/LanguageContext';
 import { Search, Plus, AlertTriangle, Download, MessageSquare, ChevronDown } from 'lucide-react';
 import { Topbar } from '../../components/layout/Topbar';
 import { NewAnalysisModal } from './NewAnalysisModal';
 import { useComplianceAnalysis } from './useComplianceAnalysis';
+import { usePageState } from '../../contexts';
+import { HistoryRail } from './HistoryRail';
+import { FindingChatDrawer } from './FindingChatDrawer';
 import type { FindingEvent, SourceEvent, AnalysisMeta } from './useComplianceAnalysis';

-const STATUS_LABEL: Record<string, string> = { ok: 'Covered', warn: 'Gap', risk: 'Critical', info: 'Info' };
-const SOURCE_TYPE_LABEL: Record<string, string> = { text: 'Pasted Text', doc: 'Indexed Document', upload: 'Uploaded File' };
+const TOKEN_KEY = 'auth_token';
+function authHeader(): Record<string, string> {
+  const t = localStorage.getItem(TOKEN_KEY);
+  return t ? { Authorization: `Bearer ${t}` } : {};
+}

 function riskClass(score: number) {
  if (score >= 70) return 'high';
@@ -71,7 +78,7 @@ function useFindingChat() {
    try {
      const res = await fetch(`/api/v1/compliance/chat/${findingIdx ?? 0}`, {
        method: 'POST',
-        headers: { 'Content-Type': 'application/json' },
+        headers: { 'Content-Type': 'application/json', ...authHeader() },
        body: JSON.stringify({ query: q, segment_context: segmentContext }),
        signal: ctrl.signal,
      });
@@ -106,11 +113,93 @@ function useFindingChat() {
  return { open, findingIdx, messages, input, setInput, loading, openFor, close, send };
 }

+function _FindingChatDrawerWrapper({
+  analysisId,
+  findingIndex,
+  finding,
+  onClose,
+}: {
+  analysisId: string;
+  findingIndex: number;
+  finding: { title: string; desc: string; status: string; clause_ref?: string };
+  onClose: () => void;
+}) {
+  const [findingId, setFindingId] = useState<string | null>(null);
+
+  useEffect(() => {
+    fetch(`/api/v1/compliance/history/${analysisId}`, {
+      headers: { Authorization: `Bearer ${localStorage.getItem('auth_token') ?? ''}` },
+    })
+      .then(r => r.json())
+      .then((data: { findings?: Array<{ seq: number; id: string }> }) => {
+        const f = (data.findings ?? []).find(f => f.seq === findingIndex);
+        if (f?.id) setFindingId(f.id);
+      })
+      .catch(() => {});
+  }, [analysisId, findingIndex]);
+
+  if (!findingId) return null;
+  return (
+    <FindingChatDrawer
+      analysisId={analysisId}
+      findingId={findingId}
+      finding={finding}
+      onClose={onClose}
+    />
+  );
+}
+
 export function CompliancePage() {
  const [showModal, setShowModal] = useState(false);
  const [showExportMenu, setShowExportMenu] = useState(false);
  const { state, run, reset } = useComplianceAnalysis();
  const chat = useFindingChat();
+  const [drawerFindingIdx, setDrawerFindingIdx] = useState<number | null>(null);
+
+  const { setComplianceState } = usePageState();
+  const { t } = useLanguage();
+  const STATUS_LABEL: Record<string, string> = { ok: t.compliance.statusCovered, warn: t.compliance.statusGap, risk: t.compliance.statusCritical, info: t.compliance.statusInfo };
+  const SOURCE_TYPE_LABEL: Record<string, string> = { text: t.compliance.sourceTypePasted, doc: t.compliance.sourceTypeIndexed, upload: t.compliance.sourceTypeUploaded };
+
+  const [historyRefresh, setHistoryRefresh] = useState(0);
+  const prevAnalysisIdRef = useRef<string | null>(null);
+
+  useEffect(() => {
+    if (state.analysisId && state.analysisId !== prevAnalysisIdRef.current) {
+      prevAnalysisIdRef.current = state.analysisId;
+      setHistoryRefresh(n => n + 1);
+    }
+  }, [state.analysisId]);
+
+  async function handleSelectHistory(id: string) {
+    const res = await fetch(`/api/v1/compliance/history/${id}`, { headers: authHeader() });
+    if (!res.ok) return;
+    const data = await res.json();
+    setComplianceState({
+      status: 'done',
+      stageLabel: 'Complete',
+      stageKey: 'concluding',
+      meta: { title: data.doc_name, sourceType: 'doc', startedAt: data.created_at },
+      sources: [],
+      findings: (data.findings || []).map((f: Record<string, unknown>) => ({
+        title: String(f.title ?? ''),
+        desc: String(f.description ?? ''),
+        status: String(f.status ?? 'ok'),
+        clause_ref: f.clause_ref ? String(f.clause_ref) : undefined,
+      })),
+      done: {
+        conclusion: String(data.conclusion ?? ''),
+        actions: data.actions ?? [],
+        risk_score: Number(data.risk_score ?? 0),
+        highlight_terms: data.highlight_terms ?? [],
+        para_text: String(data.para_text ?? ''),
+      },
+      errorText: '',
+      analysisId: data.id,
+      isReadOnly: true,
+      activeFindingId: null,
+    });
+  }

  const isIdle = state.status === 'idle';
  const isStreaming = state.status === 'streaming';
@@ -141,24 +230,24 @@ export function CompliancePage() {

  function exportText() {
    const lines: string[] = [
-      `COMPLIANCE ANALYSIS REPORT`,
+      t.compliance.exportReportHeader,
      `Title: ${state.meta?.title ?? 'Untitled'}`,
      `Date: ${state.meta?.startedAt ? formatTs(state.meta.startedAt) : ''}`,
      `Source: ${SOURCE_TYPE_LABEL[state.meta?.sourceType ?? 'text']}`,
      `Risk Score: ${state.done?.risk_score ?? 'N/A'} / 100`,
      '',
-      '── PARAGRAPH UNDER REVIEW ──',
+      t.compliance.exportSectionParagraph,
      state.done?.para_text ?? '',
      '',
-      '── FINDINGS ──',
+      t.compliance.exportSectionFindings,
      ...state.findings.map((f, i) =>
        `[${i + 1}] [${f.status.toUpperCase()}] ${f.title}\n    ${f.desc}${f.clause_ref ? `\n    Ref: ${f.clause_ref}` : ''}`
      ),
      '',
-      '── CONCLUSION ──',
+      t.compliance.exportSectionConclusion,
      state.done?.conclusion ?? '',
      '',
-      '── RECOMMENDED ACTIONS ──',
+      t.compliance.exportSectionActions,
      ...(state.done?.actions ?? []).map(a => `• ${a.label}: ${a.value}`),
    ];
    const blob = new Blob([lines.join('\n')], { type: 'text/plain' });
@@ -178,15 +267,15 @@ export function CompliancePage() {
  return (
    <div className="compliance-page" style={{ position: 'relative' }}>
      <Topbar
-        title="Compliance Analysis"
+        title={t.compliance.topbarTitle}
        actions={
          <>
            <div className="search-box">
              <Search size={13} />
-              <input placeholder="Search analyses..." />
+              <input placeholder={t.compliance.searchPlaceholder} />
            </div>
            {isStreaming || isDone || isError ? (
-              <button className="btn sm" onClick={reset}>Clear</button>
+              <button className="btn sm" onClick={reset}>{t.compliance.clearBtn}</button>
            ) : null}
            {isDone && (
              <div style={{ position: 'relative' }}>
@@ -194,7 +283,7 @@ export function CompliancePage() {
                  className="btn sm"
                  onClick={() => setShowExportMenu(v => !v)}
                >
-                  <Download size={13} />Export<ChevronDown size={11} />
+                  <Download size={13} />{t.compliance.exportBtn}<ChevronDown size={11} />
                </button>
                {showExportMenu && (
                  <div style={{
@@ -206,17 +295,17 @@ export function CompliancePage() {
                    <button onClick={exportJSON} style={{ display: 'block', width: '100%', padding: '9px 14px', textAlign: 'left', fontSize: 13, background: 'none', border: 'none', cursor: 'pointer', color: 'var(--fg)' }}
                      onMouseEnter={e => (e.currentTarget.style.background = 'var(--bg)')}
                      onMouseLeave={e => (e.currentTarget.style.background = 'none')}
-                    >Export JSON</button>
+                    >{t.compliance.exportJSON}</button>
                    <button onClick={exportText} style={{ display: 'block', width: '100%', padding: '9px 14px', textAlign: 'left', fontSize: 13, background: 'none', border: 'none', cursor: 'pointer', color: 'var(--fg)' }}
                      onMouseEnter={e => (e.currentTarget.style.background = 'var(--bg)')}
                      onMouseLeave={e => (e.currentTarget.style.background = 'none')}
-                    >Export Text</button>
+                    >{t.compliance.exportText}</button>
                  </div>
                )}
              </div>
            )}
            <button className="btn sm primary" onClick={() => setShowModal(true)}>
-              <Plus size={13} />New analysis
+              <Plus size={13} />{t.compliance.newAnalysisBtn}
            </button>
          </>
        }
@@ -235,7 +324,7 @@ export function CompliancePage() {
          <div className={`compliance-status-bar ${state.status}`}>
            <div className="status-dot" />
            <span className="status-bar-label">
-              {isStreaming ? 'Analyzing…' : isDone ? 'Analysis complete' : 'Error'}
+              {isStreaming ? t.compliance.statusAnalyzing : isDone ? t.compliance.statusComplete : t.compliance.statusError}
            </span>
            <span className="status-bar-sub">{state.stageLabel}</span>
          </div>
@@ -246,8 +335,8 @@ export function CompliancePage() {
      {isIdle && (
        <div className="analysis-empty">
          <div className="analysis-empty-icon"><Plus size={24} /></div>
-          <h3>No analysis running</h3>
-          <p>Click <strong>New analysis</strong> to start a compliance gap review against your indexed regulations.</p>
+          <h3>{t.compliance.emptyTitle}</h3>
+          <p>{t.compliance.emptyDesc}</p>
        </div>
      )}

@@ -279,22 +368,29 @@ export function CompliancePage() {
            </div>
          )}

-          <div className="compliance-workspace" style={{ position: 'relative' }}>
+          <div style={{ display: 'flex', flex: 1, overflow: 'hidden' }}>
+            <HistoryRail
+              refreshTrigger={historyRefresh}
+              onSelect={handleSelectHistory}
+              selectedId={state.analysisId}
+            />
+            <div style={{ flex: 1, overflow: 'hidden', display: 'flex', flexDirection: 'column' }}>
+              <div className="compliance-workspace" style={{ position: 'relative' }}>

            {/* Column 1: Retrieved Regulations */}
            <div className="comp-col source-col">
              <div className="col-header">
-                Retrieved Regulations {state.sources.length > 0 && `(${state.sources.length})`}
+                {t.compliance.stageRetrieval} {state.sources.length > 0 && `(${state.sources.length})`}
              </div>
              {state.sources.length === 0 && isStreaming && (
                <div style={{ padding: '20px 16px', color: 'var(--muted)', fontSize: 12 }}>
-                  Retrieving relevant regulations…
+                  {t.compliance.retrievingMsg}
                </div>
              )}
              {state.sources.map((s: SourceEvent, i: number) => (
                <div key={i} className="source-item card">
                  <div className="source-top">
-                    <span className="source-std">{s.standard || 'Regulation'}</span>
+                    <span className="source-std">{s.standard || t.compliance.defaultRegulation}</span>
                    <span className={`status ${s.status === 'retrieved' ? 'ok' : s.status}`}>
                      {STATUS_LABEL[s.status] ?? 'Retrieved'}
                    </span>
@@ -303,7 +399,7 @@ export function CompliancePage() {
                  {s.score > 0 && (
                    <div className="source-scores">
                      <span className="score-pill">
-                        {s.score <= 1 ? Math.round(s.score * 100) : Math.round(s.score)}% match
+                        {s.score <= 1 ? Math.round(s.score * 100) : Math.round(s.score)}{t.compliance.matchSuffix}
                      </span>
                    </div>
                  )}
@@ -318,7 +414,7 @@ export function CompliancePage() {

            {/* Column 2: Paragraph Under Review + Stages */}
            <div className="comp-col review-col">
-              <div className="col-header">Paragraph Under Review</div>
+              <div className="col-header">{t.compliance.colParagraph}</div>

              <div className="card para-card">
                {isDone && state.done?.para_text ? (
@@ -327,16 +423,16 @@ export function CompliancePage() {
                  </p>
                ) : (
                  <p className="para-text" style={{ color: 'var(--muted)' }}>
-                    {isStreaming ? 'Extracting and analyzing text…' : 'No text extracted'}
+                    {isStreaming ? t.compliance.extractingMsg : t.compliance.noTextExtracted}
                  </p>
                )}
              </div>

              <div className="card stages-card">
-                <div className="card-header">Analysis stages</div>
+                <div className="card-header">{t.compliance.stagesHeader}</div>
                {(() => {
                  const STAGE_KEYS = ['extracting', 'splitting', 'analyzing', 'concluding'];
-                  const STAGE_LABELS = ['Text extraction', 'Clause splitting', 'Regulation retrieval', 'Conclusion synthesis'];
+                  const STAGE_LABELS = [t.compliance.stageExtraction, t.compliance.stageClauseSplit, t.compliance.stageRetrieval, t.compliance.stageSynthesis];
                  const curIdx = STAGE_KEYS.indexOf(state.stageKey);
                  return STAGE_KEYS.map((key, idx) => {
                    const pct = isDone ? 100 : idx < curIdx ? 100 : idx === curIdx ? 60 : 0;
@@ -365,7 +461,7 @@ export function CompliancePage() {

              {state.findings.length === 0 && isStreaming && (
                <div style={{ padding: '20px 16px', color: 'var(--muted)', fontSize: 12 }}>
-                  Gap analysis in progress…
+                  {t.compliance.gapInProgress}
                </div>
              )}

@@ -385,8 +481,17 @@ export function CompliancePage() {
                      style={{ marginLeft: 'auto', fontSize: 11, padding: '3px 8px', gap: 4 }}
                      onClick={() => chat.openFor(i, f)}
                    >
-                      <MessageSquare size={11} />Ask AI
+                      <MessageSquare size={11} />{t.compliance.askAIBtn}
                    </button>
+                    {state.analysisId && (
+                      <button
+                        className="btn sm"
+                        onClick={() => setDrawerFindingIdx(i)}
+                        style={{ marginTop: 6 }}
+                      >
+                        💬 {t.compliance.chatBtn}
+                      </button>
+                    )}
                  </div>
                </div>
              ))}
@@ -395,10 +500,10 @@ export function CompliancePage() {
              {isDone && state.done && (
                <div className="card conclusion-box">
                  <div className="card-header" style={{ display: 'flex', alignItems: 'center', gap: 10 }}>
-                    <span>Conclusion</span>
+                    <span>{t.compliance.conclusionHeader}</span>
                    <div
                      className={`risk-score-badge ${riskClass(state.done.risk_score)}`}
-                      title="Risk score (0=safe, 100=critical)"
+                      title={t.compliance.riskScoreTooltip}
                    >
                      {state.done.risk_score}
                    </div>
@@ -425,12 +530,14 @@ export function CompliancePage() {
              {isError && (
                <div className="card" style={{ borderColor: 'var(--danger)', padding: '14px 16px' }}>
                  <div style={{ display: 'flex', alignItems: 'center', gap: 8, color: 'var(--danger)', fontSize: 13, fontWeight: 600 }}>
-                    <AlertTriangle size={14} /> Analysis failed
+                    <AlertTriangle size={14} /> {t.compliance.analysisFailed}
                  </div>
                  <p style={{ fontSize: 12, color: 'var(--muted)', marginTop: 6 }}>{state.errorText}</p>
                </div>
              )}
            </div>
+            </div>
+            </div>
          </div>

          {/* ── Finding Chat Side Panel ────────────────────────────────── */}
@@ -444,7 +551,7 @@ export function CompliancePage() {
              {/* Header */}
              <div style={{ padding: '16px 20px', borderBottom: '1px solid var(--border)', display: 'flex', alignItems: 'center', justifyContent: 'space-between' }}>
                <div>
-                  <div style={{ fontSize: 13, fontWeight: 600 }}>AI Compliance Q&A</div>
+                  <div style={{ fontSize: 13, fontWeight: 600 }}>{t.compliance.chatSidebarHeader}</div>
                  <div style={{ fontSize: 11, color: 'var(--muted)', marginTop: 2 }}>
                    Finding #{(chat.findingIdx ?? 0) + 1} · {activeFinding?.title}
                  </div>
@@ -474,7 +581,7 @@ export function CompliancePage() {
                  <div style={{ display: 'flex', gap: 10 }}>
                    <div style={{ width: 28, height: 28, borderRadius: 8, background: 'var(--accent)', display: 'flex', alignItems: 'center', justifyContent: 'center', flexShrink: 0, fontSize: 11, color: '#fff', fontWeight: 700 }}>AI</div>
                    <div style={{ padding: '10px 14px', borderRadius: 10, border: '1px solid var(--border)', background: 'var(--bg)', fontSize: 13, color: 'var(--muted)' }}>
-                      Thinking<span className="blink-cursor">▋</span>
+                      {t.compliance.chatThinking}
                    </div>
                  </div>
                )}
@@ -482,7 +589,7 @@ export function CompliancePage() {

              {/* Quick questions */}
              <div style={{ padding: '8px 20px', display: 'flex', flexWrap: 'wrap', gap: 6 }}>
-                {['What regulation applies?', 'How to remediate?', 'What is the risk?'].map(q => (
+                {[t.compliance.quickQ1, t.compliance.quickQ2, t.compliance.quickQ3].map(q => (
                  <button key={q} onClick={() => chat.setInput(q)}
                    style={{ padding: '4px 10px', fontSize: 11, background: 'var(--bg)', border: '1px solid var(--border)', borderRadius: 6, cursor: 'pointer', color: 'var(--muted)' }}>
                    {q}
@@ -496,7 +603,7 @@ export function CompliancePage() {
                  value={chat.input}
                  onChange={e => chat.setInput(e.target.value)}
                  onKeyDown={e => { if (e.key === 'Enter' && !e.shiftKey) { e.preventDefault(); chat.send(chatContext); } }}
-                  placeholder="Ask about this finding…"
+                  placeholder={t.compliance.chatPlaceholder}
                  style={{ flex: 1, padding: '9px 12px', fontSize: 13, background: 'var(--bg)', border: '1px solid var(--border)', borderRadius: 8, color: 'var(--fg)', outline: 'none' }}
                />
                <button
@@ -504,10 +611,23 @@ export function CompliancePage() {
                  onClick={() => chat.send(chatContext)}
                  disabled={!chat.input.trim() || chat.loading}
                  style={{ padding: '9px 14px' }}
-                >Send</button>
+                >{t.compliance.sendBtn}</button>
              </div>
            </div>
          )}
+          {drawerFindingIdx !== null && state.analysisId && (
+            <_FindingChatDrawerWrapper
+              analysisId={state.analysisId}
+              findingIndex={drawerFindingIdx}
+              finding={{
+                title: state.findings[drawerFindingIdx]?.title ?? '',
+                desc: state.findings[drawerFindingIdx]?.desc ?? '',
+                status: state.findings[drawerFindingIdx]?.status ?? 'ok',
+                clause_ref: state.findings[drawerFindingIdx]?.clause_ref,
+              }}
+              onClose={() => setDrawerFindingIdx(null)}
+            />
+          )}
        </>
      )}
    </div>
--- a/frontend/src/pages/Compliance/FindingChatDrawer.tsx
+++ b/frontend/src/pages/Compliance/FindingChatDrawer.tsx
@@ -0,0 +1,237 @@
+// frontend/src/pages/Compliance/FindingChatDrawer.tsx
+import { useEffect, useRef, useState } from 'react';
+import { X, Send } from 'lucide-react';
+import { useLanguage } from '../../contexts/LanguageContext';
+
+const TOKEN_KEY = 'auth_token';
+function authHeader(): Record<string, string> {
+  const t = localStorage.getItem(TOKEN_KEY);
+  return t ? { Authorization: `Bearer ${t}` } : {};
+}
+
+interface Message {
+  id: string;
+  role: 'user' | 'assistant';
+  content: string;
+}
+
+interface FindingInfo {
+  title: string;
+  desc: string;
+  status: string;
+  clause_ref?: string;
+}
+
+interface Props {
+  analysisId: string;
+  findingId: string;
+  finding: FindingInfo;
+  onClose: () => void;
+}
+
+export function FindingChatDrawer({ analysisId, findingId, finding, onClose }: Props) {
+  const [messages, setMessages] = useState<Message[]>([]);
+  const [suggestions, setSuggestions] = useState<string[]>([]);
+  const [input, setInput] = useState('');
+  const [loading, setLoading] = useState(false);
+  const [loadingHistory, setLoadingHistory] = useState(true);
+  const abortRef = useRef<AbortController | null>(null);
+  const bottomRef = useRef<HTMLDivElement>(null);
+  const { t } = useLanguage();
+
+  // Load history + suggestions on open
+  useEffect(() => {
+    setLoadingHistory(true);
+    fetch(`/api/v1/compliance/analyses/${analysisId}/findings/${findingId}/chat`, {
+      headers: authHeader(),
+    })
+      .then(r => r.json())
+      .then((data: Message[]) => {
+        setMessages(Array.isArray(data) ? data.map(m => ({ id: m.id, role: m.role, content: m.content })) : []);
+        setLoadingHistory(false);
+        if (!data.length) {
+          fetch(
+            `/api/v1/compliance/analyses/${analysisId}/findings/${findingId}/suggestions`,
+            { method: 'POST', headers: authHeader() }
+          )
+            .then(r => r.json())
+            .then(d => { if (Array.isArray(d?.questions)) setSuggestions(d.questions); })
+            .catch(() => {});
+        }
+      })
+      .catch(() => setLoadingHistory(false));
+
+    return () => { abortRef.current?.abort(); };
+  }, [analysisId, findingId]);
+
+  // Auto-scroll to bottom
+  useEffect(() => {
+    bottomRef.current?.scrollIntoView({ behavior: 'smooth' });
+  }, [messages]);
+
+  async function send(text?: string) {
+    const q = (text ?? input).trim();
+    if (!q || loading) return;
+    setInput('');
+    setSuggestions([]); // hide chips after first message
+
+    const assistantId = `ast-${Date.now()}`;
+    setMessages(prev => [
+      ...prev,
+      { id: `usr-${Date.now()}`, role: 'user', content: q },
+      { id: assistantId, role: 'assistant', content: '' },
+    ]);
+    setLoading(true);
+
+    const ctrl = new AbortController();
+    abortRef.current = ctrl;
+
+    try {
+      const res = await fetch(
+        `/api/v1/compliance/analyses/${analysisId}/findings/${findingId}/chat`,
+        {
+          method: 'POST',
+          headers: { 'Content-Type': 'application/json', ...authHeader() },
+          body: JSON.stringify({ query: q }),
+          signal: ctrl.signal,
+        }
+      );
+      if (!res.body) { setLoading(false); return; }
+      const reader = res.body.getReader();
+      const dec = new TextDecoder();
+      let buf = '';
+
+      while (true) {
+        const { done, value } = await reader.read();
+        if (done) break;
+        buf += dec.decode(value, { stream: true });
+        const blocks = buf.split('\n\n');
+        buf = blocks.pop() ?? '';
+        for (const block of blocks) {
+          const dl = block.split('\n').find(l => l.startsWith('data: '));
+          if (!dl) continue;
+          try {
+            const j = JSON.parse(dl.slice(6));
+            if (j.type === 'chunk' && j.text) {
+              setMessages(prev =>
+                prev.map(m => m.id === assistantId ? { ...m, content: m.content + (j.text as string) } : m)
+              );
+            }
+          } catch { /* skip */ }
+        }
+      }
+    } catch (e: unknown) {
+      if (e instanceof Error && e.name !== 'AbortError') {
+        setMessages(prev =>
+          prev.map(m => m.id === assistantId ? { ...m, content: 'Error reaching server.' } : m)
+        );
+      }
+    } finally {
+      setLoading(false);
+    }
+  }
+
+  const STATUS_COLOR: Record<string, string> = {
+    risk: 'var(--danger, #dc143c)',
+    warn: 'var(--warning, #ff8c00)',
+    ok: 'var(--success, #228b22)',
+  };
+
+  return (
+    <div
+      style={{
+        position: 'fixed', right: 0, top: 0, bottom: 0, width: 420,
+        background: 'var(--surface)', borderLeft: '1px solid var(--border)',
+        display: 'flex', flexDirection: 'column', zIndex: 200,
+        boxShadow: '-4px 0 16px rgba(0,0,0,0.12)',
+      }}
+    >
+      {/* Header */}
+      <div style={{
+        padding: '14px 16px', borderBottom: '1px solid var(--border)',
+        display: 'flex', alignItems: 'flex-start', gap: 10,
+      }}>
+        <div style={{ flex: 1, minWidth: 0 }}>
+          <div style={{ fontSize: 11, color: STATUS_COLOR[finding.status] ?? 'var(--muted)', fontWeight: 600, marginBottom: 2 }}>
+            {finding.status.toUpperCase()}
+            {finding.clause_ref && (
+              <span style={{ fontWeight: 400, marginLeft: 6, color: 'var(--muted)' }}>
+                {finding.clause_ref}
+              </span>
+            )}
+          </div>
+          <div style={{ fontSize: 13, fontWeight: 600, overflow: 'hidden', textOverflow: 'ellipsis', whiteSpace: 'nowrap' }}>
+            {finding.title}
+          </div>
+          <div style={{ fontSize: 11, color: 'var(--muted)', marginTop: 2, lineHeight: 1.4 }}>
+            {finding.desc.length > 100 ? finding.desc.slice(0, 100) + '…' : finding.desc}
+          </div>
+        </div>
+        <button className="btn icon-btn" onClick={onClose} style={{ flexShrink: 0 }} title={t.compliance.drawerClose}>
+          <X size={14} />
+        </button>
+      </div>
+
+      {/* Suggestion chips */}
+      {suggestions.length > 0 && (
+        <div style={{ padding: '10px 16px', borderBottom: '1px solid var(--border)' }}>
+          <div style={{ fontSize: 11, color: 'var(--muted)', marginBottom: 6 }}>{t.compliance.drawerSuggestionsHeader}</div>
+          <div style={{ display: 'flex', flexDirection: 'column', gap: 6 }}>
+            {suggestions.map((q, i) => (
+              <button
+                key={i}
+                className="chip"
+                style={{ textAlign: 'left', whiteSpace: 'normal', height: 'auto', padding: '6px 10px' }}
+                onClick={() => send(q)}
+              >
+                {q}
+              </button>
+            ))}
+          </div>
+        </div>
+      )}
+
+      {/* Messages */}
+      <div style={{ flex: 1, overflowY: 'auto', padding: '12px 16px', display: 'flex', flexDirection: 'column', gap: 10 }}>
+        {loadingHistory && (
+          <p style={{ fontSize: 12, color: 'var(--muted)', textAlign: 'center' }}>Loading history…</p>
+        )}
+        {!loadingHistory && messages.length === 0 && (
+          <p style={{ fontSize: 12, color: 'var(--muted)', textAlign: 'center' }}>{t.compliance.drawerChatEmpty}</p>
+        )}
+        {messages.map(msg => (
+          <div key={msg.id} className={`message msg-${msg.role}`} style={{ maxWidth: '100%' }}>
+            {msg.role === 'assistant' && <div className="msg-avatar">AI</div>}
+            <div className="msg-bubble" style={{ fontSize: 13, whiteSpace: 'pre-wrap' }}>
+              {msg.content || (loading ? '…' : '')}
+            </div>
+            {msg.role === 'user' && <div className="msg-avatar user-av">You</div>}
+          </div>
+        ))}
+        <div ref={bottomRef} />
+      </div>
+
+      {/* Composer */}
+      <div style={{ padding: '10px 16px', borderTop: '1px solid var(--border)', display: 'flex', gap: 8 }}>
+        <textarea
+          className="composer-input"
+          placeholder={t.compliance.chatPlaceholder}
+          value={input}
+          rows={2}
+          style={{ flex: 1, fontSize: 13 }}
+          onChange={e => setInput(e.target.value)}
+          onKeyDown={e => { if (e.key === 'Enter' && !e.shiftKey) { e.preventDefault(); void send(); } }}
+        />
+        <button
+          className="btn primary"
+          disabled={!input.trim() || loading}
+          onClick={() => void send()}
+          style={{ alignSelf: 'flex-end' }}
+          title={t.compliance.sendBtn}
+        >
+          <Send size={14} />
+        </button>
+      </div>
+    </div>
+  );
+}
--- a/frontend/src/pages/Compliance/HistoryRail.tsx
+++ b/frontend/src/pages/Compliance/HistoryRail.tsx
@@ -0,0 +1,142 @@
+// frontend/src/pages/Compliance/HistoryRail.tsx
+import { useEffect, useState, useCallback } from 'react';
+import { Download, Trash2 } from 'lucide-react';
+import { useLanguage } from '../../contexts/LanguageContext';
+
+const TOKEN_KEY = 'auth_token';
+function authHeader(): Record<string, string> {
+  const t = localStorage.getItem(TOKEN_KEY);
+  return t ? { Authorization: `Bearer ${t}` } : {};
+}
+
+interface HistoryItem {
+  id: string;
+  created_at: string;
+  doc_name: string;
+  standard_name: string;
+  risk_score: number;
+  finding_count: number;
+}
+
+interface Props {
+  refreshTrigger: number;
+  onSelect: (id: string) => void;
+  selectedId: string | null;
+}
+
+function riskClass(score: number): string {
+  if (score >= 70) return 'risk-high';
+  if (score >= 40) return 'risk-medium';
+  return 'risk-low';
+}
+
+export function HistoryRail({ refreshTrigger, onSelect, selectedId }: Props) {
+  const [items, setItems] = useState<HistoryItem[]>([]);
+  const [deletingId, setDeletingId] = useState<string | null>(null);
+  const { t } = useLanguage();
+
+  const fetchHistory = useCallback(() => {
+    fetch('/api/v1/compliance/history?limit=30', { headers: authHeader() })
+      .then(r => r.json())
+      .then(data => {
+        if (Array.isArray(data)) setItems(data);
+      })
+      .catch(() => {/* backend may not have postgres configured */});
+  }, []);
+
+  useEffect(() => { fetchHistory(); }, [fetchHistory, refreshTrigger]);
+
+  function handleDownload(e: React.MouseEvent, item: HistoryItem) {
+    e.stopPropagation();
+    fetch(`/api/v1/compliance/history/${item.id}/download`, { headers: authHeader() })
+      .then(r => r.blob())
+      .then(blob => {
+        const blobUrl = URL.createObjectURL(blob);
+        const link = document.createElement('a');
+        link.href = blobUrl;
+        link.download = `compliance-${item.doc_name.slice(0, 30)}.docx`;
+        link.click();
+        URL.revokeObjectURL(blobUrl);
+      });
+  }
+
+  function handleDelete(e: React.MouseEvent, item: HistoryItem) {
+    e.stopPropagation();
+    if (!window.confirm(t.compliance.historyDeleteConfirm)) return;
+    setDeletingId(item.id);
+    fetch(`/api/v1/compliance/history/${item.id}`, {
+      method: 'DELETE',
+      headers: authHeader(),
+    })
+      .then(() => {
+        setItems(prev => prev.filter(i => i.id !== item.id));
+        setDeletingId(null);
+      })
+      .catch(() => setDeletingId(null));
+  }
+
+  function formatDate(iso: string): string {
+    try {
+      return new Date(iso).toLocaleDateString(undefined, { month: 'short', day: 'numeric' });
+    } catch {
+      return iso.slice(0, 10);
+    }
+  }
+
+  if (items.length === 0) {
+    return (
+      <div className="history-pane" style={{ minWidth: 200, maxWidth: 220 }}>
+        <div className="history-header">{t.compliance.historyHeader}</div>
+        <p style={{ padding: '12px 16px', fontSize: 12, color: 'var(--muted)', lineHeight: 1.5 }}>
+          {t.compliance.historyEmpty}
+        </p>
+      </div>
+    );
+  }
+
+  return (
+    <div className="history-pane" style={{ minWidth: 200, maxWidth: 220, overflowY: 'auto' }}>
+      <div className="history-header">{t.compliance.historyHeader}</div>
+      {items.map(item => (
+        <div
+          key={item.id}
+          className={`quick-item${selectedId === item.id ? ' active' : ''}`}
+          onClick={() => onSelect(item.id)}
+          style={{ cursor: 'pointer' }}
+        >
+          <div style={{ fontSize: 11, color: 'var(--muted)', marginBottom: 2 }}>
+            {formatDate(item.created_at)}
+          </div>
+          <div style={{ fontSize: 12, fontWeight: 500, marginBottom: 4, overflow: 'hidden', textOverflow: 'ellipsis', whiteSpace: 'nowrap' }}>
+            {item.doc_name || 'Untitled'}
+          </div>
+          <div style={{ display: 'flex', alignItems: 'center', gap: 6 }}>
+            <span className={`risk-badge ${riskClass(item.risk_score)}`} style={{ fontSize: 10 }}>
+              {item.risk_score}
+            </span>
+            <span style={{ fontSize: 10, color: 'var(--muted)', flex: 1 }}>
+              {item.finding_count} finding{item.finding_count !== 1 ? 's' : ''}
+            </span>
+            <button
+              className="btn icon-btn"
+              title={t.compliance.downloadReport}
+              onClick={e => handleDownload(e, item)}
+              style={{ padding: '2px 4px' }}
+            >
+              <Download size={11} />
+            </button>
+            <button
+              className="btn icon-btn danger"
+              title="Delete"
+              disabled={deletingId === item.id}
+              onClick={e => handleDelete(e, item)}
+              style={{ padding: '2px 4px' }}
+            >
+              <Trash2 size={11} />
+            </button>
+          </div>
+        </div>
+      ))}
+    </div>
+  );
+}
--- a/frontend/src/pages/Compliance/NewAnalysisModal.tsx
+++ b/frontend/src/pages/Compliance/NewAnalysisModal.tsx
@@ -1,6 +1,12 @@
 import { useState, useRef, useEffect } from 'react';
 import { X, Upload, FileText, Database } from 'lucide-react';

+const TOKEN_KEY = 'auth_token';
+function authHeader(): Record<string, string> {
+  const t = localStorage.getItem(TOKEN_KEY);
+  return t ? { Authorization: `Bearer ${t}` } : {};
+}
+
 interface DocOption {
  id: string;
  name: string;
@@ -30,7 +36,7 @@ export function NewAnalysisModal({ onClose, onSubmit }: Props) {

  // Fetch indexed docs for "From Document" tab
  useEffect(() => {
-    fetch('/api/v1/documents/management-list')
+    fetch('/api/v1/documents/management-list', { headers: authHeader() })
      .then(r => r.json())
      .then(d => {
        const list: DocOption[] = (d?.documents ?? d ?? []).map((item: Record<string, unknown>) => ({
--- a/frontend/src/pages/Compliance/useComplianceAnalysis.ts
+++ b/frontend/src/pages/Compliance/useComplianceAnalysis.ts
@@ -1,54 +1,33 @@
-import { useState, useCallback, useRef } from 'react';
+/**
+ * useComplianceAnalysis — compliance analysis state wired to PageStateContext.
+ *
+ * State is stored in the global context so it persists when the user navigates
+ * to another module and returns. The `run` and `reset` actions are identical
+ * to the previous hook API so CompliancePage needs no structural changes.
+ */

-export type AnalysisStatus = 'idle' | 'streaming' | 'done' | 'error';
+import { useCallback } from 'react';
+import { usePageState } from '../../contexts';
+import type {
+  ComplianceMeta,
+  ComplianceState,
+  ComplianceSourceEvent,
+  ComplianceFindingEvent,
+  ComplianceDonePayload,
+} from '../../contexts';

-export interface SourceEvent {
-  standard: string;
-  clause: string;
-  score: number;
-  status: string;
-  full_content: string;
+export type { ComplianceMeta, ComplianceState, ComplianceSourceEvent as SourceEvent, ComplianceFindingEvent as FindingEvent, ComplianceDonePayload as DonePayload };
+export type { ComplianceActionItem as ActionItem } from '../../contexts';
+export type AnalysisStatus = import('../../contexts').ComplianceStatus;
+export type AnalysisMeta = ComplianceMeta;
+
+const TOKEN_KEY = 'auth_token';
+function authHeader(): Record<string, string> {
+  const t = localStorage.getItem(TOKEN_KEY);
+  return t ? { Authorization: `Bearer ${t}` } : {};
 }

-export interface FindingEvent {
-  title: string;
-  desc: string;
-  status: 'ok' | 'warn' | 'risk';
-  clause_ref?: string;
-}
-
-export interface ActionItem {
-  label: string;
-  value: string;
-  risk?: boolean;
-}
-
-export interface DonePayload {
-  conclusion: string;
-  actions: ActionItem[];
-  risk_score: number;
-  highlight_terms: string[];
-  para_text: string;
-}
-
-export interface AnalysisMeta {
-  title: string;
-  sourceType: 'text' | 'doc' | 'upload';
-  startedAt: string; // ISO timestamp
-}
-
-export interface AnalysisState {
-  status: AnalysisStatus;
-  stageLabel: string;
-  stageKey: string;
-  meta: AnalysisMeta | null;
-  sources: SourceEvent[];
-  findings: FindingEvent[];
-  done: DonePayload | null;
-  errorText: string;
-}
-
-const INITIAL_STATE: AnalysisState = {
+const INITIAL_STATE: ComplianceState = {
  status: 'idle',
  stageLabel: '',
  stageKey: '',
@@ -57,27 +36,24 @@ const INITIAL_STATE: AnalysisState = {
  findings: [],
  done: null,
  errorText: '',
+  analysisId: null,
+  isReadOnly: false,
 };

 export function useComplianceAnalysis() {
-  const [state, setState] = useState<AnalysisState>(INITIAL_STATE);
-  const abortRef = useRef<AbortController | null>(null);
+  const { complianceState: state, setComplianceState: setState, complianceAbortRef, resetCompliance: reset } = usePageState();

-  const reset = useCallback(() => {
-    abortRef.current?.abort();
-    setState(INITIAL_STATE);
-  }, []);
-
-  const run = useCallback(async (formData: FormData, meta: AnalysisMeta) => {
-    abortRef.current?.abort();
+  const run = useCallback(async (formData: FormData, meta: ComplianceMeta) => {
+    complianceAbortRef.current?.abort();
    const ctrl = new AbortController();
-    abortRef.current = ctrl;
+    complianceAbortRef.current = ctrl;

    setState({ ...INITIAL_STATE, status: 'streaming', stageLabel: 'Starting…', meta });

    try {
      const res = await fetch('/api/v1/compliance/analyze-stream', {
        method: 'POST',
+        headers: authHeader(),
        body: formData,
        signal: ctrl.signal,
      });
@@ -117,7 +93,7 @@ export function useComplianceAnalysis() {
            if (j.type === 'stage') {
              setState(s => ({ ...s, stageLabel: j.label ?? '', stageKey: j.stage ?? '' }));
            } else if (j.type === 'source') {
-              const src: SourceEvent = {
+              const src: ComplianceSourceEvent = {
                standard: j.standard ?? '',
                clause: j.clause ?? '',
                score: j.score ?? 0,
@@ -126,7 +102,7 @@ export function useComplianceAnalysis() {
              };
              setState(s => ({ ...s, sources: [...s.sources, src] }));
            } else if (j.type === 'finding') {
-              const finding: FindingEvent = {
+              const finding: ComplianceFindingEvent = {
                title: j.title ?? '',
                desc: j.desc ?? '',
                status: j.status ?? 'info',
@@ -134,7 +110,7 @@ export function useComplianceAnalysis() {
              };
              setState(s => ({ ...s, findings: [...s.findings, finding] }));
            } else if (j.type === 'done') {
-              const payload: DonePayload = {
+              const payload: ComplianceDonePayload = {
                conclusion: j.conclusion ?? '',
                actions: j.actions ?? [],
                risk_score: j.risk_score ?? 0,
@@ -142,6 +118,8 @@ export function useComplianceAnalysis() {
                para_text: j.para_text ?? '',
              };
              setState(s => ({ ...s, status: 'done', done: payload, stageKey: 'concluding', stageLabel: 'Complete' }));
+            } else if (j.type === 'saved') {
+              setState(s => ({ ...s, analysisId: j.analysis_id ?? null }));
            } else if (j.type === 'error') {
              setState(s => ({ ...s, status: 'error', errorText: j.text ?? 'Unknown error' }));
            }
@@ -155,7 +133,7 @@ export function useComplianceAnalysis() {
      if (e instanceof Error && e.name === 'AbortError') return;
      setState(s => ({ ...s, status: 'error', errorText: String(e) }));
    }
-  }, []);
+  }, [setState, complianceAbortRef]);

  return { state, run, reset };
 }
--- a/frontend/src/pages/Docs/DocsPage.tsx
+++ b/frontend/src/pages/Docs/DocsPage.tsx
@@ -2,6 +2,13 @@ import { useState, useEffect, useCallback } from 'react';
 import { Topbar } from '../../components/layout/Topbar';
 import { Upload, Search, Download, Trash2, RefreshCw, AlertTriangle } from 'lucide-react';
 import { UploadModal } from './UploadModal';
+import { useLanguage } from '../../contexts/LanguageContext';
+
+const TOKEN_KEY = 'auth_token';
+function authHeader(): Record<string, string> {
+  const t = localStorage.getItem(TOKEN_KEY);
+  return t ? { Authorization: `Bearer ${t}` } : {};
+}

 interface Doc {
  id: string;
@@ -39,6 +46,7 @@ function ConfirmDialog({ message, onConfirm, onCancel }: {
  onConfirm: () => void;
  onCancel: () => void;
 }) {
+  const { t } = useLanguage();
  return (
    <div className="modal-overlay" onClick={onCancel}>
      <div
@@ -47,13 +55,13 @@ function ConfirmDialog({ message, onConfirm, onCancel }: {
      >
        <div style={{ display: 'flex', alignItems: 'center', gap: 10, marginBottom: 14 }}>
          <AlertTriangle size={18} color="var(--danger)" />
-          <span style={{ fontWeight: 600, fontSize: 15 }}>Confirm deletion</span>
+          <span style={{ fontWeight: 600, fontSize: 15 }}>{t.docs.confirmDeleteTitle}</span>
        </div>
        <p style={{ fontSize: 13, color: 'var(--muted)', lineHeight: 1.6, marginBottom: 20 }}>{message}</p>
        <div style={{ display: 'flex', gap: 10, justifyContent: 'flex-end' }}>
-          <button className="btn sm" onClick={onCancel}>Cancel</button>
+          <button className="btn sm" onClick={onCancel}>{t.docs.cancelBtn}</button>
          <button className="btn sm" style={{ background: 'var(--danger)', color: '#fff', borderColor: 'var(--danger)' }} onClick={onConfirm}>
-            Delete
+            {t.docs.deleteBtn}
          </button>
        </div>
      </div>
@@ -62,6 +70,7 @@ function ConfirmDialog({ message, onConfirm, onCancel }: {
 }

 export function DocsPage() {
+  const { t } = useLanguage();
  const [search, setSearch] = useState('');
  const [statusF, setStatusF] = useState('All');
  const [typeF, setTypeF] = useState('All types');
@@ -79,7 +88,7 @@ export function DocsPage() {

  const fetchDocs = useCallback(() => {
    setLoading(true);
-    fetch('/api/v1/documents/management-list')
+    fetch('/api/v1/documents/management-list', { headers: authHeader() })
      .then(r => r.json())
      .then(d => {
        if (!Array.isArray(d?.documents)) { setLoading(false); return; }
@@ -132,7 +141,7 @@ export function DocsPage() {
  async function retryDoc(id: string) {
    setRetrying(r => new Set([...r, id]));
    try {
-      await fetch(`/api/v1/documents/${id}/retry`, { method: 'POST' });
+      await fetch(`/api/v1/documents/${id}/retry`, { method: 'POST', headers: authHeader() });
      setTimeout(() => {
        setRetrying(r => { const s = new Set(r); s.delete(id); return s; });
        setRefreshKey(k => k + 1);
@@ -155,7 +164,7 @@ export function DocsPage() {
    setDeleting(new Set(ids));

    await Promise.allSettled(
-      ids.map(id => fetch(`/api/v1/documents/${id}`, { method: 'DELETE' }))
+      ids.map(id => fetch(`/api/v1/documents/${id}`, { method: 'DELETE', headers: authHeader() }))
    );

    setDeleting(new Set());
@@ -166,22 +175,22 @@ export function DocsPage() {
  return (
    <div className="docs-page">
      <Topbar
-        title="Document Management"
+        title={t.docs.topbarTitle}
        actions={
          <>
            <div className="search-box">
              <Search size={13} />
              <input
-                placeholder="Search documents..."
+                placeholder={t.docs.searchPlaceholder}
                value={search}
                onChange={e => setSearch(e.target.value)}
              />
            </div>
            <button className="btn sm" onClick={() => setRefreshKey(k => k + 1)}>
-              <RefreshCw size={13} />Refresh
+              <RefreshCw size={13} />{t.docs.refreshBtn}
            </button>
            <button className="btn sm primary" onClick={() => setShowUpload(true)}>
-              <Upload size={13} />Upload document
+              <Upload size={13} />{t.docs.uploadBtn}
            </button>
          </>
        }
@@ -195,24 +204,37 @@ export function DocsPage() {
                key={f}
                className={`chip${statusF === f ? ' active' : ''}`}
                onClick={() => setStatusF(f)}
-              >{f}</button>
+              >
+                {f === 'All' ? t.docs.filterAll
+                  : f === 'Ready' ? t.docs.filterReady
+                  : f === 'Processing' ? t.docs.filterProcessing
+                  : f === 'Failed' ? t.docs.filterFailed
+                  : t.docs.filterPending}
+              </button>
            ))}
          </div>
          <select className="select-input" value={typeF} onChange={e => setTypeF(e.target.value)}>
-            {typeOpts.map(o => <option key={o}>{o}</option>)}
+            {typeOpts.map(o => (
+              <option key={o} value={o}>{o === 'All types' ? t.docs.filterAllTypes : o}</option>
+            ))}
          </select>
        </div>

        {/* Batch action bar */}
        {selected.size > 0 && (
          <div className="batch-bar">
-            <span>{selected.size} document{selected.size > 1 ? 's' : ''} selected</span>
+            <span>
+              {selected.size}{' '}
+              {t.docs.colName === 'Document name'
+                ? `document${selected.size > 1 ? 's' : ''} selected`
+                : '份文档已选择'}
+            </span>
            <button
              className="btn sm"
              style={{ color: 'var(--danger)', borderColor: 'rgba(239,68,68,.4)' }}
              onClick={() => askDelete([...selected])}
            >
-              <Trash2 size={12} />Delete selected
+              <Trash2 size={12} />{t.docs.deleteSelected}
            </button>
          </div>
        )}
@@ -225,22 +247,22 @@ export function DocsPage() {
              checked={selected.size === filtered.length && filtered.length > 0}
              onChange={toggleAll}
            />
-            <span>Document name</span>
-            <span>Status</span>
-            <span>Uploaded</span>
-            <span>Chunks</span>
-            <span>Size</span>
-            <span>Type</span>
-            <span>Actions</span>
+            <span>{t.docs.colName}</span>
+            <span>{t.docs.colStatus}</span>
+            <span>{t.docs.colUploaded}</span>
+            <span>{t.docs.colChunks}</span>
+            <span>{t.docs.colSize}</span>
+            <span>{t.docs.colType}</span>
+            <span>{t.docs.colActions}</span>
          </div>

          {loading ? (
            <div style={{ padding: '32px 16px', color: 'var(--muted)', fontSize: 13, textAlign: 'center' }}>
-              Loading documents…
+              {t.docs.loading}
            </div>
          ) : filtered.length === 0 ? (
            <div style={{ padding: '40px 16px', color: 'var(--muted)', fontSize: 13, textAlign: 'center' }}>
-              {docs.length === 0 ? 'No documents yet. Upload a document to get started.' : 'No documents match the current filters.'}
+              {docs.length === 0 ? t.docs.emptyNoDocuments : t.docs.emptyNoMatch}
            </div>
          ) : (
            filtered.map(d => {
@@ -270,7 +292,7 @@ export function DocsPage() {
                    {/* Download */}
                    <button
                      className="text-link"
-                      title="Download original file"
+                      title={t.docs.titleDownload}
                      onClick={() => downloadDoc(d.id, d.name)}
                    >
                      <Download size={12} />
@@ -280,7 +302,7 @@ export function DocsPage() {
                    {d.status === 'risk' && (
                      <button
                        className="text-link"
-                        title="Retry processing"
+                        title={t.docs.titleRetry}
                        disabled={isRetrying}
                        onClick={() => retryDoc(d.id)}
                        style={{ color: 'var(--warn)' }}
@@ -292,7 +314,7 @@ export function DocsPage() {
                    {/* Delete */}
                    <button
                      className="text-link danger-link"
-                      title="Delete document"
+                      title={t.docs.titleDelete}
                      disabled={isDeleting}
                      onClick={() => askDelete([d.id])}
                    >
--- a/frontend/src/pages/Docs/UploadModal.tsx
+++ b/frontend/src/pages/Docs/UploadModal.tsx
@@ -1,6 +1,12 @@
 import { useState, useRef, useCallback } from 'react';
 import { X, Upload } from 'lucide-react';

+const TOKEN_KEY = 'auth_token';
+function authHeader(): Record<string, string> {
+  const t = localStorage.getItem(TOKEN_KEY);
+  return t ? { Authorization: `Bearer ${t}` } : {};
+}
+
 interface Props {
  onClose: () => void;
  onComplete?: () => void;  // called when all uploads finish (indexed)
@@ -44,11 +50,6 @@ function docStatusToStages(status: DocStatus): StageState[] {
  }
 }

-// Generate a short unique ID client-side (matches backend's 8-char uuid prefix pattern)
-function genDocId(): string {
-  return Math.random().toString(36).slice(2, 10);
-}
-
 export function UploadModal({ onClose, onComplete }: Props) {
  const [files, setFiles] = useState<File[]>([]);
  const [regType, setRegType] = useState(REG_TYPES[0]);
@@ -93,13 +94,14 @@ export function UploadModal({ onClose, onComplete }: Props) {

  const pollStatus = useCallback((docId: string, resolve: () => void, reject: (msg: string) => void) => {
    let attempts = 0;
-    const MAX_ATTEMPTS = 120; // 4 minutes at 2s interval
+    const MAX_ATTEMPTS = 450; // 15 minutes at 2s interval — Aliyun DocMind can take several minutes
    stopPolling();
    pollTimer.current = setInterval(async () => {
      attempts++;
      try {
-        const res = await fetch(`/api/v1/documents/status/${docId}`);
+        const res = await fetch(`/api/v1/documents/status/${docId}`, { headers: authHeader() });
        if (!res.ok) {
+          // Transient HTTP error (e.g. 502 during restart) — keep polling until timeout.
          if (attempts > MAX_ATTEMPTS) { stopPolling(); reject('Polling timeout'); }
          return;
        }
@@ -114,7 +116,7 @@ export function UploadModal({ onClose, onComplete }: Props) {
          reject(data.message ?? 'Processing failed');
        } else if (attempts > MAX_ATTEMPTS) {
          stopPolling();
-          reject('Processing timeout — check Document Management for status');
+          reject('Processing timeout (15 min) — check Document Management for status');
        }
      } catch {
        // network hiccup — keep polling
@@ -127,37 +129,42 @@ export function UploadModal({ onClose, onComplete }: Props) {
    setCurrentFileIdx(idx);
    setDocStatus('idle');

-    const docId = genDocId();
    const form = new FormData();
    form.append('file', file);
-    form.append('doc_id', docId);
    form.append('doc_name', file.name);
    form.append('regulation_type', regType);
    if (version) form.append('version', version);
    form.append('generate_summary', 'false');

-    // Fire upload — this is a long-running synchronous call on the backend.
-    // We start polling immediately so the UI updates as the backend writes status transitions.
-    const uploadPromise = fetch('/api/v1/documents/upload', { method: 'POST', body: form });
+    // Upload the file first — response contains the authoritative doc_id.
+    // Without waiting here we risk polling an ID the server has not yet created.
+    let docId: string;
+    const uploadRes = await fetch('/api/v1/documents/upload', {
+      method: 'POST',
+      headers: authHeader(),
+      body: form,
+    });
+    if (!uploadRes.ok) {
+      const detail = await uploadRes.text().catch(() => uploadRes.statusText);
+      throw new Error(`${file.name}: ${uploadRes.status} ${detail}`);
+    }
+    const uploadData = await uploadRes.json() as { doc_id: string; status: string };
+    docId = uploadData.doc_id;

-    // Start polling after a short delay so the backend has time to create the document record
+    // If backend processed synchronously (sync=true or status already 'indexed'), resolve immediately.
+    if (uploadData.status === 'indexed') {
+      setDocStatus('indexed');
+      return;
+    }
+    if (uploadData.status === 'failed') {
+      setDocStatus('failed');
+      throw new Error(`${file.name}: Processing failed on server`);
+    }
+
+    // Otherwise start polling the authoritative doc_id returned by the server.
+    setDocStatus(uploadData.status as DocStatus);
    await new Promise<void>((res, rej) => {
-      const reject = (msg: string) => rej(new Error(msg));
-      // Begin polling immediately — backend creates the record synchronously before processing
-      setTimeout(() => pollStatus(docId, res, reject), 800);
-
-      // Also handle the upload response (in case processing finishes before poll catches it)
-      uploadPromise.then(async httpRes => {
-        if (!httpRes.ok) {
-          const detail = await httpRes.text().catch(() => httpRes.statusText);
-          stopPolling();
-          reject(`${file.name}: ${httpRes.status} ${detail}`);
-        }
-        // Upload succeeded — polling will catch the final status
-      }).catch(err => {
-        stopPolling();
-        reject(err instanceof Error ? err.message : 'Upload error');
-      });
+      pollStatus(docId, res, (msg: string) => rej(new Error(msg)));
    });
  }

--- a/frontend/src/pages/Login/LoginPage.tsx
+++ b/frontend/src/pages/Login/LoginPage.tsx
@@ -0,0 +1,80 @@
+import React, { FormEvent, useState } from 'react';
+import { useAuth } from '../../contexts';
+
+export function LoginPage() {
+  const { login } = useAuth();
+  const [username, setUsername] = useState('');
+  const [password, setPassword] = useState('');
+  const [error, setError] = useState('');
+  const [loading, setLoading] = useState(false);
+
+  async function handleSubmit(e: FormEvent) {
+    e.preventDefault();
+    if (!username.trim() || !password.trim()) return;
+    setError('');
+    setLoading(true);
+    try {
+      await login(username.trim(), password);
+    } catch (err) {
+      setError(err instanceof Error ? err.message : 'Login failed');
+    } finally {
+      setLoading(false);
+    }
+  }
+
+  return (
+    <div className="login-page">
+      <div className="login-card">
+        <div className="login-brand">
+          <img src="/company-logo.ico" alt="T-Systems" className="login-logo" />
+          <div className="login-brand-text">
+            <div className="login-brand-name">T-Systems</div>
+            <div className="login-brand-sub">AI Regulation Hub</div>
+          </div>
+        </div>
+
+        <h2 className="login-title">Sign in</h2>
+
+        <form onSubmit={handleSubmit} className="login-form">
+          <div className="login-field">
+            <label className="login-label" htmlFor="username">Username</label>
+            <input
+              id="username"
+              type="text"
+              className="login-input"
+              value={username}
+              onChange={e => setUsername(e.target.value)}
+              autoFocus
+              autoComplete="username"
+              disabled={loading}
+              placeholder="e.g. admin"
+            />
+          </div>
+
+          <div className="login-field">
+            <label className="login-label" htmlFor="password">Password</label>
+            <input
+              id="password"
+              type="password"
+              className="login-input"
+              value={password}
+              onChange={e => setPassword(e.target.value)}
+              autoComplete="current-password"
+              disabled={loading}
+            />
+          </div>
+
+          {error && <p className="login-error">{error}</p>}
+
+          <button type="submit" className="login-btn" disabled={loading}>
+            {loading ? 'Signing in…' : 'Sign in'}
+          </button>
+        </form>
+
+        <p className="login-hint">
+          Demo accounts: <code>admin</code> / <code>legal</code> / <code>ehs</code> / <code>readonly</code>
+        </p>
+      </div>
+    </div>
+  );
+}
--- a/frontend/src/pages/Overview/OverviewPage.tsx
+++ b/frontend/src/pages/Overview/OverviewPage.tsx
@@ -1,87 +1,93 @@
 import { useNavigate } from 'react-router-dom';
 import { ArrowRight, BarChart2, Eye, FileText, Shield, MessageSquare, Monitor } from 'lucide-react';
-
-const SCREENS = [
-  { id: 'status', label: 'System Status', icon: <Monitor size={20} />, to: '/status', desc: 'Live health and workflow queue' },
-  { id: 'signals', label: 'Regulatory Signals', icon: <Eye size={20} />, to: '/signals', desc: 'AI-detected regulatory changes' },
-  { id: 'documents', label: 'Document Management', icon: <FileText size={20} />, to: '/documents', desc: 'Upload and inspect documents' },
-  { id: 'compliance', label: 'Compliance Analysis', icon: <Shield size={20} />, to: '/compliance', desc: 'Three-column compliance workspace' },
-  { id: 'chat', label: 'Regulation Q&A', icon: <MessageSquare size={20} />, to: '/chat', desc: 'Chat with cited regulation sources' },
-  { id: 'analytics', label: 'Analytics', icon: <BarChart2 size={20} />, to: '/status', desc: 'KPIs and coverage metrics' },
-];
-
-const STEPS = [
-  { num: '01', label: 'Upload', desc: 'Ingest regulation documents' },
-  { num: '02', label: 'Process', desc: 'Embed and chunk via vector DB' },
-  { num: '03', label: 'Monitor', desc: 'Watch regulatory signal feed' },
-  { num: '04', label: 'Analyze', desc: 'Run compliance gap analysis' },
-  { num: '05', label: 'Review', desc: 'Inspect findings with AI assist' },
-  { num: '06', label: 'Chat', desc: 'Ask questions with cited answers' },
-];
+import { useLanguage } from '../../contexts/LanguageContext';

 export function OverviewPage() {
  const navigate = useNavigate();
+  const { t } = useLanguage();
+
+  const SCREENS = [
+    { id: 'status', label: t.overview.screenStatus, icon: <Monitor size={20} />, to: '/status', desc: t.overview.screenStatusDesc },
+    { id: 'signals', label: t.overview.screenSignals, icon: <Eye size={20} />, to: '/signals', desc: t.overview.screenSignalsDesc },
+    { id: 'documents', label: t.overview.screenDocuments, icon: <FileText size={20} />, to: '/documents', desc: t.overview.screenDocumentsDesc },
+    { id: 'compliance', label: t.overview.screenCompliance, icon: <Shield size={20} />, to: '/compliance', desc: t.overview.screenComplianceDesc },
+    { id: 'chat', label: t.overview.screenChat, icon: <MessageSquare size={20} />, to: '/chat', desc: t.overview.screenChatDesc },
+    { id: 'analytics', label: t.overview.screenAnalytics, icon: <BarChart2 size={20} />, to: '/status', desc: t.overview.screenAnalyticsDesc },
+  ];
+
+  const STEPS = [
+    { num: '01', label: t.overview.stepUpload, desc: t.overview.stepUploadDesc },
+    { num: '02', label: t.overview.stepProcess, desc: t.overview.stepProcessDesc },
+    { num: '03', label: t.overview.stepMonitor, desc: t.overview.stepMonitorDesc },
+    { num: '04', label: t.overview.stepAnalyze, desc: t.overview.stepAnalyzeDesc },
+    { num: '05', label: t.overview.stepReview, desc: t.overview.stepReviewDesc },
+    { num: '06', label: t.overview.stepChat, desc: t.overview.stepChatDesc },
+  ];
+
  return (
-    <div className="overview-page">
-      <section className="overview-hero">
-        <p className="hero-eyebrow">T-Systems · AI Regulation Hub</p>
-        <h1 className="hero-title">AI Compliance,<br />Automated end-to-end</h1>
-        <p className="hero-desc">
-          Monitor global AI regulations, analyze document compliance gaps,
-          and get cited answers — all in one platform.
-        </p>
-        <div className="hero-actions">
-          <button className="btn primary" onClick={() => navigate('/status')}>
-            Open dashboard <ArrowRight size={14} />
-          </button>
-          <button className="btn" onClick={() => navigate('/chat')}>
-            Jump to regulation chat
-          </button>
-        </div>
-      </section>
-
-      <div className="overview-summary card">
-        <div className="summary-item">
-          <span className="summary-num">6</span>
-          <span className="summary-label">Screens</span>
-        </div>
-        <div className="summary-divider" />
-        <div className="summary-item">
-          <span className="summary-num">5</span>
-          <span className="summary-label">Backend-aware flows</span>
-        </div>
-        <div className="summary-divider" />
-        <div className="summary-item">
-          <span className="summary-num">AI</span>
-          <span className="summary-label">Review posture</span>
-        </div>
-      </div>
-
-      <section className="overview-workflow">
-        <h2 className="section-title">How it works</h2>
-        <div className="workflow-steps">
-          {STEPS.map(s => (
-            <div key={s.num} className="workflow-step">
-              <div className="step-num">{s.num}</div>
-              <div className="step-label">{s.label}</div>
-              <div className="step-desc">{s.desc}</div>
-            </div>
-          ))}
-        </div>
-      </section>
-
-      <section className="overview-screens">
-        <h2 className="section-title">Screens</h2>
-        <div className="screen-grid">
-          {SCREENS.map(s => (
-            <button key={s.id} className="screen-card card" onClick={() => navigate(s.to)}>
-              <div className="screen-icon">{s.icon}</div>
-              <div className="screen-label">{s.label}</div>
-              <div className="screen-desc">{s.desc}</div>
+    <div className="overview-scroll-wrapper">
+      <div className="overview-page">
+        <section className="overview-hero">
+          <p className="hero-eyebrow">{t.overview.eyebrow}</p>
+          <h1 className="hero-title">
+            {t.overview.heroTitle.split('\n').map((line, i) => (
+              <span key={i}>{line}{i === 0 && <br />}</span>
+            ))}
+          </h1>
+          <p className="hero-desc">{t.overview.heroDesc}</p>
+          <div className="hero-actions">
+            <button className="btn primary" onClick={() => navigate('/status')}>
+              {t.overview.openDashboard} <ArrowRight size={14} />
            </button>
-          ))}
+            <button className="btn" onClick={() => navigate('/chat')}>
+              {t.overview.jumpToChat}
+            </button>
+          </div>
+        </section>
+
+        <div className="overview-summary card">
+          <div className="summary-item">
+            <span className="summary-num">6</span>
+            <span className="summary-label">{t.overview.statScreens}</span>
+          </div>
+          <div className="summary-divider" />
+          <div className="summary-item">
+            <span className="summary-num">5</span>
+            <span className="summary-label">{t.overview.statFlows}</span>
+          </div>
+          <div className="summary-divider" />
+          <div className="summary-item">
+            <span className="summary-num">AI</span>
+            <span className="summary-label">{t.overview.statReviewPosture}</span>
+          </div>
        </div>
-      </section>
+
+        <section className="overview-workflow">
+          <h2 className="section-title">{t.overview.sectionHowItWorks}</h2>
+          <div className="workflow-steps">
+            {STEPS.map(s => (
+              <div key={s.num} className="workflow-step">
+                <div className="step-num">{s.num}</div>
+                <div className="step-label">{s.label}</div>
+                <div className="step-desc">{s.desc}</div>
+              </div>
+            ))}
+          </div>
+        </section>
+
+        <section className="overview-screens">
+          <h2 className="section-title">{t.overview.sectionScreens}</h2>
+          <div className="screen-grid">
+            {SCREENS.map(s => (
+              <button key={s.id} className="screen-card card" onClick={() => navigate(s.to)}>
+                <div className="screen-icon">{s.icon}</div>
+                <div className="screen-label">{s.label}</div>
+                <div className="screen-desc">{s.desc}</div>
+              </button>
+            ))}
+          </div>
+        </section>
+      </div>
    </div>
  );
 }
--- a/frontend/src/pages/Perception/PerceptionPage.tsx
+++ b/frontend/src/pages/Perception/PerceptionPage.tsx
@@ -1,17 +1,14 @@
 import { useState, useEffect, useRef } from 'react';
 import { Topbar } from '../../components/layout/Topbar';
 import { RefreshCw, Play, Square, ExternalLink } from 'lucide-react';
+import { usePageState } from '../../contexts';
+import type { PerceptionSignal } from '../../contexts';
+import { useLanguage } from '../../contexts/LanguageContext';

-interface Signal {
-  id: string;
-  source: string;
-  standard: string;
-  status: 'ok' | 'warn' | 'risk' | 'info';
-  title: string;
-  summary: string;
-  date: string;
-  tags: string[];
-  impact: 'High' | 'Medium' | 'Low';
+const TOKEN_KEY = 'auth_token';
+function authHeader(): Record<string, string> {
+  const t = localStorage.getItem(TOKEN_KEY);
+  return t ? { Authorization: `Bearer ${t}` } : {};
 }

 interface Stats {
@@ -21,29 +18,17 @@ interface Stats {
  last_90_days: number;
 }

-interface DocResult {
-  score: number;
-  name: string;
-  clause: string;
-  snippet: string;
-}
-
 const SOURCES = ['All', 'MIIT', 'UN-ECE', 'ISO', 'GB Comm.', 'EUR-Lex', 'IATF'];
 const IMPACTS = ['All', 'High', 'Medium', 'Low'];

-// Backend /api/v1/perception/stats returns:
-// { total, high_impact, medium_impact, last_90_days } — field names match, ✓
-
-// Backend /api/v1/perception/events returns:
-// { events: [{ id, title, summary, source, standard, impact_level, published_at, tags, status }] }
-// Map backend event fields → frontend Signal shape
-function mapEvent(e: Record<string, unknown>): Signal {
+// Backend event → Signal
+function mapEvent(e: Record<string, unknown>): PerceptionSignal {
  const impact = String(e.impact_level ?? '').toLowerCase();
  const backendStatus = String(e.status ?? '').toLowerCase();
  return {
    id: String(e.id ?? e.event_id ?? ''),
    source: String(e.source ?? ''),
-    standard: String(e.standard ?? e.regulation_id ?? ''),
+    standard: String(e.standard ?? e.standard_code ?? e.regulation_id ?? ''),
    status: backendStatus === 'high' || backendStatus === 'urgent' ? 'risk'
          : backendStatus === 'medium' || backendStatus === 'draft' ? 'warn'
          : backendStatus === 'low' || backendStatus === 'final' ? 'ok'
@@ -56,67 +41,78 @@ function mapEvent(e: Record<string, unknown>): Signal {
  };
 }

-const MOCK_SIGNALS: Signal[] = [
+const MOCK_SIGNALS: PerceptionSignal[] = [
  {
    id: '1', source: 'EUR-Lex', standard: 'EU/2024/1689', status: 'risk',
    title: 'EU AI Act — High-risk AI in vehicles',
    summary: 'Article 9 mandates risk management systems for automotive AI classifying as high-risk under Annex III point 3.',
-    date: '2025-11-18', tags: ['automotive', 'GDPR', 'certification'], impact: 'High'
+    date: '2025-11-18', tags: ['automotive', 'GDPR', 'certification'], impact: 'High',
  },
  {
    id: '2', source: 'MIIT', standard: 'Draft-2025-08', status: 'warn',
    title: 'MIIT Draft — in-vehicle AI training data',
    summary: 'Draft regulation requires OEM data provenance documentation and OTA audit trails for AI systems.',
-    date: '2025-10-30', tags: ['OTA', 'data-governance', 'China'], impact: 'High'
+    date: '2025-10-30', tags: ['OTA', 'data-governance', 'China'], impact: 'High',
  },
  {
    id: '3', source: 'ISO', standard: 'ISO/SAE 21434:2021/Amd1', status: 'info',
    title: 'ISO/SAE 21434 Amendment 1',
    summary: 'Amendment clarifies CSMS scope for software-only updates and vulnerability disclosure timelines.',
-    date: '2025-10-05', tags: ['cybersecurity', 'CSMS', 'ISO'], impact: 'Medium'
+    date: '2025-10-05', tags: ['cybersecurity', 'CSMS', 'ISO'], impact: 'Medium',
  },
-  {
-    id: '4', source: 'UN-ECE', standard: 'UNECE WP.29 R155', status: 'ok',
-    title: 'UNECE R155 Corrigendum',
-    summary: 'Editorial corrections to cybersecurity management system requirements. No substantive changes.',
-    date: '2025-09-12', tags: ['type-approval', 'UNECE'], impact: 'Low'
-  },
-];
-
-const MOCK_DOCS: DocResult[] = [
-  { score: 94, name: 'Vehicle AI Safety Manual v3.2', clause: '§4.2.1', snippet: 'The risk management process shall identify and evaluate risks arising from AI system decisions in safety-critical scenarios...' },
-  { score: 87, name: 'ADAS System Requirements', clause: '§7.1', snippet: 'Automated driving functions must document training data lineage and model performance envelopes prior to deployment.' },
-  { score: 71, name: 'Type Approval Documentation', clause: 'Annex B', snippet: 'Cybersecurity management system certification requires third-party audit of AI decision audit logs retention policy.' },
 ];

 export function PerceptionPage() {
-  const [stats, setStats] = useState<Stats | null>(null);
-  const [signals, setSignals] = useState<Signal[]>(MOCK_SIGNALS);
-  const [searchQuery, setSearchQuery] = useState('');
-  const [sourceFilter, setSourceFilter] = useState('All');
-  const [impactFilter, setImpactFilter] = useState('All');
-  const [selected, setSelected] = useState<Signal | null>(null);
-  const [streaming, setStreaming] = useState(false);
-  const [aiOutput, setAiOutput] = useState('');
-  const abortRef = useRef<AbortController | null>(null);
+  const { t } = useLanguage();
+  // Persistent state lives in PageStateContext — survives route changes
+  const { perceptionState, setPerceptionState, perceptionAbortRef, perceptionCrawlAbortRef } = usePageState();
+  const { signals, searchQuery, sourceFilter, impactFilter, selectedId, aiOutput, detailTab, crawlStatus } = perceptionState;

+  // Stats and selectedFull are lightweight to re-fetch on mount
+  const [stats, setStats] = useState<Stats | null>(null);
+  const [streaming, setStreaming] = useState(false);
+  const [crawling, setCrawling] = useState(false);
+  // Full event detail — re-fetched when selected changes or page mounts with a selection
+  const [selectedFull, setSelectedFull] = useState<Record<string, unknown> | null>(null);
+
+  // Re-fetch stats every time the page mounts
  useEffect(() => {
-    fetch('/api/v1/perception/stats')
+    fetch('/api/v1/perception/stats', { headers: authHeader() })
      .then(r => r.json())
      .then(setStats)
      .catch(() => setStats({ total: 47, high_impact: 7, medium_impact: 18, last_90_days: 14 }));
  }, []);

+  // Fetch signal list on first mount only (if empty), otherwise preserve context state
  useEffect(() => {
-    fetch('/api/v1/perception/events?limit=100')
+    if (signals.length > 0) return; // already loaded
+    fetch('/api/v1/perception/events?limit=100', { headers: authHeader() })
      .then(r => r.json())
      .then(d => {
        if (Array.isArray(d?.events) && d.events.length > 0) {
-          setSignals(d.events.map(mapEvent));
+          setPerceptionState(s => ({ ...s, signals: d.events.map(mapEvent) }));
+        } else {
+          setPerceptionState(s => ({ ...s, signals: MOCK_SIGNALS }));
        }
      })
-      .catch(() => { /* keep mock data on error */ });
-  }, []);
+      .catch(() => {
+        setPerceptionState(s => ({ ...s, signals: s.signals.length > 0 ? s.signals : MOCK_SIGNALS }));
+      });
+  }, []); // eslint-disable-line react-hooks/exhaustive-deps
+
+  // Re-fetch full event detail when navigating back with a selected signal
+  useEffect(() => {
+    if (selectedId) {
+      fetch(`/api/v1/perception/events/${selectedId}`, { headers: authHeader() })
+        .then(r => r.ok ? r.json() : null)
+        .then(d => { if (d) setSelectedFull(d); })
+        .catch(() => {});
+    } else {
+      setSelectedFull(null);
+    }
+  }, [selectedId]);
+
+  const selected = signals.find(s => s.id === selectedId) ?? null;

  const filtered = signals.filter(s => {
    if (sourceFilter !== 'All' && s.source !== sourceFilter) return false;
@@ -131,13 +127,20 @@ export function PerceptionPage() {
  function runAnalysis() {
    if (!selected) return;
    setStreaming(true);
-    setAiOutput('');
+    setPerceptionState(s => ({ ...s, aiOutput: '' }));
    const ctrl = new AbortController();
-    abortRef.current = ctrl;
-    // Backend: POST /api/v1/perception/events/{id}/analyze  → SSE stream
-    fetch(`/api/v1/perception/events/${selected.id}/analyze`, { method: 'POST', signal: ctrl.signal })
+    perceptionAbortRef.current = ctrl;
+    fetch(`/api/v1/perception/events/${selected.id}/analyze`, {
+      method: 'POST',
+      headers: authHeader(),
+      signal: ctrl.signal,
+    })
      .then(async res => {
-        if (!res.body) { setAiOutput('No stream available.'); setStreaming(false); return; }
+        if (!res.body) {
+          setPerceptionState(s => ({ ...s, aiOutput: 'No stream available.' }));
+          setStreaming(false);
+          return;
+        }
        const reader = res.body.getReader();
        const dec = new TextDecoder();
        let buf = '';
@@ -154,47 +157,124 @@ export function PerceptionPage() {
            if (!raw || raw === '[DONE]') continue;
            try {
              const j = JSON.parse(raw);
-              if (j.text) setAiOutput(p => p + j.text);
-              else if (typeof j === 'string') setAiOutput(p => p + j);
+              if (j.text) setPerceptionState(s => ({ ...s, aiOutput: s.aiOutput + j.text }));
+              else if (typeof j === 'string') setPerceptionState(s => ({ ...s, aiOutput: s.aiOutput + j }));
            } catch {
-              setAiOutput(p => p + raw);
+              setPerceptionState(s => ({ ...s, aiOutput: s.aiOutput + raw }));
            }
          }
        }
        setStreaming(false);
      })
      .catch(e => {
-        if (e.name !== 'AbortError') setAiOutput('Analysis failed. Check API connection.');
+        if (e.name !== 'AbortError') setPerceptionState(s => ({ ...s, aiOutput: 'Analysis failed. Check API connection.' }));
        setStreaming(false);
      });
  }

  function stopAnalysis() {
-    abortRef.current?.abort();
+    perceptionAbortRef.current?.abort();
    setStreaming(false);
  }

-  function selectSignal(sig: Signal) {
-    setSelected(sig);
-    setAiOutput('');
+  async function runCrawl() {
+    setCrawling(true);
+    setPerceptionState(s => ({ ...s, crawlStatus: t.signals.statusConnecting }));
+    try {
+      const res = await fetch('/api/v1/perception/crawl', {
+        method: 'POST',
+        headers: { 'Content-Type': 'application/json', ...authHeader() },
+        body: JSON.stringify({}),
+      });
+      if (!res.body) {
+        setPerceptionState(s => ({ ...s, crawlStatus: 'No stream' }));
+        setCrawling(false);
+        return;
+      }
+      const reader = res.body.getReader();
+      const dec = new TextDecoder();
+      let buf = '';
+      while (true) {
+        const { done, value } = await reader.read();
+        if (done) break;
+        buf += dec.decode(value);
+        const parts = buf.split('\n\n');
+        buf = parts.pop() ?? '';
+        for (const block of parts) {
+          const eventLine = block.split('\n').find(l => l.startsWith('event: '));
+          const dataLine = block.split('\n').find(l => l.startsWith('data: '));
+          const evtName = eventLine?.slice(7).trim();
+          const raw = dataLine?.slice(6).trim();
+          if (!raw) continue;
+          try {
+            const d = JSON.parse(raw);
+            if (evtName === 'progress') {
+              setPerceptionState(s => ({
+                ...s,
+                crawlStatus: `${d.source}: ${d.stage === 'fetching' ? t.signals.statusCrawling : d.stage === 'processing' ? t.signals.statusProcessing.replace('{count}', String(d.fetched)) : t.signals.statusComplete.replace('{count}', String(d.new))}`,
+              }));
+            } else if (evtName === 'done') {
+              setPerceptionState(s => ({ ...s, crawlStatus: t.signals.statusUpdateComplete.replace('{new}', String(d.total_new)).replace('{updated}', String(d.total_updated)) }));
+              fetch('/api/v1/perception/events?limit=100', { headers: authHeader() })
+                .then(r => r.json())
+                .then(d2 => {
+                  if (Array.isArray(d2?.events)) {
+                    setPerceptionState(s => ({ ...s, signals: d2.events.map(mapEvent) }));
+                  }
+                });
+            } else if (evtName === 'error') {
+              setPerceptionState(s => ({
+                ...s,
+                crawlStatus: t.signals.statusError.replace('{message}', typeof d === 'string' ? d : String(d.message)),
+              }));
+            }
+          } catch { /* ignore */ }
+        }
+      }
+    } catch (e: unknown) {
+      setPerceptionState(s => ({
+        ...s,
+        crawlStatus: t.signals.statusConnFailed.replace('{message}', e instanceof Error ? e.message : String(e)),
+      }));
+    }
+    setCrawling(false);
+  }
+
+  function selectSignal(sig: PerceptionSignal) {
+    setPerceptionState(s => ({
+      ...s,
+      selectedId: sig.id,
+      aiOutput: '',
+      detailTab: 'overview',
+    }));
+    setSelectedFull(null);
    setStreaming(false);
+    perceptionAbortRef.current?.abort();
  }

  return (
    <div className="perception-page">
      <Topbar
-        title="Regulatory Signals"
-        subtitle="ai-powered · live feed"
+        title={t.signals.topbarTitle}
+        subtitle={t.signals.topbarSub}
        actions={
          <>
            <div className="search-box">
              <input
-                placeholder="Search signals..."
+                placeholder={t.signals.searchPlaceholder}
                value={searchQuery}
-                onChange={e => setSearchQuery(e.target.value)}
+                onChange={e => setPerceptionState(s => ({ ...s, searchQuery: e.target.value }))}
              />
            </div>
-            <button className="btn sm"><RefreshCw size={13} />Refresh</button>
+            <button className="btn sm primary" onClick={runCrawl} disabled={crawling}>
+              <RefreshCw size={13} className={crawling ? 'spin' : ''} />
+              {crawling ? t.signals.crawlingBtn : t.signals.refreshBtn}
+            </button>
+            {crawlStatus && (
+              <span style={{ fontSize: 12, color: 'var(--text-secondary)', marginLeft: 8 }}>
+                {crawlStatus}
+              </span>
+            )}
          </>
        }
      />
@@ -202,32 +282,44 @@ export function PerceptionPage() {
      <div className="stats-bar">
        <div className="sbar-cell">
          <span className="sbar-val">{stats?.total ?? '—'}</span>
-          <span className="sbar-lbl">Total signals</span>
+          <span className="sbar-lbl">{t.signals.statTotal}</span>
        </div>
        <div className="sbar-cell danger">
          <span className="sbar-val">{stats?.high_impact ?? '—'}</span>
-          <span className="sbar-lbl">High impact</span>
+          <span className="sbar-lbl">{t.signals.statHigh}</span>
        </div>
        <div className="sbar-cell warn">
          <span className="sbar-val">{stats?.medium_impact ?? '—'}</span>
-          <span className="sbar-lbl">Medium impact</span>
+          <span className="sbar-lbl">{t.signals.statMedium}</span>
        </div>
        <div className="sbar-cell accent">
          <span className="sbar-val">{stats?.last_90_days ?? '—'}</span>
-          <span className="sbar-lbl">Last 90 days</span>
+          <span className="sbar-lbl">{t.signals.statLast90}</span>
        </div>
      </div>

      <div className="filter-bar">
        <div className="chip-group">
          {SOURCES.map(s => (
-            <button key={s} className={`chip${sourceFilter === s ? ' active' : ''}`} onClick={() => setSourceFilter(s)}>{s}</button>
+            <button
+              key={s}
+              className={`chip${sourceFilter === s ? ' active' : ''}`}
+              onClick={() => setPerceptionState(st => ({ ...st, sourceFilter: s }))}
+            >
+              {s}
+            </button>
          ))}
        </div>
        <div className="filter-sep" />
        <div className="chip-group">
          {IMPACTS.map(i => (
-            <button key={i} className={`chip${impactFilter === i ? ' active' : ''}`} onClick={() => setImpactFilter(i)}>{i}</button>
+            <button
+              key={i}
+              className={`chip${impactFilter === i ? ' active' : ''}`}
+              onClick={() => setPerceptionState(st => ({ ...st, impactFilter: i }))}
+            >
+              {i}
+            </button>
          ))}
        </div>
      </div>
@@ -237,21 +329,21 @@ export function PerceptionPage() {
          {filtered.map(sig => (
            <div
              key={sig.id}
-              className={`ev-card${selected?.id === sig.id ? ' selected' : ''}`}
+              className={`ev-card${selectedId === sig.id ? ' selected' : ''}`}
              onClick={() => selectSignal(sig)}
            >
              <div className="ev-top">
                <span className="source-tag">{sig.source}</span>
                <span className="ev-std">{sig.standard}</span>
                <span className={`status ${sig.status}`}>
-                  {sig.status === 'ok' ? 'Final' : sig.status === 'warn' ? 'Draft' : sig.status === 'risk' ? 'Urgent' : 'Published'}
+                  {sig.status === 'ok' ? t.signals.badgeFinal : sig.status === 'warn' ? t.signals.badgeDraft : sig.status === 'risk' ? t.signals.badgeUrgent : t.signals.badgePublished}
                </span>
              </div>
              <div className="ev-title">{sig.title}</div>
              <div className="ev-summary">{sig.summary}</div>
              <div className="ev-bottom">
                <span className="ev-date">{sig.date}</span>
-                <div className="ev-tags">{sig.tags.map(t => <span key={t} className="ev-tag">{t}</span>)}</div>
+                <div className="ev-tags">{sig.tags.map(tag => <span key={tag} className="ev-tag">{tag}</span>)}</div>
                <span className={`impact-dot impact-${sig.impact.toLowerCase()}`}>{sig.impact}</span>
              </div>
            </div>
@@ -262,7 +354,7 @@ export function PerceptionPage() {
          {!selected ? (
            <div className="analysis-empty">
              <div className="empty-ring" />
-              <p>Select a signal to run impact analysis</p>
+              <p>{t.signals.emptySelectSignal}</p>
            </div>
          ) : (
            <>
@@ -271,36 +363,176 @@ export function PerceptionPage() {
                  <span className="source-tag">{selected.source}</span>
                  <span className="ev-std">{selected.standard}</span>
                  <span className={`status ${selected.status}`}>
-                    {selected.status === 'risk' ? 'Urgent' : 'Published'}
+                    {selected.status === 'risk' ? t.signals.badgeUrgent : selected.status === 'warn' ? t.signals.badgeDraft : t.signals.badgePublished}
                  </span>
+                  {selectedFull?.change_summary && (
+                    <span className="status warn" style={{ marginLeft: 'auto' }}>CHANGED</span>
+                  )}
                </div>
                <div className="detail-title">{selected.title}</div>
                <p className="detail-summary">{selected.summary}</p>
                <div className="detail-actions">
                  {!streaming
-                    ? <button className="btn sm primary" onClick={runAnalysis}><Play size={12} />Run impact analysis</button>
-                    : <button className="btn sm" onClick={stopAnalysis}><Square size={12} />Stop</button>
+                    ? <button className="btn sm primary" onClick={runAnalysis}><Play size={12} />{t.signals.runAnalysis}</button>
+                    : <button className="btn sm" onClick={stopAnalysis}><Square size={12} />{t.signals.stopBtn}</button>
                  }
-                  <button className="btn sm"><ExternalLink size={12} />Source</button>
+                  {selected && (
+                    <a
+                      href={(selectedFull?.full_text_url as string) || '#'}
+                      target="_blank"
+                      rel="noopener noreferrer"
+                      className="btn sm"
+                    >
+                      <ExternalLink size={12} />{t.signals.sourceLink}
+                    </a>
+                  )}
                </div>
              </div>

-              <div className="card docs-card">
-                <div className="card-header">Affected documents</div>
-                {MOCK_DOCS.map(d => (
-                  <div key={d.name} className="doc-row">
-                    <span className="doc-score">{d.score}%</span>
-                    <div>
-                      <div className="doc-name">{d.name} <span className="doc-clause">{d.clause}</span></div>
-                      <div className="doc-snippet">{d.snippet}</div>
-                    </div>
-                  </div>
+              <div className="detail-tabs">
+                {(['overview', 'obligations', 'assessment', 'diff'] as const).map(tab => (
+                  <button
+                    key={tab}
+                    className={`detail-tab${detailTab === tab ? ' active' : ''}${tab === 'diff' && !selectedFull?.change_summary ? ' disabled' : ''}`}
+                    onClick={() => {
+                      if (tab !== 'diff' || selectedFull?.change_summary) {
+                        setPerceptionState(s => ({ ...s, detailTab: tab }));
+                      }
+                    }}
+                  >
+                    {tab === 'overview' ? t.signals.tabOverview : tab === 'obligations' ? t.signals.tabObligations : tab === 'assessment' ? t.signals.tabImpact : t.signals.tabChanges}
+                  </button>
                ))}
              </div>

+              {detailTab === 'overview' && (
+                <div className="card">
+                  <div className="card-header">{t.signals.cardScopeHeader}</div>
+                  <p className="detail-summary" style={{ marginTop: 8 }}>
+                    {(selectedFull?.scope as string) || selected.summary}
+                  </p>
+                  {selectedFull?.penalties && (
+                    <p style={{ fontSize: 13, color: 'var(--danger)', marginTop: 6 }}>
+                      ⚠ {selectedFull.penalties as string}
+                    </p>
+                  )}
+                </div>
+              )}
+
+              {detailTab === 'obligations' && (
+                <div className="card">
+                  <div className="card-header">{t.signals.cardObligationsHeader}</div>
+                  {(() => {
+                    const obs = (selectedFull?.obligations as Array<Record<string, string>>) || [];
+                    const deadlines = (selectedFull?.deadlines as Array<Record<string, string>>) || [];
+                    return obs.length === 0 && deadlines.length === 0 ? (
+                      <p className="detail-summary" style={{ marginTop: 8 }}>{t.signals.obligationsEmpty}</p>
+                    ) : (
+                      <>
+                        {obs.length > 0 && (
+                          <table style={{ width: '100%', fontSize: 13, borderCollapse: 'collapse', marginTop: 8 }}>
+                            <thead>
+                              <tr style={{ borderBottom: '1px solid var(--border)' }}>
+                                <th style={{ textAlign: 'left', padding: '4px 8px' }}>{t.signals.colObligationDesc}</th>
+                                <th style={{ textAlign: 'left', padding: '4px 8px', width: 80 }}>{t.signals.colSubject}</th>
+                                <th style={{ textAlign: 'left', padding: '4px 8px', width: 60 }}>{t.signals.colType}</th>
+                              </tr>
+                            </thead>
+                            <tbody>
+                              {obs.map((ob, i) => (
+                                <tr key={i} style={{ borderBottom: '1px solid var(--border-faint)' }}>
+                                  <td style={{ padding: '6px 8px' }}>{ob.text}</td>
+                                  <td style={{ padding: '6px 8px', color: 'var(--text-secondary)' }}>{ob.subject}</td>
+                                  <td style={{ padding: '6px 8px' }}>
+                                    <span className={`status ${ob.deontic === 'must' || ob.deontic === 'shall' ? 'risk' : ob.deontic === 'prohibited' ? 'risk' : 'info'}`}>
+                                      {ob.deontic}
+                                    </span>
+                                  </td>
+                                </tr>
+                              ))}
+                            </tbody>
+                          </table>
+                        )}
+                        {deadlines.length > 0 && (
+                          <div style={{ marginTop: 12 }}>
+                            <div className="card-header">{t.signals.colDeadline}</div>
+                            {deadlines.map((d, i) => (
+                              <div key={i} style={{ fontSize: 13, padding: '4px 0', display: 'flex', gap: 12 }}>
+                                <span style={{ fontWeight: 600, color: 'var(--danger)' }}>{d.date || t.signals.deadlinePending}</span>
+                                <span style={{ color: 'var(--text-secondary)' }}>{d.description}</span>
+                              </div>
+                            ))}
+                          </div>
+                        )}
+                      </>
+                    );
+                  })()}
+                </div>
+              )}
+
+              {detailTab === 'assessment' && (
+                <div className="card docs-card">
+                  <div className="card-header">{t.signals.cardAffectedDocs}</div>
+                  {(() => {
+                    const docs = (selectedFull?.affected_docs as Array<Record<string, unknown>>);
+                    const displayDocs = docs && docs.length > 0 ? docs : [];
+                    return displayDocs.length === 0
+                      ? <p className="detail-summary" style={{ marginTop: 8 }}>{t.signals.noAffectedDocs}</p>
+                      : displayDocs.map((d, i) => (
+                          <div key={i} className="doc-row">
+                            <span className="doc-score">{Math.round(Number(d.score ?? 0) * 100)}%</span>
+                            <div>
+                              <div className="doc-name">
+                                {String(d.doc_name || '')}
+                                <span className="doc-clause">{String(d.key_clauses || d.clause || '')}</span>
+                              </div>
+                              {d.snippet && <div className="doc-snippet">{String(d.snippet)}</div>}
+                              {d.recommendation && (
+                                <div style={{ fontSize: 12, color: 'var(--accent)', marginTop: 2 }}>→ {String(d.recommendation)}</div>
+                              )}
+                            </div>
+                          </div>
+                        ));
+                  })()}
+                </div>
+              )}
+
+              {detailTab === 'diff' && selectedFull?.change_summary && (
+                <div className="card">
+                  <div className="card-header">{t.signals.diffCardHeader}</div>
+                  <p style={{ fontSize: 13, color: 'var(--text-secondary)', marginTop: 8 }}>
+                    {selectedFull.change_summary as string}
+                  </p>
+                  {(() => {
+                    const sections = (selectedFull.changed_sections as Array<Record<string, unknown>>) || [];
+                    return sections.map((s, i) => (
+                      <div key={i} style={{ marginTop: 12, borderTop: '1px solid var(--border)', paddingTop: 10 }}>
+                        <div style={{ display: 'flex', gap: 8, marginBottom: 6 }}>
+                          <span className={`status ${s.change_type === 'tightened' || s.change_type === 'added' ? 'risk' : s.change_type === 'removed' ? 'warn' : 'info'}`}>
+                            {String(s.change_type)}
+                          </span>
+                          <span style={{ fontSize: 12, color: 'var(--text-secondary)' }}>cosine: {String(s.similarity)}</span>
+                        </div>
+                        <div style={{ display: 'grid', gridTemplateColumns: '1fr 1fr', gap: 8, fontSize: 12 }}>
+                          <div style={{ background: 'var(--danger-bg)', padding: 8, borderRadius: 4 }}>
+                            <div style={{ fontWeight: 600, marginBottom: 4 }}>{t.signals.diffOld}</div>
+                            {String(s.old_text || '')}
+                          </div>
+                          <div style={{ background: 'var(--success-bg)', padding: 8, borderRadius: 4 }}>
+                            <div style={{ fontWeight: 600, marginBottom: 4 }}>{t.signals.diffNew}</div>
+                            {String(s.new_text || '')}
+                          </div>
+                        </div>
+                        {s.summary && <p style={{ fontSize: 12, marginTop: 6, color: 'var(--text-secondary)' }}>{String(s.summary)}</p>}
+                      </div>
+                    ));
+                  })()}
+                </div>
+              )}
+
              {(aiOutput || streaming) && (
                <div className="card ai-card">
-                  <div className="card-header">AI Impact Analysis</div>
+                  <div className="card-header">{t.signals.cardAIImpact}</div>
                  <div className="ai-output">
                    {aiOutput}
                    {streaming && <span className="blink-cursor">▋</span>}
@@ -314,7 +546,7 @@ export function PerceptionPage() {

      <footer className="page-footer">
        <div className="live-dot" />
-        <span>Live feed · Regulation Hub</span>
+        <span>{t.signals.footerText}</span>
      </footer>
    </div>
  );
--- a/frontend/src/pages/RagChat/RagChatPage.tsx
+++ b/frontend/src/pages/RagChat/RagChatPage.tsx
@@ -1,27 +1,18 @@
-import { useState, useRef, useEffect, useCallback } from 'react';
+import { useRef, useEffect, useCallback, useState } from 'react';
 import { Topbar } from '../../components/layout/Topbar';
 import { Send, Download } from 'lucide-react';
+import { usePageState } from '../../contexts';
+import type { RagCitation } from '../../contexts';
+import { useLanguage } from '../../contexts/LanguageContext';

-interface Message {
-  id: string;
-  role: 'user' | 'assistant';
-  text: string;
-  // citation indices mentioned in this assistant message (1-based, matching citations array)
-  citationRefs?: number[];
-}
-
-interface Citation {
-  index: number;   // 1-based, matches [N] markers in text
-  score: number;   // 0–100 display percentage
-  name: string;    // doc_name
-  clause: string;  // section_title or clause
-  snippet: string; // preview text
-  docId?: string;
+const TOKEN_KEY = 'auth_token';
+function authHeader(): Record<string, string> {
+  const t = localStorage.getItem(TOKEN_KEY);
+  return t ? { Authorization: `Bearer ${t}` } : {};
 }

 // Map a raw source doc from the backend "retrieved" event to our Citation shape.
-// Backend fields: { id, score(0-1), preview, doc_name, clause, doc_id }
-function mapSource(s: Record<string, unknown>, idx: number): Citation {
+function mapSource(s: Record<string, unknown>, idx: number): RagCitation {
  const rawScore = typeof s.score === 'number' ? s.score : 0;
  const displayScore = rawScore <= 1 ? Math.round(rawScore * 100) : Math.round(rawScore);
  return {
@@ -67,27 +58,24 @@ const MOCK_QUICK = [
 ];

 export function RagChatPage() {
-  const [messages, setMessages] = useState<Message[]>([
-    {
-      id: 'init', role: 'assistant',
-      text: 'Hello! I can answer questions about your indexed regulations and compliance documents. Try asking about EU AI Act requirements, MIIT rules, or ISO/SAE 21434 scope.',
-    }
-  ]);
-  const [quickPrompts, setQuickPrompts] = useState<string[]>(MOCK_QUICK);
-  const [input, setInput] = useState('');
-  const [streaming, setStreaming] = useState(false);
-  const [citations, setCitations] = useState<Citation[]>([]);
+  // All persistent state lives in PageStateContext — survives route changes
+  const { ragState, setRagState, ragStreamingRef, ragAbortRef } = usePageState();
+  const { t } = useLanguage();
+  const { messages, citations, sessionId, inputDraft } = ragState;
+
+  // Local-only UI state: highlighted citation and streaming indicator
+  // These are fine to reset on navigation since they're transient UI feedback
  const [highlightedCit, setHighlightedCit] = useState<number | null>(null);
-  const [sessionId, setSessionId] = useState<string | null>(null);
+  const [streaming, setStreaming] = useState(ragStreamingRef.current);
+  const [quickPrompts, setQuickPrompts] = useState<string[]>(MOCK_QUICK);

  const bottomRef = useRef<HTMLDivElement>(null);
  const citRailRef = useRef<HTMLDivElement>(null);
  const citItemRefs = useRef<Record<number, HTMLDivElement | null>>({});
-  const abortRef = useRef<AbortController | null>(null);

-  // Fetch quick questions from backend on mount
+  // Fetch quick questions from backend on mount (only once per session)
  useEffect(() => {
-    fetch('/api/v1/rag/quick-questions')
+    fetch('/api/v1/rag/quick-questions', { headers: authHeader() })
      .then(r => r.json())
      .then(d => {
        if (Array.isArray(d?.questions) && d.questions.length > 0) {
@@ -109,26 +97,33 @@ export function RagChatPage() {
    if (el) {
      el.scrollIntoView({ behavior: 'smooth', block: 'nearest' });
    }
-    // Clear highlight after 3s
    setTimeout(() => setHighlightedCit(h => h === n ? null : h), 3000);
  }, []);

  async function send(text?: string) {
-    const q = (text ?? input).trim();
-    if (!q || streaming) return;
-    setInput('');
-
-    const userMsg: Message = { id: Date.now().toString(), role: 'user', text: q };
-    setMessages(m => [...m, userMsg]);
+    const q = (text ?? inputDraft).trim();
+    if (!q || ragStreamingRef.current) return;
+    setRagState(s => ({ ...s, inputDraft: '' }));

+    const userMsgId = Date.now().toString();
    const assistantId = (Date.now() + 1).toString();
-    setMessages(m => [...m, { id: assistantId, role: 'assistant', text: '' }]);
+
+    setRagState(s => ({
+      ...s,
+      messages: [
+        ...s.messages,
+        { id: userMsgId, role: 'user', text: q },
+        { id: assistantId, role: 'assistant', text: '' },
+      ],
+      citations: [],
+    }));
+
+    ragStreamingRef.current = true;
    setStreaming(true);
-    setCitations([]);
    setHighlightedCit(null);

    const ctrl = new AbortController();
-    abortRef.current = ctrl;
+    ragAbortRef.current = ctrl;

    try {
      const body: Record<string, unknown> = { query: q, top_k: 5 };
@@ -136,7 +131,7 @@ export function RagChatPage() {

      const res = await fetch('/api/v1/rag/chat', {
        method: 'POST',
-        headers: { 'Content-Type': 'application/json' },
+        headers: { 'Content-Type': 'application/json', ...authHeader() },
        body: JSON.stringify(body),
        signal: ctrl.signal,
      });
@@ -145,14 +140,13 @@ export function RagChatPage() {
      const reader = res.body.getReader();
      const dec = new TextDecoder();
      let buffer = '';
-      const newCitations: Citation[] = [];
+      const newCitations: RagCitation[] = [];

      while (true) {
        const { done, value } = await reader.read();
        if (done) break;
        buffer += dec.decode(value, { stream: true });

-        // SSE blocks separated by double newline
        const blocks = buffer.split('\n\n');
        buffer = blocks.pop() ?? '';

@@ -165,56 +159,62 @@ export function RagChatPage() {
            const j = JSON.parse(raw);

            if (j.type === 'session') {
-              // Backend assigned a session_id — persist for next request
-              if (j.session_id) setSessionId(j.session_id);
+              if (j.session_id) setRagState(s => ({ ...s, sessionId: j.session_id }));

            } else if (j.type === 'retrieved' && Array.isArray(j.docs)) {
-              // Sources arrive before the answer starts
              const mapped = j.docs.map((d: Record<string, unknown>, i: number) => mapSource(d, i + 1));
              newCitations.push(...mapped);
-              setCitations([...mapped]);
+              setRagState(s => ({ ...s, citations: [...mapped] }));

            } else if (j.type === 'chunk' && j.text) {
-              setMessages(m => m.map(msg =>
-                msg.id === assistantId
-                  ? { ...msg, text: msg.text + (j.text as string) }
-                  : msg
-              ));
-
-            } else if (j.type === 'status') {
-              // Status message (e.g. "找到N条相关法规…") — could show in UI if desired
-              // For now we ignore it to keep the bubble clean
+              setRagState(s => ({
+                ...s,
+                messages: s.messages.map(msg =>
+                  msg.id === assistantId
+                    ? { ...msg, text: msg.text + (j.text as string) }
+                    : msg
+                ),
+              }));

            } else if (j.type === 'done') {
-              // Extract which citation numbers appear in the final answer
-              setMessages(m => m.map(msg => {
-                if (msg.id !== assistantId) return msg;
-                const refs = [...new Set(
-                  [...msg.text.matchAll(/\[(\d+)\]/g)].map(r => parseInt(r[1], 10))
-                )].filter(n => n >= 1 && n <= newCitations.length);
-                return { ...msg, citationRefs: refs };
+              setRagState(s => ({
+                ...s,
+                messages: s.messages.map(msg => {
+                  if (msg.id !== assistantId) return msg;
+                  const refs = [...new Set(
+                    [...msg.text.matchAll(/\[(\d+)\]/g)].map(r => parseInt(r[1], 10))
+                  )].filter(n => n >= 1 && n <= newCitations.length);
+                  return { ...msg, citationRefs: refs };
+                }),
              }));
              break;

            } else if (j.type === 'error') {
-              setMessages(m => m.map(msg =>
-                msg.id === assistantId
-                  ? { ...msg, text: `Error: ${j.text ?? 'Unknown error'}` }
-                  : msg
-              ));
+              setRagState(s => ({
+                ...s,
+                messages: s.messages.map(msg =>
+                  msg.id === assistantId
+                    ? { ...msg, text: `Error: ${j.text ?? 'Unknown error'}` }
+                    : msg
+                ),
+              }));
            }
          } catch { /* malformed JSON chunk, skip */ }
        }
      }
    } catch (e: unknown) {
      if (e instanceof Error && e.name !== 'AbortError') {
-        setMessages(m => m.map(msg =>
-          msg.id === assistantId
-            ? { ...msg, text: 'Could not reach the RAG API. Please check the backend.' }
-            : msg
-        ));
+        setRagState(s => ({
+          ...s,
+          messages: s.messages.map(msg =>
+            msg.id === assistantId
+              ? { ...msg, text: t.ragchat.apiError }
+              : msg
+          ),
+        }));
      }
    } finally {
+      ragStreamingRef.current = false;
      setStreaming(false);
    }
  }
@@ -224,7 +224,7 @@ export function RagChatPage() {
  return (
    <div className="chat-page">
      <Topbar
-        title="Regulation Q&A"
+        title={t.ragchat.topbarTitle}
        actions={
          <button
            className="btn sm"
@@ -236,7 +236,7 @@ export function RagChatPage() {
              URL.revokeObjectURL(url);
            }}
          >
-            <Download size={13} />Export chat
+            <Download size={13} />{t.ragchat.exportBtn}
          </button>
        }
      />
@@ -244,7 +244,7 @@ export function RagChatPage() {
      <div className="chat-body">
        {/* ── History pane ── */}
        <div className="history-pane">
-          <div className="history-header">Quick prompts</div>
+          <div className="history-header">{t.ragchat.quickPromptsHeader}</div>
          {quickPrompts.map(q => (
            <button key={q} className="quick-item" onClick={() => send(q)}>
              {q}
@@ -284,16 +284,16 @@ export function RagChatPage() {
            <div className="composer-row">
              <textarea
                className="composer-input"
-                placeholder="Ask about your regulations…"
-                value={input}
-                onChange={e => setInput(e.target.value)}
+                placeholder={t.ragchat.inputPlaceholder}
+                value={inputDraft}
+                onChange={e => setRagState(s => ({ ...s, inputDraft: e.target.value }))}
                onKeyDown={e => { if (e.key === 'Enter' && !e.shiftKey) { e.preventDefault(); send(); } }}
                rows={2}
              />
              <button
                className="btn primary"
                onClick={() => send()}
-                disabled={!input.trim() || streaming}
+                disabled={!inputDraft.trim() || streaming}
              >
                <Send size={14} />
              </button>
@@ -304,11 +304,11 @@ export function RagChatPage() {
        {/* ── Citation rail ── */}
        <div className="citation-rail" ref={citRailRef}>
          <div className="citation-header">
-            Sources {citations.length > 0 && `(${citations.length})`}
+            {t.ragchat.citationsHeader}{citations.length > 0 && ` (${citations.length})`}
          </div>
          {citations.length === 0 && (
            <p style={{ padding: '12px 16px', fontSize: 12, color: 'var(--muted)', lineHeight: 1.5 }}>
-              Citations will appear here after a response is generated.
+              {t.ragchat.citationsEmpty}
            </p>
          )}
          {citations.map(c => (
--- a/frontend/src/pages/Status/StatusPage.tsx
+++ b/frontend/src/pages/Status/StatusPage.tsx
@@ -2,6 +2,13 @@ import { useState, useEffect } from 'react';
 import { Topbar } from '../../components/layout/Topbar';
 import { Search, Upload, Download, RefreshCw, CheckCircle, XCircle, AlertTriangle, Info } from 'lucide-react';
 import { UploadModal } from '../Docs/UploadModal';
+import { useLanguage } from '../../contexts/LanguageContext';
+
+const TOKEN_KEY = 'auth_token';
+function authHeader(): Record<string, string> {
+  const t = localStorage.getItem(TOKEN_KEY);
+  return t ? { Authorization: `Bearer ${t}` } : {};
+}

 // ── API types ──────────────────────────────────────────────────────────────
 interface Stats {
@@ -42,13 +49,14 @@ function StatusIcon({ status }: { status: 'ok' | 'error' | 'warn' | 'info' }) {
 }

 function ServiceRow({ name, status, detail }: { name: string; status: 'ok' | 'error' | 'warn' | 'info'; detail?: string }) {
+  const { t } = useLanguage();
  return (
    <div className="service-row">
      <StatusIcon status={status} />
      <span className="service-name" style={{ marginLeft: 8 }}>{name}</span>
      {detail && <span style={{ fontSize: 11, color: 'var(--muted)', marginLeft: 6 }}>{detail}</span>}
      <span className={`status ${status}`} style={{ marginLeft: 'auto' }}>
-        {status === 'ok' ? 'Online' : status === 'error' ? 'Error' : status === 'warn' ? 'Degraded' : 'Unknown'}
+        {status === 'ok' ? t.status.badgeOnline : status === 'error' ? t.status.badgeError : status === 'warn' ? t.status.badgeDegraded : t.status.badgeUnknown}
      </span>
    </div>
  );
@@ -67,6 +75,7 @@ function ConfigRow({ label, value }: { label: string; value: string | number | n

 // ── Main component ─────────────────────────────────────────────────────────
 export function StatusPage() {
+  const { t } = useLanguage();
  const [stats, setStats] = useState<Stats | null>(null);
  const [health, setHealth] = useState<Health | null>(null);
  const [config, setConfig] = useState<Config | null>(null);
@@ -83,9 +92,9 @@ export function StatusPage() {

    // Fetch all three endpoints in parallel
    Promise.allSettled([
-      fetch('/api/v1/status/stats').then(r => r.json()),
-      fetch('/api/v1/status/health').then(r => r.json()),
-      fetch('/api/v1/status/config').then(r => r.json()),
+      fetch('/api/v1/status/stats', { headers: authHeader() }).then(r => r.json()),
+      fetch('/api/v1/status/health', { headers: authHeader() }).then(r => r.json()),
+      fetch('/api/v1/status/config', { headers: authHeader() }).then(r => r.json()),
    ]).then(([statsRes, healthRes, configRes]) => {
      if (statsRes.status === 'fulfilled') setStats(statsRes.value);
      else setStats({ documents_total: 0, documents_indexed: 0, documents_failed: 0, chunks_total: 0 });
@@ -130,21 +139,21 @@ export function StatusPage() {
  return (
    <div className="status-page">
      <Topbar
-        title="System Status"
+        title={t.status.topbarTitle}
        actions={
          <>
            <div className="search-box">
              <Search size={13} />
-              <input placeholder="Search..." />
+              <input placeholder={t.status.searchPlaceholder} />
            </div>
            <button className="btn sm" onClick={handleExport}>
-              <Download size={13} />Export
+              <Download size={13} />{t.status.exportBtn}
            </button>
            <button className="btn sm" onClick={() => setRefreshKey(k => k + 1)}>
-              <RefreshCw size={13} />Refresh
+              <RefreshCw size={13} />{t.status.refreshBtn}
            </button>
            <button className="btn sm primary" onClick={() => setShowUpload(true)}>
-              <Upload size={13} />New upload
+              <Upload size={13} />{t.status.newUploadBtn}
            </button>
          </>
        }
@@ -156,26 +165,26 @@ export function StatusPage() {
        <div className="stats-grid">
          <div className="stat-cell">
            {loading ? <span className="loading-shimmer stat-value-loading" /> : <div className="stat-value">{stats?.documents_total ?? '—'}</div>}
-            <div className="stat-label">Documents total</div>
+            <div className="stat-label">{t.status.statTotal}</div>
          </div>
          <div className="stat-cell">
            {loading ? <span className="loading-shimmer stat-value-loading" /> : <div className="stat-value">{stats?.documents_indexed ?? '—'}</div>}
-            <div className="stat-label">Indexed</div>
+            <div className="stat-label">{t.status.statIndexed}</div>
          </div>
          <div className="stat-cell danger">
            {loading ? <span className="loading-shimmer stat-value-loading" /> : <div className="stat-value">{stats?.documents_failed ?? '—'}</div>}
-            <div className="stat-label">Failed</div>
+            <div className="stat-label">{t.status.statFailed}</div>
          </div>
          <div className="stat-cell">
            {loading ? <span className="loading-shimmer stat-value-loading" /> : <div className="stat-value">{stats?.chunks_total?.toLocaleString() ?? '—'}</div>}
-            <div className="stat-label">Vector chunks</div>
+            <div className="stat-label">{t.status.statChunks}</div>
          </div>
        </div>

        {/* Indexed progress bar */}
        {!loading && stats && stats.documents_total > 0 && (
          <div style={{ padding: '0 0 20px', display: 'flex', alignItems: 'center', gap: 12 }}>
-            <span style={{ fontSize: 12, color: 'var(--muted)', whiteSpace: 'nowrap' }}>Index coverage</span>
+            <span style={{ fontSize: 12, color: 'var(--muted)', whiteSpace: 'nowrap' }}>{t.status.statCoverage}</span>
            <div style={{ flex: 1, height: 6, background: 'var(--border)', borderRadius: 3, overflow: 'hidden' }}>
              <div style={{
                height: '100%', borderRadius: 3,
@@ -197,7 +206,7 @@ export function StatusPage() {
            {/* System health */}
            <div className="card">
              <div className="card-header" style={{ display: 'flex', alignItems: 'center', justifyContent: 'space-between' }}>
-                <span>System health</span>
+                <span>{t.status.cardHealth}</span>
                {lastRefresh && (
                  <span style={{ fontSize: 11, color: 'var(--muted)', fontWeight: 400 }}>
                    Updated {lastRefresh.toLocaleTimeString(undefined, { hour: '2-digit', minute: '2-digit', second: '2-digit' })}
@@ -225,12 +234,12 @@ export function StatusPage() {
                  <ServiceRow
                    name="BM25 keyword retriever"
                    status={health.bm25.available ? 'ok' : 'warn'}
-                    detail={health.bm25.available ? undefined : 'Not loaded'}
+                    detail={health.bm25.available ? undefined : t.status.serviceNotLoaded}
                  />
                  <ServiceRow
                    name={`Reranker${health.reranker.model ? ` (${health.reranker.model})` : ''}`}
                    status={health.reranker.enabled ? 'ok' : 'info'}
-                    detail={health.reranker.enabled ? 'Enabled' : 'Disabled'}
+                    detail={health.reranker.enabled ? t.status.serviceEnabled : t.status.serviceDisabled}
                  />
                  <ServiceRow
                    name="Active sessions"
@@ -240,7 +249,7 @@ export function StatusPage() {
                </>
              ) : (
                <div style={{ padding: '12px 0', color: 'var(--muted)', fontSize: 13 }}>
-                  Could not reach health endpoint
+                  {t.status.healthEndpointError}
                </div>
              )}
            </div>
@@ -251,7 +260,7 @@ export function StatusPage() {
                onClick={() => setConfigOpen(v => !v)}
                style={{ width: '100%', display: 'flex', alignItems: 'center', justifyContent: 'space-between', background: 'none', border: 'none', cursor: 'pointer', padding: 0 }}
              >
-                <div className="card-header" style={{ margin: 0, padding: 0, flex: 1, textAlign: 'left' }}>System configuration</div>
+                <div className="card-header" style={{ margin: 0, padding: 0, flex: 1, textAlign: 'left' }}>{t.status.cardConfig}</div>
                <span style={{ fontSize: 11, color: 'var(--muted)', transform: configOpen ? 'rotate(180deg)' : 'none', transition: 'transform 0.2s' }}>▾</span>
              </button>

@@ -259,17 +268,17 @@ export function StatusPage() {
                <div style={{ marginTop: 12 }}>
                  {config ? (
                    <>
-                      <ConfigRow label="LLM provider" value={config.llm_provider} />
-                      <ConfigRow label="LLM model" value={config.llm_model} />
-                      <ConfigRow label="Embedding model" value={config.embedding_model} />
-                      <ConfigRow label="Embedding dim" value={config.embedding_dim} />
-                      <ConfigRow label="Milvus collection" value={config.milvus_collection} />
-                      <ConfigRow label="Parser backend" value={config.parser_backend} />
-                      <ConfigRow label="Chunk backend" value={config.chunk_backend} />
-                      <ConfigRow label="Parser failure mode" value={config.parser_failure_mode} />
+                      <ConfigRow label={t.status.labelLLMProvider} value={config.llm_provider} />
+                      <ConfigRow label={t.status.labelLLMModel} value={config.llm_model} />
+                      <ConfigRow label={t.status.labelEmbeddingModel} value={config.embedding_model} />
+                      <ConfigRow label={t.status.labelEmbeddingDim} value={config.embedding_dim} />
+                      <ConfigRow label={t.status.labelMilvusCollection} value={config.milvus_collection} />
+                      <ConfigRow label={t.status.labelParserBackend} value={config.parser_backend} />
+                      <ConfigRow label={t.status.labelChunkBackend} value={config.chunk_backend} />
+                      <ConfigRow label={t.status.labelParserFailureMode} value={config.parser_failure_mode} />
                    </>
                  ) : (
-                    <div style={{ color: 'var(--muted)', fontSize: 13 }}>Could not load config</div>
+                    <div style={{ color: 'var(--muted)', fontSize: 13 }}>{t.status.configLoadError}</div>
                  )}
                </div>
              )}
@@ -280,7 +289,7 @@ export function StatusPage() {

            {/* Document breakdown */}
            <div className="card">
-              <div className="card-header">Document breakdown</div>
+              <div className="card-header">{t.status.cardBreakdown}</div>
              {loading ? (
                <div style={{ display: 'flex', flexDirection: 'column', gap: 8 }}>
                  {[1, 2, 3].map(i => <div key={i} className="loading-shimmer" style={{ height: 24, borderRadius: 4 }} />)}
@@ -288,9 +297,9 @@ export function StatusPage() {
              ) : stats ? (
                <>
                  {[
-                    { label: 'Indexed', value: stats.documents_indexed, total: stats.documents_total, color: 'var(--ok)' },
-                    { label: 'Processing / Parsed', value: stats.documents_total - stats.documents_indexed - stats.documents_failed, total: stats.documents_total, color: 'var(--warn)' },
-                    { label: 'Failed', value: stats.documents_failed, total: stats.documents_total, color: 'var(--danger)' },
+                    { label: t.status.breakdownIndexed, value: stats.documents_indexed, total: stats.documents_total, color: 'var(--ok)' },
+                    { label: t.status.breakdownProcessing, value: stats.documents_total - stats.documents_indexed - stats.documents_failed, total: stats.documents_total, color: 'var(--warn)' },
+                    { label: t.status.breakdownFailed, value: stats.documents_failed, total: stats.documents_total, color: 'var(--danger)' },
                  ].map(row => {
                    const pct = stats.documents_total > 0 ? Math.round((Math.max(0, row.value) / stats.documents_total) * 100) : 0;
                    return (
@@ -306,7 +315,7 @@ export function StatusPage() {
                    );
                  })}
                  <div style={{ marginTop: 8, paddingTop: 8, borderTop: '1px solid var(--border)', display: 'flex', justifyContent: 'space-between', fontSize: 12 }}>
-                    <span style={{ color: 'var(--muted)' }}>Total vector chunks</span>
+                    <span style={{ color: 'var(--muted)' }}>{t.status.totalChunks}</span>
                    <span style={{ fontFamily: 'var(--font-mono)', fontWeight: 600 }}>{stats.chunks_total.toLocaleString()}</span>
                  </div>
                </>
@@ -316,26 +325,26 @@ export function StatusPage() {
            {/* Sessions & reranker quick facts */}
            {health && (
              <div className="card">
-                <div className="card-header">Runtime info</div>
+                <div className="card-header">{t.status.cardRuntime}</div>
                <div style={{ display: 'flex', flexDirection: 'column', gap: 6 }}>
                  <div style={{ display: 'flex', justifyContent: 'space-between', fontSize: 12, padding: '4px 0' }}>
-                    <span style={{ color: 'var(--muted)' }}>Active chat sessions</span>
+                    <span style={{ color: 'var(--muted)' }}>{t.status.labelActiveSessions}</span>
                    <span style={{ fontFamily: 'var(--font-mono)' }}>{health.sessions.active}</span>
                  </div>
                  <div style={{ display: 'flex', justifyContent: 'space-between', fontSize: 12, padding: '4px 0' }}>
-                    <span style={{ color: 'var(--muted)' }}>Session capacity</span>
+                    <span style={{ color: 'var(--muted)' }}>{t.status.labelSessionCapacity}</span>
                    <span style={{ fontFamily: 'var(--font-mono)' }}>{health.sessions.max}</span>
                  </div>
                  <div style={{ display: 'flex', justifyContent: 'space-between', fontSize: 12, padding: '4px 0' }}>
-                    <span style={{ color: 'var(--muted)' }}>Cross-encoder reranker</span>
+                    <span style={{ color: 'var(--muted)' }}>{t.status.labelReranker}</span>
                    <span style={{ fontFamily: 'var(--font-mono)', color: health.reranker.enabled ? 'var(--ok)' : 'var(--muted)' }}>
-                      {health.reranker.enabled ? (health.reranker.model ?? 'Enabled') : 'Disabled'}
+                      {health.reranker.enabled ? (health.reranker.model ?? t.status.serviceEnabled) : t.status.serviceDisabled}
                    </span>
                  </div>
                  <div style={{ display: 'flex', justifyContent: 'space-between', fontSize: 12, padding: '4px 0' }}>
-                    <span style={{ color: 'var(--muted)' }}>BM25 hybrid retrieval</span>
+                    <span style={{ color: 'var(--muted)' }}>{t.status.labelBM25}</span>
                    <span style={{ fontFamily: 'var(--font-mono)', color: health.bm25.available ? 'var(--ok)' : 'var(--muted)' }}>
-                      {health.bm25.available ? 'Active' : 'Unavailable'}
+                      {health.bm25.available ? t.status.statusActive : t.status.statusUnavailable}
                    </span>
                  </div>
                </div>
@@ -347,7 +356,7 @@ export function StatusPage() {

      <footer className="page-footer">
        <div className="live-dot" />
-        <span>Regulation Hub · T-Systems AI · {health ? (health.milvus.status === 'ok' && health.minio.connected ? 'All systems operational' : 'Degraded') : 'Checking…'}</span>
+        <span>Regulation Hub · T-Systems AI · {health ? (health.milvus.status === 'ok' && health.minio.connected ? t.status.footerAllOk : t.status.footerDegraded) : t.status.footerChecking}</span>
      </footer>

      {showUpload && <UploadModal onClose={() => setShowUpload(false)} />}
--- a/frontend/src/router/AppRouter.tsx
+++ b/frontend/src/router/AppRouter.tsx
@@ -1,5 +1,8 @@
-import { BrowserRouter, Routes, Route } from 'react-router-dom';
+import { useEffect } from 'react';
+import { BrowserRouter, Navigate, Routes, Route } from 'react-router-dom';
+import { useAuth } from '../contexts';
 import { AppShell } from '../components/layout/AppShell';
+import { LoginPage } from '../pages/Login/LoginPage';
 import { OverviewPage } from '../pages/Overview/OverviewPage';
 import { StatusPage } from '../pages/Status/StatusPage';
 import { PerceptionPage } from '../pages/Perception/PerceptionPage';
@@ -7,11 +10,47 @@ import { DocsPage } from '../pages/Docs/DocsPage';
 import { CompliancePage } from '../pages/Compliance/CompliancePage';
 import { RagChatPage } from '../pages/RagChat/RagChatPage';

+/** Redirect to /login when not authenticated. */
+function RequireAuth({ children }: { children: React.ReactNode }) {
+  const { token, loading } = useAuth();
+  if (loading) return null; // wait for localStorage token validation
+  if (!token) return <Navigate to="/login" replace />;
+  return <>{children}</>;
+}
+
+/** Redirect to / when already authenticated. */
+function GuestOnly({ children }: { children: React.ReactNode }) {
+  const { token, loading } = useAuth();
+  if (loading) return null;
+  if (token) return <Navigate to="/" replace />;
+  return <>{children}</>;
+}
+
 export function AppRouter() {
+  const { logout } = useAuth();
+
+  // Listen for global 401 events emitted by the API layer.
+  useEffect(() => {
+    function onUnauthorized() { logout(); }
+    window.addEventListener('auth:unauthorized', onUnauthorized);
+    return () => window.removeEventListener('auth:unauthorized', onUnauthorized);
+  }, [logout]);
+
  return (
    <BrowserRouter>
      <Routes>
-        <Route path="/" element={<AppShell />}>
+        {/* Public route */}
+        <Route path="/login" element={<GuestOnly><LoginPage /></GuestOnly>} />
+
+        {/* Protected routes */}
+        <Route
+          path="/"
+          element={
+            <RequireAuth>
+              <AppShell />
+            </RequireAuth>
+          }
+        >
          <Route index element={<OverviewPage />} />
          <Route path="status" element={<StatusPage />} />
          <Route path="signals" element={<PerceptionPage />} />
@@ -19,6 +58,9 @@ export function AppRouter() {
          <Route path="compliance" element={<CompliancePage />} />
          <Route path="chat" element={<RagChatPage />} />
        </Route>
+
+        {/* Catch-all */}
+        <Route path="*" element={<Navigate to="/" replace />} />
      </Routes>
    </BrowserRouter>
  );
--- a/frontend/src/styles/globals.css
+++ b/frontend/src/styles/globals.css
@@ -150,10 +150,10 @@ body {
  display: inline-flex;
  align-items: center;
  gap: 6px;
-  height: 32px;
-  padding: 0 12px;
+  height: 34px;
+  padding: 0 14px;
  border-radius: var(--radius-sm);
-  font-size: 13px;
+  font-size: 14px;
  font-family: var(--font-body);
  font-weight: 500;
  cursor: pointer;
@@ -170,7 +170,7 @@ body {
  border-color: var(--accent);
 }
 .btn.primary:hover { background: var(--accent-hover); border-color: var(--accent-hover); }
-.btn.sm { height: 28px; font-size: 12px; padding: 0 10px; }
+.btn.sm { height: 30px; font-size: 13px; padding: 0 11px; }
 .btn:disabled { opacity: 0.5; cursor: not-allowed; }

 /* ── App Shell ──────────────────────────────────── */
@@ -216,14 +216,14 @@ body {
  object-fit: contain;
  flex-shrink: 0;
 }
-.brand-name { font-size: 13px; font-weight: 700; font-family: var(--font-display); color: var(--rail-fg); }
-.brand-sub  { font-size: 10px; color: var(--rail-muted); }
+.brand-name { font-size: 15px; font-weight: 700; font-family: var(--font-display); color: var(--rail-fg); }
+.brand-sub  { font-size: 12px; color: var(--rail-muted); }

 .sidebar-nav { flex: 1; overflow-y: auto; padding: 12px 0; }

 .nav-group { margin-bottom: 4px; }
 .nav-group-label {
-  font-size: 10px; font-weight: 700;
+  font-size: 11px; font-weight: 700;
  text-transform: uppercase; letter-spacing: 0.06em;
  color: var(--rail-muted);
  padding: 8px 16px 4px;
@@ -231,10 +231,10 @@ body {

 .nav-item {
  display: flex; align-items: center; gap: 9px;
-  height: 36px; padding: 0 14px 0 16px;
+  height: 38px; padding: 0 14px 0 16px;
  text-decoration: none;
  color: var(--rail-fg);
-  font-size: 13px;
+  font-size: 14px;
  border-left: 3px solid transparent;
  transition: background 0.12s, color 0.12s;
  position: relative;
@@ -261,14 +261,14 @@ body {
 }
 .sidebar-user { display: flex; align-items: center; gap: 8px; flex: 1; min-width: 0; }
 .user-avatar {
-  width: 28px; height: 28px;
+  width: 30px; height: 30px;
  background: var(--accent-dim); color: var(--accent);
  border-radius: 50%;
  display: flex; align-items: center; justify-content: center;
-  font-size: 10px; font-weight: 700; flex-shrink: 0;
+  font-size: 11px; font-weight: 700; flex-shrink: 0;
 }
-.user-name { font-size: 12px; font-weight: 600; color: var(--rail-fg); }
-.user-role { font-size: 10px; color: var(--rail-muted); }
+.user-name { font-size: 13px; font-weight: 600; color: var(--rail-fg); }
+.user-role { font-size: 11px; color: var(--rail-muted); }

 .theme-btn {
  width: 28px; height: 28px;
@@ -297,8 +297,8 @@ body {
  z-index: 10;
 }
 .topbar-left { display: flex; align-items: baseline; gap: 10px; min-width: 0; }
-.topbar-title { font-size: 15px; font-weight: 700; font-family: var(--font-display); color: var(--fg); }
-.topbar-sub { font-size: 11px; color: var(--muted); font-family: var(--font-mono); }
+.topbar-title { font-size: 17px; font-weight: 700; font-family: var(--font-display); color: var(--fg); }
+.topbar-sub { font-size: 12px; color: var(--muted); font-family: var(--font-mono); }
 .topbar-actions { display: flex; align-items: center; gap: 8px; }

 /* ── Page Content ───────────────────────────────── */
@@ -309,13 +309,13 @@ body {
 }

 /* ── Search Box ─────────────────────────────────── */
-.search-box { display: flex; align-items: center; gap: 6px; height: 32px; padding: 0 10px; border: 1px solid var(--border); border-radius: var(--radius-sm); background: var(--bg); font-size: 13px; color: var(--muted); }
-.search-box input { border: none; background: transparent; outline: none; font-size: 13px; color: var(--fg); width: 160px; }
+.search-box { display: flex; align-items: center; gap: 6px; height: 34px; padding: 0 10px; border: 1px solid var(--border); border-radius: var(--radius-sm); background: var(--bg); font-size: 14px; color: var(--muted); }
+.search-box input { border: none; background: transparent; outline: none; font-size: 14px; color: var(--fg); width: 160px; }

 /* ── Filter Bar / Chips ─────────────────────────── */
 .filter-bar { display: flex; align-items: center; gap: 12px; padding: 10px 22px; border-bottom: 1px solid var(--border); background: var(--surface); flex-shrink: 0; }
 .chip-group { display: flex; gap: 6px; flex-wrap: wrap; }
-.chip { height: 26px; padding: 0 10px; border-radius: var(--radius-pill); border: 1px solid var(--border); background: transparent; font-size: 11px; font-weight: 500; cursor: pointer; color: var(--muted); transition: all 0.12s; }
+.chip { height: 28px; padding: 0 11px; border-radius: var(--radius-pill); border: 1px solid var(--border); background: transparent; font-size: 12px; font-weight: 500; cursor: pointer; color: var(--muted); transition: all 0.12s; }
 .chip:hover { border-color: var(--accent); color: var(--accent); }
 .chip.active { background: var(--accent-dim); border-color: var(--accent); color: var(--accent); font-weight: 600; }
 .filter-sep { width: 1px; height: 20px; background: var(--border); flex-shrink: 0; }
@@ -327,34 +327,47 @@ body {
@keyframes spin { from { transform: rotate(0deg); } to { transform: rotate(360deg); } }

 /* ── Overview Page ──────────────────────────────── */
-.overview-page { padding: 32px; max-width: 900px; display: flex; flex-direction: column; gap: 32px; }
+/* Outer container fills content-area and handles scrolling.          */
+/* Inner .overview-page constrains width and holds the page content.  */
+.overview-scroll-wrapper {
+  flex: 1;
+  overflow-y: auto;
+  height: 100%;
+}
+.overview-page {
+  padding: 32px;
+  max-width: 960px;
+  display: flex;
+  flex-direction: column;
+  gap: 32px;
+}

 .overview-hero { display: flex; flex-direction: column; gap: 12px; }
-.hero-eyebrow { font-size: 11px; font-weight: 700; text-transform: uppercase; letter-spacing: 0.08em; color: var(--accent); }
-.hero-title { font-size: 32px; font-weight: 700; font-family: var(--font-display); line-height: 1.15; }
-.hero-desc { font-size: 14px; color: var(--muted); max-width: 480px; line-height: 1.6; }
+.hero-eyebrow { font-size: 12px; font-weight: 700; text-transform: uppercase; letter-spacing: 0.08em; color: var(--accent); }
+.hero-title { font-size: 34px; font-weight: 700; font-family: var(--font-display); line-height: 1.15; }
+.hero-desc { font-size: 15px; color: var(--muted); max-width: 520px; line-height: 1.6; }
 .hero-actions { display: flex; gap: 10px; padding-top: 4px; }

 .overview-summary { display: flex; align-items: center; gap: 0; }
 .summary-item { display: flex; flex-direction: column; align-items: center; gap: 2px; flex: 1; padding: 14px; }
-.summary-num { font-size: 22px; font-weight: 700; font-family: var(--font-display); color: var(--accent); }
-.summary-label { font-size: 11px; color: var(--muted); }
+.summary-num { font-size: 24px; font-weight: 700; font-family: var(--font-display); color: var(--accent); }
+.summary-label { font-size: 12px; color: var(--muted); }
 .summary-divider { width: 1px; height: 40px; background: var(--border); flex-shrink: 0; }

-.section-title { font-size: 13px; font-weight: 700; font-family: var(--font-display); color: var(--fg); margin-bottom: 14px; }
+.section-title { font-size: 14px; font-weight: 700; font-family: var(--font-display); color: var(--fg); margin-bottom: 14px; }

 .workflow-steps { display: grid; grid-template-columns: repeat(6, 1fr); gap: 12px; }
 .workflow-step { display: flex; flex-direction: column; gap: 4px; padding: 12px; background: var(--surface); border-radius: var(--radius-md); box-shadow: var(--shadow-card); }
-.step-num { font-size: 10px; font-weight: 700; font-family: var(--font-mono); color: var(--accent); }
-.step-label { font-size: 13px; font-weight: 700; font-family: var(--font-display); }
-.step-desc { font-size: 11px; color: var(--muted); line-height: 1.4; }
+.step-num { font-size: 11px; font-weight: 700; font-family: var(--font-mono); color: var(--accent); }
+.step-label { font-size: 14px; font-weight: 700; font-family: var(--font-display); }
+.step-desc { font-size: 12px; color: var(--muted); line-height: 1.4; }

 .screen-grid { display: grid; grid-template-columns: repeat(3, 1fr); gap: 14px; }
 .screen-card { text-align: left; cursor: pointer; border: none; transition: box-shadow 0.15s; display: flex; flex-direction: column; gap: 6px; }
 .screen-card:hover { box-shadow: 0 4px 12px rgba(0,0,0,.10), 0 0 0 2px var(--accent-dim); }
 .screen-icon { width: 36px; height: 36px; background: var(--accent-dim); color: var(--accent); border-radius: var(--radius-sm); display: flex; align-items: center; justify-content: center; margin-bottom: 4px; }
-.screen-label { font-size: 13px; font-weight: 700; font-family: var(--font-display); }
-.screen-desc { font-size: 12px; color: var(--muted); line-height: 1.4; }
+.screen-label { font-size: 14px; font-weight: 700; font-family: var(--font-display); }
+.screen-desc { font-size: 13px; color: var(--muted); line-height: 1.4; }

 /* ── Status Page ────────────────────────────────── */
 .status-page { display: flex; flex-direction: column; height: 100%; }
@@ -375,18 +388,18 @@ body {
  display: flex; flex-direction: column; gap: 4px;
 }
 .stat-cell:last-child { border-right: none; }
-.stat-value { font-size: 26px; font-weight: 700; font-family: var(--font-display); }
-.stat-label { font-size: 11px; color: var(--muted); }
+.stat-value { font-size: 28px; font-weight: 700; font-family: var(--font-display); }
+.stat-label { font-size: 12px; color: var(--muted); }
 .stat-cell.danger .stat-value { color: var(--danger); }

 .panel-grid { display: grid; grid-template-columns: 1.4fr 0.9fr; gap: 16px; }
 .panel-left, .panel-right { display: flex; flex-direction: column; gap: 16px; }

-.card-header { font-size: 12px; font-weight: 700; font-family: var(--font-display); color: var(--muted); text-transform: uppercase; letter-spacing: 0.05em; margin-bottom: 12px; }
+.card-header { font-size: 13px; font-weight: 700; font-family: var(--font-display); color: var(--muted); text-transform: uppercase; letter-spacing: 0.05em; margin-bottom: 12px; }

 .task-row { display: flex; align-items: center; gap: 12px; padding: 8px 0; border-top: 1px solid var(--border); }
 .task-info { flex: 1; min-width: 0; }
-.task-name { font-size: 13px; font-weight: 500; margin-bottom: 4px; }
+.task-name { font-size: 14px; font-weight: 500; margin-bottom: 4px; }
 .task-progress-bar { height: 3px; background: var(--border); border-radius: 2px; overflow: hidden; }
 .task-progress-fill { height: 100%; background: var(--accent); border-radius: 2px; }

@@ -401,12 +414,12 @@ body {
 .kpi-value { font-size: 11px; font-weight: 700; font-family: var(--font-mono); color: var(--fg); width: 36px; text-align: right; flex-shrink: 0; }

 .service-row { display: flex; align-items: center; justify-content: space-between; padding: 8px 0; border-top: 1px solid var(--border); }
-.service-name { font-size: 13px; }
+.service-name { font-size: 14px; }

 .event-row { padding: 10px 0; border-top: 1px solid var(--border); display: flex; flex-direction: column; gap: 3px; }
-.event-date { font-size: 10px; font-family: var(--font-mono); color: var(--muted); }
-.event-title { font-size: 13px; font-weight: 600; }
-.event-summary { font-size: 12px; color: var(--muted); display: -webkit-box; -webkit-line-clamp: 2; -webkit-box-orient: vertical; overflow: hidden; }
+.event-date { font-size: 11px; font-family: var(--font-mono); color: var(--muted); }
+.event-title { font-size: 14px; font-weight: 600; }
+.event-summary { font-size: 13px; color: var(--muted); display: -webkit-box; -webkit-line-clamp: 2; -webkit-box-orient: vertical; overflow: hidden; }

 /* ── Perception Page ────────────────────────────── */
 .perception-page { display: flex; flex-direction: column; height: 100%; }
@@ -414,8 +427,8 @@ body {
 .stats-bar { display: flex; border-bottom: 1px solid var(--border); background: var(--surface); flex-shrink: 0; }
 .sbar-cell { flex: 1; padding: 14px 22px; border-right: 1px solid var(--border); display: flex; flex-direction: column; gap: 3px; }
 .sbar-cell:last-child { border-right: none; }
-.sbar-val { font-size: 22px; font-weight: 700; font-family: var(--font-display); }
-.sbar-lbl { font-size: 11px; color: var(--muted); }
+.sbar-val { font-size: 24px; font-weight: 700; font-family: var(--font-display); }
+.sbar-lbl { font-size: 12px; color: var(--muted); }
 .sbar-cell.danger .sbar-val { color: var(--danger); }
 .sbar-cell.warn   .sbar-val { color: var(--warn); }
 .sbar-cell.accent .sbar-val { color: var(--accent); }
@@ -427,14 +440,14 @@ body {
 .ev-card:hover { background: var(--bg); }
 .ev-card.selected { border-left-color: var(--accent); background: var(--accent-dim); box-shadow: inset 0 0 0 1px var(--accent-dim); }
 .ev-top { display: flex; align-items: center; gap: 7px; margin-bottom: 6px; }
-.ev-std { font-size: 10px; font-family: var(--font-mono); color: var(--muted); }
-.ev-title { font-size: 13px; font-weight: 600; line-height: 1.35; margin-bottom: 5px; }
-.ev-summary { font-size: 12px; color: var(--muted); display: -webkit-box; -webkit-line-clamp: 2; -webkit-box-orient: vertical; overflow: hidden; margin-bottom: 8px; }
+.ev-std { font-size: 11px; font-family: var(--font-mono); color: var(--muted); }
+.ev-title { font-size: 14px; font-weight: 600; line-height: 1.35; margin-bottom: 5px; }
+.ev-summary { font-size: 13px; color: var(--muted); display: -webkit-box; -webkit-line-clamp: 2; -webkit-box-orient: vertical; overflow: hidden; margin-bottom: 8px; }
 .ev-bottom { display: flex; align-items: center; gap: 8px; flex-wrap: wrap; }
-.ev-date { font-size: 10px; font-family: var(--font-mono); color: var(--muted); }
+.ev-date { font-size: 11px; font-family: var(--font-mono); color: var(--muted); }
 .ev-tags { display: flex; gap: 4px; flex-wrap: wrap; }
-.ev-tag { font-size: 10px; padding: 1px 6px; background: var(--bg); border: 1px solid var(--border); border-radius: var(--radius-pill); color: var(--muted); }
-.impact-dot { font-size: 10px; font-weight: 700; margin-left: auto; }
+.ev-tag { font-size: 11px; padding: 1px 6px; background: var(--bg); border: 1px solid var(--border); border-radius: var(--radius-pill); color: var(--muted); }
+.impact-dot { font-size: 11px; font-weight: 700; margin-left: auto; }
 .impact-high   { color: var(--danger); }
 .impact-medium { color: var(--warn); }
 .impact-low    { color: var(--success); }
@@ -447,18 +460,18 @@ body {

 .detail-card { display: flex; flex-direction: column; gap: 10px; }
 .detail-header { display: flex; align-items: center; gap: 8px; }
-.detail-title { font-size: 15px; font-weight: 700; font-family: var(--font-display); }
-.detail-summary { font-size: 13px; color: var(--muted); line-height: 1.6; }
+.detail-title { font-size: 16px; font-weight: 700; font-family: var(--font-display); }
+.detail-summary { font-size: 14px; color: var(--muted); line-height: 1.6; }
 .detail-actions { display: flex; gap: 8px; padding-top: 4px; }

 .docs-card { display: flex; flex-direction: column; gap: 0; }
 .doc-row { display: flex; gap: 10px; padding: 10px 0; border-top: 1px solid var(--border); }
 .doc-score { font-size: 11px; font-weight: 700; font-family: var(--font-mono); color: var(--success); width: 34px; flex-shrink: 0; padding-top: 1px; }
-.doc-name { font-size: 12px; font-weight: 600; margin-bottom: 3px; }
-.doc-clause { font-size: 10px; font-family: var(--font-mono); color: var(--muted); margin-left: 5px; }
-.doc-snippet { font-size: 11px; color: var(--muted); display: -webkit-box; -webkit-line-clamp: 2; -webkit-box-orient: vertical; overflow: hidden; }
+.doc-name { font-size: 13px; font-weight: 600; margin-bottom: 3px; }
+.doc-clause { font-size: 11px; font-family: var(--font-mono); color: var(--muted); margin-left: 5px; }
+.doc-snippet { font-size: 12px; color: var(--muted); display: -webkit-box; -webkit-line-clamp: 2; -webkit-box-orient: vertical; overflow: hidden; }

-.ai-card .ai-output { font-size: 13px; line-height: 1.7; white-space: pre-wrap; font-family: var(--font-mono); }
+.ai-card .ai-output { font-size: 14px; line-height: 1.7; white-space: pre-wrap; font-family: var(--font-mono); }
 .blink-cursor { animation: blink 1s step-end infinite; }
@keyframes blink { 0%,100% { opacity: 1; } 50% { opacity: 0; } }

@@ -466,7 +479,7 @@ body {
 .docs-page { display: flex; flex-direction: column; height: 100%; }

 .docs-controls { display: flex; align-items: center; gap: 12px; margin-bottom: 14px; flex-wrap: wrap; }
-.select-input { height: 28px; padding: 0 10px; border: 1px solid var(--border); border-radius: var(--radius-sm); background: var(--surface); font-size: 12px; color: var(--fg); outline: none; cursor: pointer; }
+.select-input { height: 30px; padding: 0 10px; border: 1px solid var(--border); border-radius: var(--radius-sm); background: var(--surface); font-size: 13px; color: var(--fg); outline: none; cursor: pointer; }

 .batch-bar { display: flex; align-items: center; gap: 10px; padding: 8px 12px; background: var(--accent-dim); border: 1px solid var(--accent); border-radius: var(--radius-sm); margin-bottom: 12px; font-size: 13px; color: var(--accent); font-weight: 600; }
 .risk-btn { color: var(--danger); border-color: var(--danger-bg); }
@@ -479,7 +492,7 @@ body {
  padding: 10px 14px;
  background: var(--bg);
  border-bottom: 1px solid var(--border);
-  font-size: 11px; font-weight: 700; text-transform: uppercase; letter-spacing: 0.05em; color: var(--muted);
+  font-size: 12px; font-weight: 700; text-transform: uppercase; letter-spacing: 0.05em; color: var(--muted);
  align-items: center;
 }
 .table-row {
@@ -488,7 +501,7 @@ body {
  gap: 12px;
  padding: 11px 14px;
  border-bottom: 1px solid var(--border);
-  font-size: 13px;
+  font-size: 14px;
  align-items: center;
  transition: background 0.1s, opacity 0.3s;
 }
@@ -497,10 +510,10 @@ body {
 .table-row.row-selected { background: var(--accent-dim); }
 .table-row.row-deleting { opacity: 0.4; pointer-events: none; }
 .doc-name-cell { font-weight: 500; }
-.cell-mono { font-family: var(--font-mono); font-size: 11px; color: var(--muted); }
-.cell-muted { font-size: 12px; color: var(--muted); }
+.cell-mono { font-family: var(--font-mono); font-size: 12px; color: var(--muted); }
+.cell-muted { font-size: 13px; color: var(--muted); }
 .row-actions { display: flex; gap: 10px; }
-.text-link { background: none; border: none; font-size: 12px; color: var(--accent); cursor: pointer; font-weight: 500; padding: 0; }
+.text-link { background: none; border: none; font-size: 13px; color: var(--accent); cursor: pointer; font-weight: 500; padding: 0; }
 .text-link:hover { text-decoration: underline; }
 .danger-link { color: var(--danger); }

@@ -514,24 +527,24 @@ body {
 .compliance-workspace { display: grid; grid-template-columns: 0.95fr 1.25fr 0.9fr; gap: 14px; padding: 16px 24px 24px; flex: 1; overflow: hidden; min-height: 0; }

 .comp-col { display: flex; flex-direction: column; gap: 12px; overflow-y: auto; }
-.col-header { font-size: 11px; font-weight: 700; text-transform: uppercase; letter-spacing: 0.05em; color: var(--muted); padding: 0 2px 4px; flex-shrink: 0; }
+.col-header { font-size: 12px; font-weight: 700; text-transform: uppercase; letter-spacing: 0.05em; color: var(--muted); padding: 0 2px 4px; flex-shrink: 0; }

 .source-item { display: flex; flex-direction: column; gap: 6px; flex-shrink: 0; }
 .source-top { display: flex; align-items: center; justify-content: space-between; gap: 8px; }
-.source-std { font-size: 13px; font-weight: 700; font-family: var(--font-display); }
-.source-helper { font-size: 11px; color: var(--muted); }
+.source-std { font-size: 14px; font-weight: 700; font-family: var(--font-display); }
+.source-helper { font-size: 12px; color: var(--muted); }
 .source-scores { display: flex; gap: 5px; flex-wrap: wrap; }
-.score-pill { font-size: 10px; font-family: var(--font-mono); padding: 2px 6px; background: var(--bg); border: 1px solid var(--border); border-radius: var(--radius-pill); color: var(--muted); }
+.score-pill { font-size: 11px; font-family: var(--font-mono); padding: 2px 6px; background: var(--bg); border: 1px solid var(--border); border-radius: var(--radius-pill); color: var(--muted); }

 .para-card { flex-shrink: 0; }
-.para-text { font-size: 13px; line-height: 1.7; color: var(--fg); }
+.para-text { font-size: 14px; line-height: 1.7; color: var(--fg); }
 .para-text mark { background: rgba(226,0,116,.15); color: var(--accent); padding: 0 2px; border-radius: 2px; }

 .stages-card { flex-shrink: 0; }
 .stage-row { padding: 8px 0; border-top: 1px solid var(--border); display: flex; flex-direction: column; gap: 5px; }
 .stage-label-row { display: flex; justify-content: space-between; align-items: center; }
-.stage-label { font-size: 12px; }
-.stage-pct { font-size: 11px; font-family: var(--font-mono); color: var(--muted); }
+.stage-label { font-size: 13px; }
+.stage-pct { font-size: 12px; font-family: var(--font-mono); color: var(--muted); }
 .stage-bar { height: 4px; background: var(--border); border-radius: 2px; overflow: hidden; }
 .stage-fill { height: 100%; border-radius: 2px; }
 .stage-fill.stage-ok   { background: var(--success); }
@@ -540,13 +553,13 @@ body {

 .finding-item { display: flex; flex-direction: column; gap: 6px; flex-shrink: 0; }
 .finding-top { display: flex; align-items: flex-start; justify-content: space-between; gap: 8px; }
-.finding-title { font-size: 13px; font-weight: 600; line-height: 1.3; }
-.finding-desc { font-size: 12px; color: var(--muted); line-height: 1.5; }
+.finding-title { font-size: 14px; font-weight: 600; line-height: 1.3; }
+.finding-desc { font-size: 13px; color: var(--muted); line-height: 1.5; }

 .conclusion-box { display: flex; flex-direction: column; gap: 10px; flex-shrink: 0; }
-.conclusion-text { font-size: 12px; line-height: 1.6; color: var(--fg); }
+.conclusion-text { font-size: 13px; line-height: 1.6; color: var(--fg); }
 .action-items { display: flex; flex-direction: column; gap: 8px; padding-top: 8px; border-top: 1px solid var(--border); }
-.action-item { display: flex; justify-content: space-between; align-items: center; gap: 8px; font-size: 12px; }
+.action-item { display: flex; justify-content: space-between; align-items: center; gap: 8px; font-size: 13px; }
 .action-label { color: var(--muted); }
 .action-value { font-weight: 600; }
 .risk-text { color: var(--danger); }
@@ -559,9 +572,9 @@ body {
 .history-header, .quick-header { font-size: 10px; font-weight: 700; text-transform: uppercase; letter-spacing: 0.06em; color: var(--muted); padding: 10px 16px 6px; }
 .history-item { padding: 8px 16px; cursor: pointer; border-radius: 0; transition: background 0.1s; }
 .history-item:hover { background: var(--bg); }
-.history-title { font-size: 12px; font-weight: 500; display: -webkit-box; -webkit-line-clamp: 2; -webkit-box-orient: vertical; overflow: hidden; }
-.history-date { font-size: 10px; font-family: var(--font-mono); color: var(--muted); margin-top: 2px; }
-.quick-item { background: none; border: none; text-align: left; padding: 8px 16px; font-size: 12px; color: var(--muted); cursor: pointer; line-height: 1.4; transition: color 0.1s, background 0.1s; }
+.history-title { font-size: 13px; font-weight: 500; display: -webkit-box; -webkit-line-clamp: 2; -webkit-box-orient: vertical; overflow: hidden; }
+.history-date { font-size: 11px; font-family: var(--font-mono); color: var(--muted); margin-top: 2px; }
+.quick-item { background: none; border: none; text-align: left; padding: 8px 16px; font-size: 13px; color: var(--muted); cursor: pointer; line-height: 1.4; transition: color 0.1s, background 0.1s; }
 .quick-item:hover { color: var(--accent); background: var(--accent-dim); }

 .chat-main { display: flex; flex-direction: column; overflow: hidden; }
@@ -570,14 +583,14 @@ body {
 .msg-user { flex-direction: row-reverse; }
 .msg-avatar { width: 28px; height: 28px; border-radius: 50%; display: flex; align-items: center; justify-content: center; font-size: 10px; font-weight: 700; flex-shrink: 0; background: var(--accent-dim); color: var(--accent); }
 .msg-avatar.user-av { background: var(--bg); color: var(--muted); border: 1px solid var(--border); }
-.msg-bubble { max-width: 72%; padding: 10px 14px; border-radius: 14px; font-size: 13px; line-height: 1.6; }
+.msg-bubble { max-width: 72%; padding: 10px 14px; border-radius: 14px; font-size: 14px; line-height: 1.6; }
 .msg-assistant .msg-bubble { background: var(--surface); border: 1px solid var(--border); border-bottom-left-radius: 4px; }
 .msg-user .msg-bubble { background: var(--accent); color: #fff; border-bottom-right-radius: 4px; }

 .composer { padding: 12px 16px; border-top: 1px solid var(--border); background: var(--surface); display: flex; flex-direction: column; gap: 8px; flex-shrink: 0; }
 .quick-chips { display: flex; gap: 6px; flex-wrap: wrap; }
 .composer-row { display: flex; gap: 8px; align-items: flex-end; }
-.composer-input { flex: 1; padding: 8px 12px; border: 1px solid var(--border); border-radius: var(--radius-sm); background: var(--bg); font-size: 13px; font-family: var(--font-body); color: var(--fg); resize: none; outline: none; line-height: 1.5; }
+.composer-input { flex: 1; padding: 8px 12px; border: 1px solid var(--border); border-radius: var(--radius-sm); background: var(--bg); font-size: 14px; font-family: var(--font-body); color: var(--fg); resize: none; outline: none; line-height: 1.5; }
 .composer-input:focus { border-color: var(--accent); }

 .citation-rail { border-left: 1px solid var(--border); overflow-y: auto; padding: 14px 0; background: var(--surface); }
@@ -586,9 +599,9 @@ body {
 .citation-item.highlighted { background: var(--accent-dim); border-left: 3px solid var(--accent); }
 .cit-score { font-size: 11px; font-weight: 700; font-family: var(--font-mono); color: var(--success); width: 34px; flex-shrink: 0; padding-top: 1px; }
 .cit-index { font-size: 10px; font-weight: 700; font-family: var(--font-mono); color: var(--muted); width: 18px; flex-shrink: 0; padding-top: 2px; }
-.cit-name { font-size: 12px; font-weight: 600; margin-bottom: 3px; }
-.cit-clause { font-size: 10px; font-family: var(--font-mono); color: var(--muted); margin-left: 5px; }
-.cit-snippet { font-size: 11px; color: var(--muted); display: -webkit-box; -webkit-line-clamp: 3; -webkit-box-orient: vertical; overflow: hidden; line-height: 1.5; }
+.cit-name { font-size: 13px; font-weight: 600; margin-bottom: 3px; }
+.cit-clause { font-size: 11px; font-family: var(--font-mono); color: var(--muted); margin-left: 5px; }
+.cit-snippet { font-size: 12px; color: var(--muted); display: -webkit-box; -webkit-line-clamp: 3; -webkit-box-orient: vertical; overflow: hidden; line-height: 1.5; }

 /* Inline citation badge [N] in message text */
 .cite-ref {
@@ -792,7 +805,7 @@ body {
 }
 .modal-tab {
  padding: 10px 18px;
-  font-size: 13px;
+  font-size: 14px;
  font-weight: 500;
  border: none;
  background: none;
@@ -816,7 +829,7 @@ body {
 .domain-chip {
  padding: 4px 12px;
  border-radius: 20px;
-  font-size: 11px;
+  font-size: 12px;
  font-weight: 500;
  border: 1px solid var(--border);
  background: var(--surface);
@@ -867,8 +880,8 @@ body {
  background: var(--accent);
  border-color: var(--accent);
 }
-.doc-select-name { font-size: 13px; font-weight: 500; flex: 1; }
-.doc-select-meta { font-size: 11px; color: var(--muted); }
+.doc-select-name { font-size: 14px; font-weight: 500; flex: 1; }
+.doc-select-meta { font-size: 12px; color: var(--muted); }

 /* Stage running animation */
@keyframes stage-pulse {
@@ -945,8 +958,8 @@ body {
  color: var(--accent);
  opacity: 0.7;
 }
-.analysis-empty h3 { font-size: 15px; font-weight: 600; color: var(--fg); margin: 0; }
-.analysis-empty p { font-size: 13px; max-width: 280px; line-height: 1.6; margin: 0; }
+.analysis-empty h3 { font-size: 16px; font-weight: 600; color: var(--fg); margin: 0; }
+.analysis-empty p { font-size: 14px; max-width: 280px; line-height: 1.6; margin: 0; }

 /* Highlight terms in paragraph */
 mark.comp-highlight {
@@ -976,3 +989,152 @@ mark.comp-highlight {
  background: linear-gradient(to right, #22c55e 0%, #eab308 50%, #ef4444 100%);
  transition: width 0.6s ease;
 }
+
+/* ── Login Page ─────────────────────────────────── */
+.login-page {
+  min-height: 100vh;
+  display: flex;
+  align-items: center;
+  justify-content: center;
+  background: var(--bg);
+}
+
+.login-card {
+  width: 100%;
+  max-width: 380px;
+  background: var(--surface);
+  border: 1px solid var(--border);
+  border-radius: var(--radius-md);
+  box-shadow: var(--shadow-card);
+  padding: 36px 32px 28px;
+}
+
+.login-brand {
+  display: flex;
+  align-items: center;
+  gap: 10px;
+  margin-bottom: 28px;
+}
+.login-logo { width: 32px; height: 32px; object-fit: contain; }
+.login-brand-name { font-size: 14px; font-weight: 700; font-family: var(--font-display); color: var(--fg); }
+.login-brand-sub  { font-size: 11px; color: var(--muted); }
+
+.login-title {
+  font-size: 20px;
+  font-weight: 700;
+  font-family: var(--font-display);
+  margin-bottom: 20px;
+  color: var(--fg);
+}
+
+.login-form { display: flex; flex-direction: column; gap: 16px; }
+
+.login-field { display: flex; flex-direction: column; gap: 5px; }
+.login-label { font-size: 12px; font-weight: 600; color: var(--fg); }
+
+.login-input {
+  height: 38px;
+  padding: 0 12px;
+  border: 1px solid var(--border-strong);
+  border-radius: var(--radius-sm);
+  background: var(--bg);
+  color: var(--fg);
+  font-size: 13px;
+  outline: none;
+  transition: border-color 0.15s;
+}
+.login-input:focus { border-color: var(--accent); }
+.login-input:disabled { opacity: 0.6; }
+
+.login-error {
+  font-size: 12px;
+  color: var(--danger);
+  background: var(--danger-bg);
+  border: 1px solid rgba(220,38,38,.2);
+  border-radius: var(--radius-sm);
+  padding: 8px 12px;
+  margin: 0;
+}
+
+.login-btn {
+  height: 40px;
+  background: var(--accent);
+  color: #fff;
+  border: none;
+  border-radius: var(--radius-sm);
+  font-size: 14px;
+  font-weight: 700;
+  cursor: pointer;
+  transition: background 0.15s;
+}
+.login-btn:hover:not(:disabled) { background: var(--accent-hover); }
+.login-btn:disabled { opacity: 0.6; cursor: not-allowed; }
+
+.login-hint {
+  margin-top: 16px;
+  font-size: 11px;
+  color: var(--muted);
+  text-align: center;
+}
+.login-hint code {
+  font-family: var(--font-mono);
+  background: var(--bg);
+  padding: 1px 4px;
+  border-radius: 3px;
+  border: 1px solid var(--border);
+}
+
+/* ── Sidebar user block (authenticated) ─────────── */
+.user-badge {
+  display: inline-block;
+  font-size: 10px;
+  font-weight: 700;
+  text-transform: uppercase;
+  padding: 1px 5px;
+  border-radius: 3px;
+  background: var(--accent-dim);
+  color: var(--accent);
+  letter-spacing: 0.04em;
+}
+.logout-btn {
+  background: none;
+  border: none;
+  cursor: pointer;
+  color: var(--muted);
+  padding: 4px;
+  border-radius: var(--radius-sm);
+  display: flex;
+  align-items: center;
+  transition: color 0.15s;
+}
+.logout-btn:hover { color: var(--danger); }
+
+/* ── Detail Tabs (Perception) ──────────────────── */
+.detail-tabs {
+  display: flex;
+  gap: 2px;
+  margin: 8px 0 0;
+  border-bottom: 1px solid var(--border);
+  padding-bottom: 0;
+}
+.detail-tab {
+  background: none;
+  border: none;
+  border-bottom: 2px solid transparent;
+  padding: 6px 14px;
+  font-size: 13px;
+  color: var(--text-secondary);
+  cursor: pointer;
+  transition: color 0.15s, border-color 0.15s;
+}
+.detail-tab:hover { color: var(--text); }
+.detail-tab.active {
+  color: var(--accent);
+  border-bottom-color: var(--accent);
+  font-weight: 600;
+}
+.detail-tab.disabled {
+  opacity: 0.35;
+  cursor: not-allowed;
+}
+.spin { animation: spin 1s linear infinite; }
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -17,13 +17,15 @@ dependencies = [
    "langchain>=0.1.0",
    "langchain-milvus>=0.1.0",
    "pymupdf>=1.24.0",
-    "python-docx>=0.8.11",
+    "python-docx>=1.1.0",
    "pydantic>=2.0.0",
    "pydantic-settings>=2.0.0",
    "python-dotenv>=1.0.0",
    "loguru>=0.7.0",
    "tenacity>=8.2.0",
    "httpx>=0.24.0",
+    "beautifulsoup4>=4.12.0",
+    "lxml>=5.0.0",
    "alibabacloud-docmind-api20220711>=1.0.6",
    "alibabacloud-tea-openapi>=0.3.11",
    "alibabacloud-tea-util>=0.3.13",
@@ -31,10 +33,13 @@ dependencies = [
    "redis>=4.5.0",
    "minio>=7.1.0",
    "psycopg2-binary>=2.9.0",
+    "python-jose[cryptography]>=3.3.0",
+    "passlib[bcrypt]>=1.7.4",
+    "bcrypt>=3.2.0,<4.0.0",
 ]

 [dependency-groups]
-dev = ["pytest>=7.0.0", "pytest-asyncio>=0.21.0", "isort>=8.0.1"]
+dev = ["pytest>=7.0.0", "pytest-asyncio>=0.21.0", "isort>=8.0.1", "fakeredis>=2.0.0"]

 [build-system]
 requires = ["setuptools>=61.0"]
--- a/requirements.txt
+++ b/requirements.txt
@@ -17,7 +17,7 @@ langchain-milvus>=0.1.0
 pymupdf>=1.24.0

 # Word文档解析
-python-docx>=0.8.11
+python-docx>=1.1.0

 # 阿里云文档解析
 alibabacloud-docmind-api20220711>=1.0.6
@@ -42,3 +42,7 @@ python-dotenv>=1.0.0
 loguru>=0.7.0
 tenacity>=8.2.0
 httpx>=0.24.0
+
+# Authentication
+python-jose[cryptography]>=3.3.0
+passlib[bcrypt]>=1.7.4
--- a/scripts/seed_users.py
+++ b/scripts/seed_users.py
@@ -0,0 +1,84 @@
+#!/usr/bin/env python
+"""Seed demo users into the PostgreSQL users table.
+
+Run from the repo root:
+    PYTHONPATH=backend python scripts/seed_users.py
+
+Creates four demo accounts (one per role). Safe to run multiple times —
+existing usernames are left unchanged (ON CONFLICT DO NOTHING).
+"""
+
+import os
+import sys
+
+# Allow running from repo root without installing the package.
+sys.path.insert(0, os.path.join(os.path.dirname(__file__), "..", "backend"))
+
+import psycopg2
+from passlib.context import CryptContext
+from app.config.settings import settings
+
+_PWD_CTX = CryptContext(schemes=["bcrypt"], deprecated="auto")
+
+DEMO_USERS = [
+    {"username": "admin",    "password": "Admin@2026!",   "role": "admin"},
+    {"username": "legal",    "password": "Legal@2026!",   "role": "legal"},
+    {"username": "ehs",      "password": "EHS@2026!",     "role": "ehs"},
+    {"username": "readonly", "password": "Read@2026!",    "role": "readonly"},
+]
+
+_CREATE_TABLE_SQL = """
+CREATE TABLE IF NOT EXISTS users (
+    id          UUID        PRIMARY KEY DEFAULT gen_random_uuid(),
+    username    VARCHAR(100) UNIQUE NOT NULL,
+    hashed_pw   TEXT         NOT NULL,
+    role        VARCHAR(50)  NOT NULL DEFAULT 'readonly',
+    is_active   BOOLEAN      NOT NULL DEFAULT TRUE,
+    created_at  TIMESTAMPTZ  NOT NULL DEFAULT NOW()
+);
+"""
+
+
+def seed() -> None:
+    """Insert demo users. Skips any username that already exists."""
+    conn = psycopg2.connect(
+        host=settings.postgres_host,
+        port=settings.postgres_port,
+        user=settings.postgres_user,
+        password=settings.postgres_password,
+        dbname=settings.postgres_db,
+    )
+    conn.autocommit = True
+
+    with conn.cursor() as cur:
+        # Enable pgcrypto for gen_random_uuid() if not already enabled, or use uuid-ossp fallback.
+        try:
+            cur.execute("CREATE EXTENSION IF NOT EXISTS pgcrypto;")
+        except Exception:
+            conn.rollback()
+        cur.execute(_CREATE_TABLE_SQL)
+
+    inserted = 0
+    with conn.cursor() as cur:
+        for user in DEMO_USERS:
+            hashed = _PWD_CTX.hash(user["password"])
+            cur.execute(
+                """
+                INSERT INTO users (username, hashed_pw, role)
+                VALUES (%s, %s, %s)
+                ON CONFLICT (username) DO NOTHING
+                """,
+                (user["username"], hashed, user["role"]),
+            )
+            if cur.rowcount > 0:
+                print(f"  Created user: {user['username']} (role={user['role']})")
+                inserted += 1
+            else:
+                print(f"  Skipped (already exists): {user['username']}")
+
+    print(f"\nDone. {inserted} user(s) created.")
+    conn.close()
+
+
+if __name__ == "__main__":
+    seed()
--- a/Show More
+++ b/Show More
Author	SHA1	Message	Date
wangwei	9212747e1b	update for 1. 优化 2.中英切换	2026-06-10 11:10:36 +08:00
wangwei	e7963b267e	fix somethings	2026-06-08 11:16:28 +08:00
wangwei	9fea9c6a53	1. Add 登陆功能 2. 调整字体大小 3. 新增部分功能	2026-06-05 18:00:31 +08:00
				`@@ -0,0 +1 @@`
				`{"reason":"idle timeout","timestamp":1780894411095}`
				`@@ -0,0 +1 @@`
				`"""HTTP middleware for cross-cutting concerns: audit logging."""`