feat: add admin routes, summarizer service, and CLI summarize command

- Add /admin routes for manual trigger and status inspection
- Add summarizer service with batch/single summary support
- Add summarize CLI command (single arxiv_id or batch pending)
- Register admin router in main app
- Add tests for summarizer
2026-06-05 22:29:33 +08:00
parent d69df2be10
commit 29e6797c12
7 changed files with 1874 additions and 0 deletions
@@ -49,6 +49,46 @@ def crawl(
        db.close()


+@cli_app.command()
+def summarize(
+    arxiv_id: str = typer.Argument(
+        None,
+        help="指定论文 arXiv ID；留空则批量处理所有 pending",
+    ),
+):
+    """手动触发 AI 总结。"""
+    from app.config import settings
+    from app.database import SessionLocal, engine
+    from app.models import init_db as _init
+    from app.services.summarizer import summarize_batch, summarize_single
+
+    import os
+    os.makedirs(settings.db_path.parent, exist_ok=True)
+    _init(engine)
+
+    db = SessionLocal()
+    try:
+        if arxiv_id:
+            typer.echo(f"🤖 开始总结 {arxiv_id} ...")
+            result = asyncio.run(summarize_single(db, arxiv_id))
+        else:
+            typer.echo("🤖 开始批量总结 pending 论文 ...")
+            result = asyncio.run(summarize_batch(db))
+
+        if result.get("status") in ("success", "done"):
+            typer.echo(f"✅ 总结完成：{result}")
+        elif result.get("status") == "conflict":
+            typer.echo("⚠️  已有批量总结任务在运行中", err=True)
+            raise typer.Exit(code=1)
+        elif result.get("status") == "not_found":
+            typer.echo(f"❌ 论文未找到：{arxiv_id}", err=True)
+            raise typer.Exit(code=1)
+        else:
+            typer.echo(f"⚠️  总结结果：{result}", err=True)
+    finally:
+        db.close()
+
+
@cli_app.command()
 def init_db():
    """初始化数据库表。"""
@@ -9,6 +9,7 @@ from fastapi.staticfiles import StaticFiles
 from app.config import settings
 from app.database import engine
 from app.models import init_db
+from app.routes.admin import router as admin_router
 from app.routes.pages import router as pages_router

 logging.basicConfig(
@@ -41,6 +42,7 @@ def create_app() -> FastAPI:

    # 路由
    app.include_router(pages_router)
+    app.include_router(admin_router)

    return app

@@ -0,0 +1,48 @@
+"""管理接口 — AI 总结触发，需要 ADMIN_TOKEN 鉴权。"""
+
+from __future__ import annotations
+
+from fastapi import APIRouter, Depends, HTTPException
+from fastapi.security import HTTPAuthorizationCredentials, HTTPBearer
+from sqlalchemy.orm import Session
+
+from app.config import settings
+from app.database import get_db
+from app.services.summarizer import summarize_batch, summarize_single
+
+router = APIRouter(prefix="/admin", tags=["admin"])
+security = HTTPBearer()
+
+
+async def verify_admin(
+    credentials: HTTPAuthorizationCredentials = Depends(security),
+) -> str:
+    """验证 ADMIN_TOKEN。"""
+    if credentials.credentials != settings.ADMIN_TOKEN:
+        raise HTTPException(status_code=401, detail="Invalid admin token")
+    return credentials.credentials
+
+
+@router.post("/summarize")
+async def admin_summarize_batch(
+    _admin: str = Depends(verify_admin),
+    db: Session = Depends(get_db),
+):
+    """批量总结所有 pending 论文。"""
+    result = await summarize_batch(db)
+    if result.get("status") == "conflict":
+        raise HTTPException(status_code=409, detail=result.get("error", "batch already running"))
+    return result
+
+
+@router.post("/summarize/{arxiv_id}")
+async def admin_summarize_single(
+    arxiv_id: str,
+    _admin: str = Depends(verify_admin),
+    db: Session = Depends(get_db),
+):
+    """总结或重跑单篇论文。"""
+    result = await summarize_single(db, arxiv_id, force=True)
+    if result.get("status") == "not_found":
+        raise HTTPException(status_code=404, detail=f"Paper not found: {arxiv_id}")
+    return result
@@ -0,0 +1,168 @@
+"""AI 总结 schema — Pydantic 校验模型、质量评估、DB 展平。"""
+
+from __future__ import annotations
+
+import json
+from datetime import datetime, timezone
+
+from pydantic import BaseModel, Field, ValidationError, field_validator
+
+
+# ── 子模型 ──────────────────────────────────────────────────────────────
+
+
+class PrerequisitesSchema(BaseModel):
+    """Optional "prerequisites" section of a summary; both fields have defaults."""
+
+    # Defaults to an empty list when the section omits it.
+    concepts: list[str] = Field(default_factory=list)
+    # Free-form text; defaults to an empty string.
+    level: str = ""
+
+
+class MotivationSchema(BaseModel):
+    problem: str
+    goal: str = ""
+    gap: str = ""
+
+    @field_validator("problem")
+    @classmethod
+    def non_empty_problem(cls, v: str) -> str:
+        if not v or not v.strip():
+            raise ValueError("motivation.problem cannot be empty")
+        return v.strip()
+
+
+class MethodSchema(BaseModel):
+    overview: str = ""
+    key_idea: str
+    steps: list[str] = Field(default_factory=list)
+    novelty: str = ""
+
+    @field_validator("key_idea")
+    @classmethod
+    def non_empty_key_idea(cls, v: str) -> str:
+        if not v or not v.strip():
+            raise ValueError("method.key_idea cannot be empty")
+        return v.strip()
+
+
+class ResultsSchema(BaseModel):
+    """"Results" section of a summary; every field defaults to an empty list."""
+
+    main_findings: list[str] = Field(default_factory=list)
+    # Each benchmark is an untyped dict; its keys are not constrained here.
+    benchmarks: list[dict] = Field(default_factory=list)
+    limitations: list[str] = Field(default_factory=list)
+
+
+class ImprovementsSchema(BaseModel):
+    """"Improvements" section of a summary; every field has an empty default."""
+
+    weaknesses: list[str] = Field(default_factory=list)
+    future_work: list[str] = Field(default_factory=list)
+    reproducibility: str = ""
+
+
+# ── 顶层 schema ─────────────────────────────────────────────────────────
+
+
+class SummarySchema(BaseModel):
+    model_config = {"extra": "ignore"}
+
+    title_zh: str
+    one_line: str
+    tags: list[str]
+    difficulty: str = ""
+    paper_date: str | None = None
+    prerequisites: PrerequisitesSchema = Field(default_factory=PrerequisitesSchema)
+    motivation: MotivationSchema
+    method: MethodSchema
+    results: ResultsSchema = Field(default_factory=ResultsSchema)
+    improvements: ImprovementsSchema = Field(default_factory=ImprovementsSchema)
+
+    @field_validator("title_zh", "one_line")
+    @classmethod
+    def non_empty_text(cls, v: str) -> str:
+        if not v or not v.strip():
+            raise ValueError("field cannot be empty")
+        return v.strip()
+
+    @field_validator("tags")
+    @classmethod
+    def non_empty_tags(cls, v: list[str]) -> list[str]:
+        tags = [tag.strip() for tag in v if tag and tag.strip()]
+        if not tags:
+            raise ValueError("tags cannot be empty")
+        return tags
+
+
+# ── 质量评估 ────────────────────────────────────────────────────────────
+
+# 必填字段：title_zh, one_line, tags, motivation.problem, method.key_idea
+#   — 缺失时 Pydantic 校验就会报错，不会走到 assess_quality
+# 重要字段：motivation.goal, motivation.gap, method.overview, results.main_findings
+#   — 缺失可入库，标记 degraded
+_OPTIONAL_BUT_IMPORTANT_FIELDS = [
+    "motivation.goal",
+    "motivation.gap",
+    "method.overview",
+    "results.main_findings",
+]
+
+
+def assess_quality(schema: SummarySchema) -> str:
+    """评估总结质量：normal / degraded / low。"""
+    # low：内容空洞的启发式判断
+    if len(schema.one_line.strip()) < 10 or len(schema.method.key_idea.strip()) < 10:
+        return "low"
+
+    # 检查重要字段是否缺失
+    missing_important = 0
+    if not schema.motivation.goal.strip():
+        missing_important += 1
+    if not schema.motivation.gap.strip():
+        missing_important += 1
+    if not schema.method.overview.strip():
+        missing_important += 1
+    if not schema.results.main_findings:
+        missing_important += 1
+
+    if missing_important == 0:
+        return "normal"
+    return "degraded"
+
+
+# ── DB 展平 ─────────────────────────────────────────────────────────────
+
+
+def flatten_for_db(schema: SummarySchema) -> dict:
+    """将 SummarySchema 展平为 paper_summaries 表的列值 dict。"""
+    return {
+        "one_line": schema.one_line,
+        "difficulty": schema.difficulty,
+        "prerequisites_json": json.dumps(schema.prerequisites.model_dump(), ensure_ascii=False),
+        "motivation_problem": schema.motivation.problem,
+        "motivation_goal": schema.motivation.goal,
+        "motivation_gap": schema.motivation.gap,
+        "method_overview": schema.method.overview,
+        "method_key_idea": schema.method.key_idea,
+        "method_steps_json": json.dumps(schema.method.steps, ensure_ascii=False),
+        "method_novelty": schema.method.novelty,
+        "results_main_json": json.dumps(schema.results.main_findings, ensure_ascii=False),
+        "results_benchmarks_json": json.dumps(schema.results.benchmarks, ensure_ascii=False),
+        "limitations_json": json.dumps(schema.results.limitations, ensure_ascii=False),
+        "weaknesses_json": json.dumps(schema.improvements.weaknesses, ensure_ascii=False),
+        "future_work_json": json.dumps(schema.improvements.future_work, ensure_ascii=False),
+        "reproducibility": schema.improvements.reproducibility,
+        "full_json": schema.model_dump_json(ensure_ascii=False),
+        "updated_at": datetime.now(timezone.utc),
+    }
+
+
+# ── 错误分类 ────────────────────────────────────────────────────────────
+
+_REQUIRED_FIELDS = {"title_zh", "one_line", "tags", "problem", "key_idea"}
+
+
+def classify_validation_error(exc: ValidationError) -> str:
+    """区分 field_missing（必填缺失）和 schema_error（类型不合法等）。"""
+    for err in exc.errors():
+        field_name = err["loc"][-1] if err["loc"] else ""
+        if field_name in _REQUIRED_FIELDS and err["type"] in (
+            "missing",
+            "value_error",
+        ):
+            return "field_missing"
+    return "schema_error"
@@ -0,0 +1,682 @@
+"""AI 总结服务 — 调用 pi CLI 生成论文中文结构化总结。"""
+
+from __future__ import annotations
+
+import asyncio
+import json
+import logging
+import re
+import shutil
+from datetime import datetime, timezone
+from pathlib import Path
+
+import httpx
+from pydantic import ValidationError
+from sqlalchemy import select, text
+from sqlalchemy.orm import Session, joinedload
+
+from app.config import settings
+from app.database import SessionLocal
+from app.models import (
+    CrawlLog,
+    Paper,
+    PaperSummary,
+    PaperTag,
+    SummaryStatus,
+    TaskLock,
+)
+from app.services.schemas import (
+    SummarySchema,
+    assess_quality,
+    classify_validation_error,
+    flatten_for_db,
+)
+
+logger = logging.getLogger(__name__)
+
+# ── 自定义异常 ──────────────────────────────────────────────────────────
+
+
+class PdfDownloadError(Exception):
+    """Raised when a paper has no PDF URL or its PDF cannot be downloaded."""
+
+    pass
+
+
+class PiTimeoutError(Exception):
+    """Raised when the pi CLI does not finish within the configured timeout."""
+
+    pass
+
+
+class PiProcessError(Exception):
+    """Raised when the pi CLI exits with a non-zero return code."""
+
+    def __init__(self, returncode: int, stderr: str):
+        # Keep the full details on the instance for callers that need them.
+        self.returncode = returncode
+        self.stderr = stderr
+        # Only the first 500 characters of stderr go into the message.
+        super().__init__(f"pi exited with code {returncode}: {stderr[:500]}")
+
+
+class JsonNotFoundError(Exception):
+    """Raised when no JSON object can be extracted from the pi output."""
+
+    pass
+
+
+# ── 路径工具 ────────────────────────────────────────────────────────────
+
+_DATA_DIR = Path("data")
+_PAPERS_DIR = _DATA_DIR / "papers"
+_TMP_DIR = _DATA_DIR / "tmp"
+
+
+def _paper_dir(arxiv_id: str) -> Path:
+    """Return the per-paper directory ``data/papers/{arxiv_id}`` (not created here)."""
+    return _PAPERS_DIR / arxiv_id
+
+
+def _tmp_dir(arxiv_id: str) -> Path:
+    """Return the per-paper scratch directory ``data/tmp/{arxiv_id}`` (not created here)."""
+    return _TMP_DIR / arxiv_id
+
+
+# ── PDF 下载 ────────────────────────────────────────────────────────────
+
+
+async def _download_pdf(arxiv_id: str, pdf_url: str) -> Path:
+    """下载 PDF 到 data/tmp/{arxiv_id}/paper.pdf。"""
+    if not pdf_url:
+        raise PdfDownloadError(f"no pdf_url for {arxiv_id}")
+
+    tmp = _tmp_dir(arxiv_id)
+    tmp.mkdir(parents=True, exist_ok=True)
+    dest = tmp / "paper.pdf"
+
+    transport = None
+    if settings.http_proxy:
+        transport = httpx.AsyncHTTPTransport(proxy=settings.http_proxy)
+
+    try:
+        async with httpx.AsyncClient(
+            timeout=settings.HTTP_TIMEOUT_SECONDS,
+            headers={"User-Agent": settings.HTTP_USER_AGENT},
+            transport=transport,
+            follow_redirects=True,
+        ) as client:
+            resp = await client.get(pdf_url)
+            resp.raise_for_status()
+            dest.write_bytes(resp.content)
+    except Exception as exc:
+        raise PdfDownloadError(f"failed to download PDF for {arxiv_id}: {exc}") from exc
+
+    logger.info("Downloaded PDF: %s (%d bytes)", arxiv_id, dest.stat().st_size)
+    return dest
+
+
+# ── meta.json ───────────────────────────────────────────────────────────
+
+
+def _write_meta_json(paper: Paper) -> Path:
+    """写入 data/papers/{arxiv_id}/meta.json，返回路径。"""
+    d = _paper_dir(paper.arxiv_id)
+    d.mkdir(parents=True, exist_ok=True)
+    meta_path = d / "meta.json"
+
+    authors = [a.name for a in paper.authors]
+    tags = [t.tag for t in paper.tags]
+    meta = {
+        "arxiv_id": paper.arxiv_id,
+        "title_en": paper.title_en,
+        "abstract": paper.abstract or "",
+        "published_at": paper.published_at.isoformat() if paper.published_at else None,
+        "authors": authors,
+        "tags": tags,
+        "upvotes": paper.upvotes,
+    }
+    meta_path.write_text(json.dumps(meta, ensure_ascii=False, indent=2), encoding="utf-8")
+    return meta_path
+
+
+# ── pi CLI 调用 ────────────────────────────────────────────────────────
+
+
+async def _call_pi(meta_path: Path, pdf_path: Path) -> str:
+    """调用 pi CLI 非交互模式，返回 stdout 文本。"""
+    cmd = [
+        settings.PI_BIN,
+        "-p",
+        "--no-tools",
+        "--skill",
+        settings.SUMMARY_SKILL,
+        "请深度解读以下论文，并按指定 JSON schema 输出：",
+        f"@{meta_path}",
+        f"@{pdf_path}",
+    ]
+    logger.info("Calling pi: %s %s", paper_id_from_path(meta_path), " ".join(cmd[:4]))
+
+    proc = await asyncio.create_subprocess_exec(
+        *cmd,
+        stdout=asyncio.subprocess.PIPE,
+        stderr=asyncio.subprocess.PIPE,
+    )
+    try:
+        stdout, stderr = await asyncio.wait_for(
+            proc.communicate(),
+            timeout=settings.SUMMARY_TIMEOUT_SECONDS,
+        )
+    except asyncio.TimeoutError:
+        proc.kill()
+        await proc.wait()
+        raise PiTimeoutError(
+            f"pi timed out after {settings.SUMMARY_TIMEOUT_SECONDS}s"
+        )
+
+    if proc.returncode != 0:
+        raise PiProcessError(proc.returncode, stderr.decode("utf-8", errors="replace"))
+
+    return stdout.decode("utf-8", errors="replace")
+
+
+def paper_id_from_path(meta_path: Path) -> str:
+    """Derive the arxiv_id from a meta.json path: the name of its parent directory."""
+    return meta_path.parent.name
+
+
+# ── JSON 提取 ──────────────────────────────────────────────────────────
+
+
+def _extract_json(raw_output: str) -> dict:
+    """从 pi 输出中提取 JSON dict。三步策略：直接解析 → 代码块 → 最大花括号块。"""
+    # 策略 1：整体直接解析
+    stripped = raw_output.strip()
+    try:
+        result = json.loads(stripped)
+        if isinstance(result, dict) and "title_zh" in result:
+            return result
+    except json.JSONDecodeError:
+        pass
+
+    # 策略 2：提取 ```json ... ``` 代码块
+    fence_pattern = re.compile(r"```(?:json)?\s*\n(.*?)```", re.DOTALL)
+    for match in fence_pattern.finditer(raw_output):
+        try:
+            result = json.loads(match.group(1).strip())
+            if isinstance(result, dict) and "title_zh" in result:
+                return result
+        except json.JSONDecodeError:
+            continue
+
+    # 策略 3：匹配包含 title_zh 的最大 {...} 块
+    brace_pattern = re.compile(r"\{[^{}]*\"title_zh\"[^{}]*\}", re.DOTALL)
+    # 先尝试一层嵌套；如果没命中再用更宽松的策略
+    for match in brace_pattern.finditer(raw_output):
+        try:
+            return json.loads(match.group(0))
+        except json.JSONDecodeError:
+            continue
+
+    # 更宽松：找到最大的 { ... } 平衡块
+    best = None
+    best_len = 0
+    for i, ch in enumerate(raw_output):
+        if ch != "{":
+            continue
+        depth = 0
+        for j in range(i, len(raw_output)):
+            if raw_output[j] == "{":
+                depth += 1
+            elif raw_output[j] == "}":
+                depth -= 1
+            if depth == 0:
+                candidate = raw_output[i : j + 1]
+                if len(candidate) > best_len:
+                    try:
+                        parsed = json.loads(candidate)
+                        if isinstance(parsed, dict):
+                            best = parsed
+                            best_len = len(candidate)
+                    except json.JSONDecodeError:
+                        pass
+                break
+
+    if best is not None:
+        return best
+
+    raise JsonNotFoundError("no JSON object found in pi output")
+
+
+# ── 错误分类 ────────────────────────────────────────────────────────────
+
+
+def _classify_error(exc: Exception) -> str:
+    """将异常映射到 error_type 枚举值。"""
+    if isinstance(exc, PdfDownloadError):
+        return "pdf_download_failed"
+    if isinstance(exc, PiTimeoutError):
+        return "timeout"
+    if isinstance(exc, PiProcessError):
+        return "process_error"
+    if isinstance(exc, JsonNotFoundError):
+        return "json_not_found"
+    if isinstance(exc, json.JSONDecodeError):
+        return "json_invalid"
+    if isinstance(exc, ValidationError):
+        return classify_validation_error(exc)
+    return "unknown"
+
+
+# ── FTS5 文本构建 ───────────────────────────────────────────────────────
+
+
+def _build_fts_summary_text(schema: SummarySchema) -> str:
+    """拼接用于 FTS5 索引的总结文本。"""
+    parts = [
+        schema.one_line or "",
+        schema.motivation.problem or "",
+        schema.motivation.goal or "",
+        schema.method_overview if hasattr(schema, "method_overview") else "",
+        schema.method.overview or "",
+        schema.method.key_idea or "",
+        " ".join(schema.results.main_findings or []),
+    ]
+    return " ".join(p for p in parts if p)
+
+
+# ── DB 更新 ─────────────────────────────────────────────────────────────
+
+
+def _update_summary_in_db(
+    db: Session,
+    paper: Paper,
+    schema: SummarySchema,
+    quality: str,
+    raw_output: str,
+) -> None:
+    """将校验后的总结写入 DB：paper_summaries + papers + paper_tags + FTS5。"""
+    now = datetime.now(timezone.utc)
+
+    # 1. paper_summaries：upsert
+    existing = db.get(PaperSummary, paper.id)
+    flat = flatten_for_db(schema)
+    if existing:
+        for k, v in flat.items():
+            setattr(existing, k, v)
+    else:
+        db.add(PaperSummary(paper_id=paper.id, **flat))
+
+    # 2. papers 表
+    paper.title_zh = schema.title_zh
+    paper.summary_quality = quality
+    paper_dir = _paper_dir(paper.arxiv_id)
+    paper.summary_path = str(paper_dir / "summary.json")
+    paper.raw_output_path = str(paper_dir / "raw_output.txt")
+
+    # 3. AI 标签
+    existing_tag_names = {t.tag for t in paper.tags}
+    for tag_name in schema.tags:
+        if tag_name not in existing_tag_names:
+            db.add(PaperTag(paper_id=paper.id, tag=tag_name, source="ai"))
+            existing_tag_names.add(tag_name)
+
+    # 4. FTS5 更新
+    summary_text = _build_fts_summary_text(schema)
+    db.execute(
+        text(
+            "UPDATE papers_fts SET title_zh=:title_zh, summary_text=:summary_text "
+            "WHERE rowid=:paper_id"
+        ),
+        {
+            "title_zh": schema.title_zh,
+            "summary_text": summary_text,
+            "paper_id": paper.id,
+        },
+    )
+
+    db.commit()
+    logger.info("DB updated: paper=%s quality=%s", paper.arxiv_id, quality)
+
+
+# ── 文件操作 ────────────────────────────────────────────────────────────
+
+
+def _save_files(arxiv_id: str, schema: SummarySchema, raw_output: str) -> None:
+    """保存 summary.json 和 raw_output.txt。"""
+    d = _paper_dir(arxiv_id)
+    d.mkdir(parents=True, exist_ok=True)
+    (d / "summary.json").write_text(
+        schema.model_dump_json(ensure_ascii=False, indent=2),
+        encoding="utf-8",
+    )
+    (d / "raw_output.txt").write_text(raw_output, encoding="utf-8")
+
+
+def _save_raw_output_only(arxiv_id: str, raw_output: str) -> None:
+    """仅保存 raw_output.txt（失败时）。"""
+    d = _paper_dir(arxiv_id)
+    d.mkdir(parents=True, exist_ok=True)
+    (d / "raw_output.txt").write_text(raw_output, encoding="utf-8")
+
+
+def _cleanup_tmp(arxiv_id: str) -> None:
+    """清理 data/tmp/{arxiv_id}/ 目录。"""
+    tmp = _tmp_dir(arxiv_id)
+    if tmp.exists():
+        try:
+            shutil.rmtree(tmp)
+            logger.debug("Cleaned tmp: %s", arxiv_id)
+        except Exception:
+            logger.warning("Failed to clean tmp for %s", arxiv_id, exc_info=True)
+
+
+# ── 单篇总结 ────────────────────────────────────────────────────────────
+
+
+async def summarize_one(
+    db: Session,
+    paper: Paper,
+    semaphore: asyncio.Semaphore | None = None,
+    *,
+    force: bool = False,
+) -> dict:
+    """总结单篇论文的完整流程。"""
+    arxiv_id = paper.arxiv_id
+
+    # 获取或创建 summary_status
+    if not paper.summary_status:
+        db.add(SummaryStatus(paper_id=paper.id, status="pending"))
+        db.commit()
+        db.refresh(paper)
+
+    status = paper.summary_status
+
+    # 跳过已完成的（除非 force）
+    if status.status == "done" and not force:
+        return {"arxiv_id": arxiv_id, "status": "skipped", "reason": "already_done"}
+
+    # 跳过 permanent_failure（除非 force）
+    if status.status == "permanent_failure" and not force:
+        return {"arxiv_id": arxiv_id, "status": "skipped", "reason": "permanent_failure"}
+
+    if semaphore:
+        await semaphore.acquire()
+    try:
+        return await _do_summarize_one(db, paper)
+    finally:
+        if semaphore:
+            semaphore.release()
+
+
+async def _do_summarize_one(db: Session, paper: Paper) -> dict:
+    """实际的单篇总结执行（在 semaphore 保护下）。"""
+    arxiv_id = paper.arxiv_id
+    status = paper.summary_status
+    now = datetime.now(timezone.utc)
+
+    # 状态 → processing
+    status.status = "processing"
+    status.started_at = now
+    db.commit()
+
+    raw_output = ""
+    try:
+        # 写 meta.json
+        meta_path = _write_meta_json(paper)
+
+        # 下载 PDF
+        await _download_pdf(arxiv_id, paper.pdf_url)
+
+        # 调用 pi
+        raw_output = await _call_pi(meta_path, _tmp_dir(arxiv_id) / "paper.pdf")
+
+        # 提取 JSON
+        json_data = _extract_json(raw_output)
+
+        # Pydantic 校验
+        schema = SummarySchema.model_validate(json_data)
+
+        # 质量评估
+        quality = assess_quality(schema)
+
+        # 保存文件
+        _save_files(arxiv_id, schema, raw_output)
+
+        # 更新 DB
+        _update_summary_in_db(db, paper, schema, quality, raw_output)
+
+        # 状态 → done
+        status.status = "done"
+        status.quality = quality
+        status.completed_at = datetime.now(timezone.utc)
+        status.raw_output_saved = True
+        db.commit()
+
+        logger.info("Summarize done: %s quality=%s", arxiv_id, quality)
+        return {"arxiv_id": arxiv_id, "status": "done", "quality": quality}
+
+    except Exception as exc:
+        error_type = _classify_error(exc)
+        logger.error(
+            "Summarize failed: %s error_type=%s %s",
+            arxiv_id,
+            error_type,
+            str(exc)[:200],
+        )
+
+        # 保存 raw_output（如果有）
+        if raw_output:
+            _save_raw_output_only(arxiv_id, raw_output)
+            status.raw_output_saved = True
+
+        # 重试逻辑
+        status.retry_count = (status.retry_count or 0) + 1
+        status.error_type = error_type
+        status.error = str(exc)[:2000]
+
+        if status.retry_count >= settings.SUMMARY_MAX_RETRIES + 1:
+            status.status = "permanent_failure"
+        else:
+            status.status = "pending"
+
+        status.completed_at = datetime.now(timezone.utc)
+        db.commit()
+
+        return {
+            "arxiv_id": arxiv_id,
+            "status": "failed",
+            "error_type": error_type,
+            "error": str(exc)[:200],
+            "retry_count": status.retry_count,
+        }
+
+    finally:
+        _cleanup_tmp(arxiv_id)
+
+
+# ── 单篇入口 ────────────────────────────────────────────────────────────
+
+
+async def summarize_single(
+    db: Session,
+    arxiv_id: str,
+    *,
+    force: bool = True,
+    _session_factory=None,
+) -> dict:
+    """单篇总结入口（供 admin 路由和 CLI 调用）。
+
+    _session_factory: 可选的 session 工厂，测试时注入内存 DB 的 session。
+    """
+    paper = (
+        db.query(Paper)
+        .filter(Paper.arxiv_id == arxiv_id)
+        .options(
+            joinedload(Paper.authors),
+            joinedload(Paper.tags),
+            joinedload(Paper.summary_status),
+        )
+        .first()
+    )
+    if not paper:
+        return {"status": "not_found", "arxiv_id": arxiv_id}
+
+    make_session = _session_factory or SessionLocal
+
+    # 每篇用独立 session 避免并发问题
+    paper_db = make_session()
+    try:
+        paper_in_new_session = (
+            paper_db.query(Paper)
+            .filter(Paper.arxiv_id == arxiv_id)
+            .options(
+                joinedload(Paper.authors),
+                joinedload(Paper.tags),
+                joinedload(Paper.summary_status),
+            )
+            .first()
+        )
+        result = await summarize_one(paper_db, paper_in_new_session, force=force)
+    finally:
+        paper_db.close()
+
+    return result
+
+
+# ── 批量总结 ────────────────────────────────────────────────────────────
+
+
+async def summarize_batch(
+    db: Session,
+    arxiv_ids: list[str] | None = None,
+    *,
+    _session_factory=None,
+) -> dict:
+    """批量总结入口。arxiv_ids=None 时处理所有 pending 论文。
+
+    _session_factory: 可选的 session 工厂，测试时注入内存 DB 的 session。
+    """
+    now = datetime.now(timezone.utc)
+
+    # TaskLock 防重入
+    lock = TaskLock(
+        task="summarize",
+        lock_key="batch",
+        status="running",
+        owner="summarize_batch",
+        acquired_at=now,
+    )
+    try:
+        db.add(lock)
+        db.commit()
+    except Exception:
+        db.rollback()
+        logger.warning("Summarize batch already running (lock conflict)")
+        return {"status": "conflict", "error": "summarize batch already running"}
+
+    # CrawlLog
+    log_entry = CrawlLog(
+        task="summarize",
+        status="running",
+        started_at=now,
+    )
+    db.add(log_entry)
+    db.commit()
+
+    try:
+        # 查询待总结论文
+        query = db.query(Paper).options(
+            joinedload(Paper.authors),
+            joinedload(Paper.tags),
+            joinedload(Paper.summary_status),
+        )
+        if arxiv_ids:
+            query = query.filter(Paper.arxiv_id.in_(arxiv_ids))
+        else:
+            # 只处理 pending 或 failed（可重试的）
+            query = query.join(SummaryStatus).filter(
+                SummaryStatus.status.in_(["pending", "failed"])
+            )
+
+        papers = query.all()
+        total = len(papers)
+        logger.info("Summarize batch: %d papers to process", total)
+
+        if total == 0:
+            log_entry.status = "success"
+            log_entry.papers_found = 0
+            log_entry.papers_new = 0
+            log_entry.completed_at = datetime.now(timezone.utc)
+            _release_lock(db, lock)
+            return {"status": "success", "done": 0, "failed": 0, "skipped": 0, "total": 0}
+
+        # 并发控制
+        semaphore = asyncio.Semaphore(settings.SUMMARY_CONCURRENCY)
+        make_session = _session_factory or SessionLocal
+
+        async def _process_paper(paper: Paper) -> dict:
+            paper_db = make_session()
+            try:
+                p = (
+                    paper_db.query(Paper)
+                    .filter(Paper.id == paper.id)
+                    .options(
+                        joinedload(Paper.authors),
+                        joinedload(Paper.tags),
+                        joinedload(Paper.summary_status),
+                    )
+                    .first()
+                )
+                return await summarize_one(paper_db, p, semaphore)
+            finally:
+                paper_db.close()
+
+        results = await asyncio.gather(
+            *[_process_paper(p) for p in papers],
+            return_exceptions=True,
+        )
+
+        # 统计结果
+        done = 0
+        failed = 0
+        skipped = 0
+        for r in results:
+            if isinstance(r, Exception):
+                logger.error("Unexpected error in batch: %s", r)
+                failed += 1
+            elif isinstance(r, dict):
+                if r.get("status") == "done":
+                    done += 1
+                elif r.get("status") == "skipped":
+                    skipped += 1
+                else:
+                    failed += 1
+
+        log_entry.status = "success" if failed == 0 else "failed"
+        log_entry.papers_found = total
+        log_entry.papers_new = done
+        log_entry.completed_at = datetime.now(timezone.utc)
+        db.commit()
+
+        logger.info(
+            "Summarize batch done: total=%d done=%d failed=%d skipped=%d",
+            total, done, failed, skipped,
+        )
+        return {
+            "status": "success" if failed == 0 else "partial",
+            "total": total,
+            "done": done,
+            "failed": failed,
+            "skipped": skipped,
+        }
+
+    except Exception as exc:
+        logger.exception("Summarize batch failed")
+        log_entry.status = "failed"
+        log_entry.error = str(exc)[:2000]
+        log_entry.completed_at = datetime.now(timezone.utc)
+        db.commit()
+        return {"status": "failed", "error": str(exc)}
+
+    finally:
+        _release_lock(db, lock)
+
+
+def _release_lock(db: Session, lock: TaskLock) -> None:
+    """释放 TaskLock。"""
+    try:
+        lock.status = "finished"
+        lock.released_at = datetime.now(timezone.utc)
+        db.commit()
+    except Exception:
+        db.rollback()
+        logger.warning("Failed to release summarize lock", exc_info=True)
@@ -0,0 +1,209 @@
+"""测试 fixtures — 内存 SQLite、TestClient、样例数据。"""
+
+from __future__ import annotations
+
+import json
+from datetime import date, datetime, timezone
+from pathlib import Path
+from unittest.mock import AsyncMock
+
+import pytest
+from fastapi.testclient import TestClient
+from sqlalchemy import create_engine, event
+from sqlalchemy.orm import DeclarativeBase, sessionmaker
+
+from app.database import get_db
+from app.main import create_app
+from app.models import (
+    Paper,
+    PaperAuthor,
+    PaperSummary,
+    PaperTag,
+    SummaryStatus,
+    init_db,
+)
+
+
+# ── 内存数据库 ──────────────────────────────────────────────────────────
+
+
+class _TestBase(DeclarativeBase):
+    # Empty declarative base local to the test suite; its ``metadata`` is
+    # rebound below to the application's metadata.
+    pass
+
+
+# Reuse the metadata of the application's Base (imported from app.database)
+from app.database import Base as _AppBase  # noqa: E402
+
+_TestBase.metadata = _AppBase.metadata
+
+
+@pytest.fixture
+def db_engine():
+    """Yield an in-memory SQLite engine initialised through ``init_db``.
+
+    ``StaticPool`` keeps one shared connection for the whole engine. Without
+    it, SQLAlchemy's default pool for ``:memory:`` databases gives every
+    thread its own connection — and therefore its own empty database — so
+    code running in another thread (for example a request handled through
+    ``TestClient``) would not see the tables or rows created by the test.
+
+    The engine is disposed on teardown so the connection does not outlive
+    the test.
+    """
+    # Imported locally so the fixture does not depend on the module's
+    # top-level import list.
+    from sqlalchemy.pool import StaticPool
+
+    engine = create_engine(
+        "sqlite:///:memory:",
+        connect_args={"check_same_thread": False},
+        poolclass=StaticPool,
+    )
+
+    @event.listens_for(engine, "connect")
+    def _pragma(dbapi_connection, _record):
+        # SQLite only enforces foreign keys when enabled on the connection.
+        cursor = dbapi_connection.cursor()
+        cursor.execute("PRAGMA foreign_keys=ON")
+        cursor.close()
+
+    init_db(engine)
+    try:
+        yield engine
+    finally:
+        engine.dispose()
+
+
+@pytest.fixture
+def db_session(db_engine):
+    """Yield a session bound to the per-test engine; it is closed on teardown."""
+    factory = sessionmaker(bind=db_engine, autoflush=False, autocommit=False)
+    # The session's context manager closes it when the fixture is torn down.
+    with factory() as session:
+        yield session
+
+
+@pytest.fixture
+def client(db_engine, db_session):
+    """Yield a ``TestClient`` whose ``get_db`` dependency returns ``db_session``.
+
+    Server-side exceptions are not re-raised inside the test
+    (``raise_server_exceptions=False``). The dependency overrides are cleared
+    once the client context has exited.
+    """
+    application = create_app()
+
+    def _yield_test_session():
+        # Hand the test's own session to the request handlers.
+        yield db_session
+
+    application.dependency_overrides.update({get_db: _yield_test_session})
+
+    with TestClient(application, raise_server_exceptions=False) as http_client:
+        yield http_client
+
+    application.dependency_overrides.clear()
+
+
+# ── 样例数据 ────────────────────────────────────────────────────────────
+
+SAMPLE_ARXIV_ID = "2401.12345"
+ADMIN_TOKEN = "test-admin-token-12345"
+
+
+@pytest.fixture
+def sample_paper(db_session):
+    """Insert one test paper with authors, HF tags, a pending status and an FTS row.
+
+    The author and tag names are defined once and reused for both the ORM
+    rows and the ``papers_fts`` row, so the search index cannot drift from
+    the relational data.
+
+    Returns:
+        The committed ``Paper`` instance.
+    """
+    # Local import: ``text`` is not part of this module's top-level imports.
+    from sqlalchemy import text
+
+    author_names = ["Alice Smith", "Bob Jones"]
+    hf_tags = ["NLP", "LLM"]
+
+    now = datetime.now(timezone.utc)
+    paper = Paper(
+        arxiv_id=SAMPLE_ARXIV_ID,
+        title_en="Test Paper Title",
+        abstract="This is a test abstract for the paper.",
+        published_at=date(2024, 1, 15),
+        paper_date=date(2024, 1, 15),
+        crawled_at=now,
+        upvotes=42,
+        hf_url=f"https://huggingface.co/papers/{SAMPLE_ARXIV_ID}",
+        arxiv_url=f"https://arxiv.org/abs/{SAMPLE_ARXIV_ID}",
+        pdf_url=f"https://arxiv.org/pdf/{SAMPLE_ARXIV_ID}.pdf",
+    )
+    db_session.add(paper)
+    # Flush so ``paper.id`` is assigned before the dependent rows are built.
+    db_session.flush()
+
+    for position, name in enumerate(author_names):
+        db_session.add(PaperAuthor(paper_id=paper.id, name=name, position=position))
+    for tag in hf_tags:
+        db_session.add(PaperTag(paper_id=paper.id, tag=tag, source="hf"))
+
+    db_session.add(SummaryStatus(paper_id=paper.id, status="pending"))
+
+    # Initial FTS5 row (the original note says this mirrors the crawler).
+    db_session.execute(
+        text(
+            "INSERT INTO papers_fts(rowid, title_en, abstract, authors, tags) "
+            "VALUES (:id, :title, :abstract, :authors, :tags)"
+        ),
+        {
+            "id": paper.id,
+            "title": paper.title_en,
+            "abstract": paper.abstract or "",
+            "authors": ", ".join(author_names),
+            "tags": ", ".join(hf_tags),
+        },
+    )
+    db_session.commit()
+    return paper
+
+
+@pytest.fixture
+def sample_summary_dict() -> dict:
+    """Return a complete summary payload with every section filled in."""
+    prerequisites = {
+        "concepts": ["Transformer", "注意力机制"],
+        "level": "中级",
+    }
+    motivation = {
+        "problem": "现有模型在长文本理解上存在不足。",
+        "goal": "提出一种新的注意力机制来提升长文本建模能力。",
+        "gap": "当前方法计算复杂度过高。",
+    }
+    method = {
+        "overview": "提出了一种高效的稀疏注意力机制。",
+        "key_idea": "使用局部-全局混合的注意力模式来降低计算复杂度。",
+        "steps": [
+            "分析现有注意力机制的瓶颈",
+            "设计稀疏注意力模式",
+            "在多个基准上验证效果",
+        ],
+        "novelty": "首次将局部-全局注意力模式结合应用于长文本建模。",
+    }
+    results = {
+        "main_findings": [
+            "在长文本基准上取得了 SOTA 结果",
+            "推理速度提升了 2 倍",
+        ],
+        "benchmarks": [
+            {"dataset": "LongBench", "score": 85.3},
+        ],
+        "limitations": [
+            "在超长文本（>100k tokens）上效果有所下降",
+        ],
+    }
+    improvements = {
+        "weaknesses": ["仅验证了英文数据"],
+        "future_work": ["扩展到多语言场景"],
+        "reproducibility": "代码已开源，模型权重可下载。",
+    }
+    # Key order is kept identical to the serialised layout used by the tests.
+    return {
+        "title_zh": "测试论文中文标题",
+        "one_line": "这是一篇关于自然语言处理的测试论文的一句话总结。",
+        "tags": ["自然语言处理", "大语言模型", "Transformer"],
+        "difficulty": "中级",
+        "prerequisites": prerequisites,
+        "motivation": motivation,
+        "method": method,
+        "results": results,
+        "improvements": improvements,
+    }
+
+
+@pytest.fixture
+def sample_summary_json(sample_summary_dict) -> str:
+    """Serialise the sample summary as indented, non-ASCII-escaped JSON."""
+    serialized = json.dumps(sample_summary_dict, indent=2, ensure_ascii=False)
+    return serialized
+
+
+@pytest.fixture
+def mock_pi_output(sample_summary_json) -> str:
+    """Simulate full pi CLI output: prose wrapped around a fenced JSON block."""
+    lines = [
+        "以下是论文的深度解读：",
+        "",
+        "```json",
+        sample_summary_json,
+        "```",
+        "",
+        "希望这个总结对你有帮助！",
+    ]
+    return "\n".join(lines)
+
+
+@pytest.fixture
+def admin_token():
+    """Return the ADMIN_TOKEN value used by the tests.
+
+    The fixture only returns the constant; per the original note it is meant
+    to be combined with ``monkeypatch`` to install the value in the settings.
+    """
+    token = ADMIN_TOKEN
+    return token
+
+
+@pytest.fixture
+def admin_headers(admin_token):
+    """Build request headers carrying ``admin_token`` as a Bearer credential."""
+    bearer_value = f"Bearer {admin_token}"
+    return {"Authorization": bearer_value}
@@ -0,0 +1,725 @@
+"""AI 总结服务测试 — Mock 全链路，不调用真实 pi。"""
+
+from __future__ import annotations
+
+import asyncio
+import json
+from datetime import date, datetime, timezone
+from pathlib import Path
+from unittest.mock import AsyncMock, MagicMock, patch
+
+import pytest
+from pydantic import ValidationError
+from sqlalchemy import text
+
+from app.models import (
+    CrawlLog,
+    Paper,
+    PaperSummary,
+    PaperTag,
+    SummaryStatus,
+    TaskLock,
+)
+from app.services.schemas import (
+    SummarySchema,
+    assess_quality,
+    classify_validation_error,
+    flatten_for_db,
+)
+from app.services.summarizer import (
+    JsonNotFoundError,
+    PdfDownloadError,
+    PiProcessError,
+    PiTimeoutError,
+    _call_pi,
+    _classify_error,
+    _cleanup_tmp,
+    _extract_json,
+    _save_files,
+    _save_raw_output_only,
+    _update_summary_in_db,
+    summarize_batch,
+    summarize_one,
+    summarize_single,
+)
+
+
+# ═══════════════════════════════════════════════════════════════════════
+# Schema 校验测试
+# ═══════════════════════════════════════════════════════════════════════
+
+
+class TestSummarySchema:
+    """Validation behaviour of the ``SummarySchema`` Pydantic model."""
+
+    def test_valid_summary(self, sample_summary_dict):
+        parsed = SummarySchema.model_validate(sample_summary_dict)
+        assert parsed.title_zh == "测试论文中文标题"
+        assert len(parsed.tags) == 3
+        assert parsed.motivation.problem
+
+    def test_missing_title_zh(self, sample_summary_dict):
+        sample_summary_dict.pop("title_zh")
+        with pytest.raises(ValidationError) as caught:
+            SummarySchema.model_validate(sample_summary_dict)
+        assert classify_validation_error(caught.value) == "field_missing"
+
+    def test_empty_one_line(self, sample_summary_dict):
+        sample_summary_dict.update(one_line="")
+        with pytest.raises(ValidationError):
+            SummarySchema.model_validate(sample_summary_dict)
+
+    def test_empty_tags(self, sample_summary_dict):
+        sample_summary_dict.update(tags=[])
+        with pytest.raises(ValidationError):
+            SummarySchema.model_validate(sample_summary_dict)
+
+    def test_empty_motivation_problem(self, sample_summary_dict):
+        motivation = sample_summary_dict["motivation"]
+        motivation["problem"] = ""
+        with pytest.raises(ValidationError):
+            SummarySchema.model_validate(sample_summary_dict)
+
+    def test_empty_method_key_idea(self, sample_summary_dict):
+        method = sample_summary_dict["method"]
+        method["key_idea"] = ""
+        with pytest.raises(ValidationError):
+            SummarySchema.model_validate(sample_summary_dict)
+
+    def test_extra_fields_ignored(self, sample_summary_dict):
+        sample_summary_dict.update(
+            figures=["fig1.png"],
+            takeaway="important paper",
+        )
+        parsed = SummarySchema.model_validate(sample_summary_dict)
+        assert not hasattr(parsed, "figures")
+        assert parsed.title_zh  # known fields are still parsed
+
+    def test_flatten_for_db(self, sample_summary_dict):
+        parsed = SummarySchema.model_validate(sample_summary_dict)
+        columns = flatten_for_db(parsed)
+        assert columns["one_line"] == parsed.one_line
+        assert columns["motivation_problem"] == parsed.motivation.problem
+        assert columns["method_key_idea"] == parsed.method.key_idea
+        assert "full_json" in columns
+        assert "updated_at" in columns
+        # The *_json columns must hold decodable JSON of the expected shape.
+        prerequisites = json.loads(columns["prerequisites_json"])
+        assert isinstance(prerequisites, dict)
+        steps = json.loads(columns["method_steps_json"])
+        assert isinstance(steps, list)
+
+
+class TestQualityAssessment:
+    """Quality grading returned by ``assess_quality``."""
+
+    def test_quality_normal(self, sample_summary_dict):
+        parsed = SummarySchema.model_validate(sample_summary_dict)
+        grade = assess_quality(parsed)
+        assert grade == "normal"
+
+    def test_quality_degraded_missing_goal(self, sample_summary_dict):
+        # Blank out the optional sections this test expects to degrade quality.
+        sample_summary_dict["motivation"].update(goal="", gap="")
+        sample_summary_dict["method"].update(overview="")
+        sample_summary_dict["results"].update(main_findings=[])
+        parsed = SummarySchema.model_validate(sample_summary_dict)
+        grade = assess_quality(parsed)
+        assert grade == "degraded"
+
+    def test_quality_low_short_one_line(self, sample_summary_dict):
+        sample_summary_dict.update(one_line="短")
+        parsed = SummarySchema.model_validate(sample_summary_dict)
+        grade = assess_quality(parsed)
+        assert grade == "low"
+
+    def test_quality_low_short_key_idea(self, sample_summary_dict):
+        sample_summary_dict["method"].update(key_idea="短")
+        parsed = SummarySchema.model_validate(sample_summary_dict)
+        grade = assess_quality(parsed)
+        assert grade == "low"
+
+
+# ═══════════════════════════════════════════════════════════════════════
+# JSON 提取测试
+# ═══════════════════════════════════════════════════════════════════════
+
+
+class TestJsonExtraction:
+    """Extraction of the JSON payload from raw pi output via ``_extract_json``."""
+
+    def test_direct_json(self, sample_summary_json):
+        extracted = _extract_json(sample_summary_json)
+        assert extracted["title_zh"] == "测试论文中文标题"
+
+    def test_fenced_code_block(self, sample_summary_json):
+        pi_output = f"一些文字\n```json\n{sample_summary_json}\n```\n更多文字"
+        extracted = _extract_json(pi_output)
+        assert extracted["title_zh"] == "测试论文中文标题"
+
+    def test_fenced_without_lang(self, sample_summary_json):
+        pi_output = f"文字\n```\n{sample_summary_json}\n```"
+        extracted = _extract_json(pi_output)
+        assert extracted["title_zh"] == "测试论文中文标题"
+
+    def test_embedded_braces(self, sample_summary_dict):
+        compact = json.dumps(sample_summary_dict, ensure_ascii=False)
+        pi_output = f"Here is the summary:\n{compact}\nEnd."
+        extracted = _extract_json(pi_output)
+        assert extracted["title_zh"] == "测试论文中文标题"
+
+    def test_no_json_raises(self):
+        with pytest.raises(JsonNotFoundError):
+            _extract_json("No JSON here at all.")
+
+    def test_json_without_title_zh_falls_through(self):
+        """A JSON object lacking ``title_zh`` is still returned as a fallback."""
+        payload = {"other": "data"}
+        pi_output = json.dumps(payload)
+        # Per the original author's note: the direct-parse strategy skips
+        # objects without ``title_zh``, there is no fenced block to try, and
+        # the largest-brace-block strategy finally returns the object as-is.
+        extracted = _extract_json(pi_output)
+        assert extracted == {"other": "data"}  # largest-block fallback
+
+
+# ═══════════════════════════════════════════════════════════════════════
+# 错误分类测试
+# ═══════════════════════════════════════════════════════════════════════
+
+
+class TestErrorClassification:
+    """Mapping from exceptions to ``error_type`` strings via ``_classify_error``."""
+
+    def test_pdf_download_error(self):
+        assert _classify_error(PdfDownloadError("fail")) == "pdf_download_failed"
+
+    def test_timeout_error(self):
+        assert _classify_error(PiTimeoutError("timeout")) == "timeout"
+
+    def test_process_error(self):
+        assert _classify_error(PiProcessError(1, "stderr")) == "process_error"
+
+    def test_json_not_found(self):
+        assert _classify_error(JsonNotFoundError("not found")) == "json_not_found"
+
+    def test_json_invalid(self):
+        assert _classify_error(json.JSONDecodeError("bad", "", 0)) == "json_invalid"
+
+    def test_field_missing(self):
+        # ``pytest.raises`` makes the test fail if validation unexpectedly
+        # succeeds; a bare try/except would pass without asserting anything.
+        with pytest.raises(ValidationError) as exc_info:
+            SummarySchema.model_validate({"title_zh": ""})  # type: ignore
+        assert _classify_error(exc_info.value) == "field_missing"
+
+    def test_unknown_error(self):
+        assert _classify_error(RuntimeError("boom")) == "unknown"
+
+
+# ═══════════════════════════════════════════════════════════════════════
+# DB 更新测试
+# ═══════════════════════════════════════════════════════════════════════
+
+
+class TestDbUpdate:
+    """Database effects of ``_update_summary_in_db``."""
+
+    @staticmethod
+    def _store(db_session, paper, payload):
+        """Validate ``payload`` and persist it with quality "normal"; return the schema."""
+        parsed = SummarySchema.model_validate(payload)
+        _update_summary_in_db(db_session, paper, parsed, "normal", "raw")
+        return parsed
+
+    def test_summary_written(self, db_session, sample_paper, sample_summary_dict):
+        parsed = self._store(db_session, sample_paper, sample_summary_dict)
+
+        stored = db_session.get(PaperSummary, sample_paper.id)
+        assert stored is not None
+        assert stored.one_line == parsed.one_line
+        assert stored.motivation_problem == parsed.motivation.problem
+        full_payload = json.loads(stored.full_json)
+        assert full_payload["title_zh"] == parsed.title_zh
+
+    def test_paper_title_zh_updated(self, db_session, sample_paper, sample_summary_dict):
+        self._store(db_session, sample_paper, sample_summary_dict)
+
+        db_session.refresh(sample_paper)
+        assert sample_paper.title_zh == "测试论文中文标题"
+        assert sample_paper.summary_quality == "normal"
+
+    def test_fts_updated(self, db_session, sample_paper, sample_summary_dict):
+        parsed = self._store(db_session, sample_paper, sample_summary_dict)
+
+        fts_query = text(
+            "SELECT title_zh, summary_text FROM papers_fts WHERE rowid = :id"
+        )
+        fts_row = db_session.execute(fts_query, {"id": sample_paper.id}).fetchone()
+        assert fts_row is not None
+        assert fts_row[0] == "测试论文中文标题"
+        assert parsed.one_line in fts_row[1]
+
+    def test_ai_tags_added(self, db_session, sample_paper, sample_summary_dict):
+        self._store(db_session, sample_paper, sample_summary_dict)
+
+        ai_tag_query = db_session.query(PaperTag).filter(
+            PaperTag.paper_id == sample_paper.id,
+            PaperTag.source == "ai",
+        )
+        ai_tag_names = {row.tag for row in ai_tag_query.all()}
+        # The AI tags come from ``schema.tags``.
+        assert "自然语言处理" in ai_tag_names
+        assert "大语言模型" in ai_tag_names
+
+    def test_existing_tags_not_duplicated(self, db_session, sample_paper, sample_summary_dict):
+        """A tag name that already exists is not inserted again with source "ai"."""
+        # ``sample_paper`` already carries NLP (hf) and LLM (hf); the AI output
+        # repeats NLP and adds one brand-new tag.
+        sample_summary_dict.update(tags=["NLP", "新标签"])
+        self._store(db_session, sample_paper, sample_summary_dict)
+
+        paper_tags = db_session.query(PaperTag).filter(
+            PaperTag.paper_id == sample_paper.id
+        )
+        names = [row.tag for row in paper_tags.all()]
+        # NLP must appear exactly once (the pre-existing HF row).
+        assert names.count("NLP") == 1
+        # The new tag contributed by the AI output is present.
+        assert "新标签" in names
+
+
+# ═══════════════════════════════════════════════════════════════════════
+# 文件操作测试
+# ═══════════════════════════════════════════════════════════════════════
+
+
+class TestFileOperations:
+    """File persistence and temp-directory cleanup helpers."""
+
+    def test_save_files(self, tmp_path, sample_summary_dict):
+        parsed = SummarySchema.model_validate(sample_summary_dict)
+        with patch("app.services.summarizer._PAPERS_DIR", tmp_path):
+            _save_files("2401.12345", parsed, "raw output text")
+
+            target_dir = tmp_path / "2401.12345"
+            summary_file = target_dir / "summary.json"
+            raw_file = target_dir / "raw_output.txt"
+            assert summary_file.exists()
+            assert raw_file.exists()
+            on_disk = json.loads(summary_file.read_text())
+            assert on_disk["title_zh"] == "测试论文中文标题"
+
+    def test_save_raw_output_only(self, tmp_path):
+        with patch("app.services.summarizer._PAPERS_DIR", tmp_path):
+            _save_raw_output_only("2401.12345", "raw output")
+            target_dir = tmp_path / "2401.12345"
+            assert (target_dir / "raw_output.txt").exists()
+            assert not (target_dir / "summary.json").exists()
+
+    def test_cleanup_tmp(self, tmp_path):
+        scratch = tmp_path / "2401.12345"
+        scratch.mkdir()
+        fake_pdf = scratch / "paper.pdf"
+        fake_pdf.write_bytes(b"%PDF-fake")
+        with patch("app.services.summarizer._TMP_DIR", tmp_path):
+            _cleanup_tmp("2401.12345")
+        assert not scratch.exists()
+
+    def test_cleanup_tmp_nonexistent(self, tmp_path):
+        """Cleaning up a directory that does not exist must not raise."""
+        with patch("app.services.summarizer._TMP_DIR", tmp_path):
+            _cleanup_tmp("nonexistent")  # must not raise
+
+
+# ═══════════════════════════════════════════════════════════════════════
+# 全流程状态流转测试
+# ═══════════════════════════════════════════════════════════════════════
+
+
+class TestSummarizeOneFlow:
+    """Status transitions of ``summarize_one`` with the PDF download and pi call mocked."""
+
+    # Patch targets shared by the tests below.
+    _DOWNLOAD_PDF = "app.services.summarizer._download_pdf"
+    _CALL_PI = "app.services.summarizer._call_pi"
+
+    @pytest.fixture
+    def _patch_paths(self, tmp_path):
+        """Redirect the summarizer's data directories into ``tmp_path``."""
+        papers_dir = tmp_path / "papers"
+        scratch_dir = tmp_path / "tmp"
+        with (
+            patch("app.services.summarizer._PAPERS_DIR", papers_dir),
+            patch("app.services.summarizer._TMP_DIR", scratch_dir),
+            patch("app.services.summarizer._DATA_DIR", tmp_path),
+        ):
+            yield
+
+    @pytest.mark.asyncio
+    async def test_full_success_path(
+        self, db_session, sample_paper, mock_pi_output, _patch_paths
+    ):
+        """A pending paper with valid pi output ends up ``done``."""
+        with (
+            patch(self._DOWNLOAD_PDF, new_callable=AsyncMock),
+            patch(self._CALL_PI, new_callable=AsyncMock, return_value=mock_pi_output),
+        ):
+            outcome = await summarize_one(db_session, sample_paper)
+
+        assert outcome["status"] == "done"
+        assert outcome["quality"] == "normal"
+
+        # Database state after the run
+        db_session.refresh(sample_paper)
+        status_row = sample_paper.summary_status
+        assert status_row.status == "done"
+        assert status_row.quality == "normal"
+        assert sample_paper.title_zh == "测试论文中文标题"
+
+        # The summary row has been written
+        stored = db_session.get(PaperSummary, sample_paper.id)
+        assert stored is not None
+        assert stored.one_line
+
+        # The FTS row carries the Chinese title
+        fts_query = text("SELECT title_zh FROM papers_fts WHERE rowid = :id")
+        fts_row = db_session.execute(fts_query, {"id": sample_paper.id}).fetchone()
+        assert fts_row[0] == "测试论文中文标题"
+
+    @pytest.mark.asyncio
+    async def test_pdf_download_failure(
+        self, db_session, sample_paper, _patch_paths
+    ):
+        """A failing PDF download is reported as ``pdf_download_failed``."""
+        download_error = PdfDownloadError("network error")
+        with (
+            patch(
+                self._DOWNLOAD_PDF,
+                new_callable=AsyncMock,
+                side_effect=download_error,
+            ),
+        ):
+            outcome = await summarize_one(db_session, sample_paper)
+
+        assert outcome["status"] == "failed"
+        assert outcome["error_type"] == "pdf_download_failed"
+
+        db_session.refresh(sample_paper)
+        status_row = sample_paper.summary_status
+        assert status_row.error_type == "pdf_download_failed"
+
+    @pytest.mark.asyncio
+    async def test_pi_timeout(self, db_session, sample_paper, _patch_paths):
+        """A pi timeout yields error_type ``timeout`` and retry_count 1."""
+        with (
+            patch(self._DOWNLOAD_PDF, new_callable=AsyncMock),
+            patch(
+                self._CALL_PI,
+                new_callable=AsyncMock,
+                side_effect=PiTimeoutError("timeout after 300s"),
+            ),
+        ):
+            outcome = await summarize_one(db_session, sample_paper)
+
+        assert outcome["status"] == "failed"
+        assert outcome["error_type"] == "timeout"
+        assert outcome["retry_count"] == 1
+
+    @pytest.mark.asyncio
+    async def test_json_not_found(self, db_session, sample_paper, _patch_paths):
+        """pi output without any JSON is reported as ``json_not_found``."""
+        with (
+            patch(self._DOWNLOAD_PDF, new_callable=AsyncMock),
+            patch(
+                self._CALL_PI,
+                new_callable=AsyncMock,
+                return_value="No JSON in this output at all.",
+            ),
+        ):
+            outcome = await summarize_one(db_session, sample_paper)
+
+        assert outcome["status"] == "failed"
+        assert outcome["error_type"] == "json_not_found"
+
+    @pytest.mark.asyncio
+    async def test_field_missing_and_retry(
+        self, db_session, sample_paper, _patch_paths
+    ):
+        """An empty required field fails twice and ends in ``permanent_failure``."""
+        invalid_payload = {
+            "title_zh": "",  # required field left empty
+            "one_line": "valid line",
+            "tags": ["tag1"],
+            "motivation": {"problem": "valid problem"},
+            "method": {"key_idea": "valid idea"},
+        }
+        invalid_json = json.dumps(invalid_payload, ensure_ascii=False)
+        invalid_output = f"```json\n{invalid_json}\n```"
+
+        with (
+            patch(self._DOWNLOAD_PDF, new_callable=AsyncMock),
+            patch(
+                self._CALL_PI,
+                new_callable=AsyncMock,
+                return_value=invalid_output,
+            ),
+        ):
+            # First failure: reported as field_missing with retry_count 1.
+            first = await summarize_one(db_session, sample_paper)
+            assert first["status"] == "failed"
+            assert first["error_type"] == "field_missing"
+            assert first["retry_count"] == 1
+
+            # Second failure: the test expects the retry budget to be used up
+            # (the original note assumes SUMMARY_MAX_RETRIES=1 — TODO confirm).
+            db_session.refresh(sample_paper)
+            second = await summarize_one(db_session, sample_paper)
+            assert second["status"] == "failed"
+            assert second["retry_count"] == 2
+
+            db_session.refresh(sample_paper)
+            assert sample_paper.summary_status.status == "permanent_failure"
+
+    @pytest.mark.asyncio
+    async def test_raw_output_saved_on_failure(
+        self, db_session, sample_paper, tmp_path, _patch_paths
+    ):
+        """``raw_output.txt`` is written even when the run fails."""
+        with (
+            patch(self._DOWNLOAD_PDF, new_callable=AsyncMock),
+            patch(
+                self._CALL_PI,
+                new_callable=AsyncMock,
+                return_value="Some output without JSON",
+            ),
+        ):
+            await summarize_one(db_session, sample_paper)
+
+        paper_dir = tmp_path / "papers" / sample_paper.arxiv_id
+        raw_file = paper_dir / "raw_output.txt"
+        assert raw_file.exists()
+        assert "Some output without JSON" in raw_file.read_text()
+
+    @pytest.mark.asyncio
+    async def test_tmp_cleaned_on_success(
+        self, db_session, sample_paper, mock_pi_output, tmp_path, _patch_paths
+    ):
+        """The paper's tmp directory is gone after a successful run."""
+        with (
+            patch(self._DOWNLOAD_PDF, new_callable=AsyncMock),
+            patch(self._CALL_PI, new_callable=AsyncMock, return_value=mock_pi_output),
+        ):
+            await summarize_one(db_session, sample_paper)
+
+        scratch = tmp_path / "tmp" / sample_paper.arxiv_id
+        assert not scratch.exists()
+
+    @pytest.mark.asyncio
+    async def test_tmp_cleaned_on_failure(
+        self, db_session, sample_paper, tmp_path, _patch_paths
+    ):
+        """The paper's tmp directory is gone after a failed run as well."""
+        with (
+            patch(
+                self._DOWNLOAD_PDF,
+                new_callable=AsyncMock,
+                side_effect=PdfDownloadError("fail"),
+            ),
+        ):
+            await summarize_one(db_session, sample_paper)
+
+        scratch = tmp_path / "tmp" / sample_paper.arxiv_id
+        assert not scratch.exists()
+
+    @pytest.mark.asyncio
+    async def test_skips_done_paper(self, db_session, sample_paper, _patch_paths):
+        """A paper whose status is already ``done`` is skipped."""
+        status_row = sample_paper.summary_status
+        status_row.status = "done"
+        db_session.commit()
+
+        outcome = await summarize_one(db_session, sample_paper)
+        assert outcome["status"] == "skipped"
+
+
+# ═══════════════════════════════════════════════════════════════════════
+# 批量操作测试
+# ═══════════════════════════════════════════════════════════════════════
+
+
+class TestBatchSummarize:
+    """Batch summarisation through ``summarize_batch``."""
+
+    @pytest.fixture
+    def _patch_paths(self, tmp_path):
+        """Redirect the summarizer's data directories into ``tmp_path``."""
+        with (
+            patch("app.services.summarizer._PAPERS_DIR", tmp_path / "papers"),
+            patch("app.services.summarizer._TMP_DIR", tmp_path / "tmp"),
+            patch("app.services.summarizer._DATA_DIR", tmp_path),
+        ):
+            yield
+
+    @staticmethod
+    def _seed_pending_papers(db_session, id_prefix, count, title_prefix):
+        """Insert ``count`` papers, each with a pending SummaryStatus, and commit.
+
+        Paper ``i`` gets the arXiv id ``f"{id_prefix}{i}"``.
+        """
+        now = datetime.now(timezone.utc)
+        for i in range(count):
+            arxiv_id = f"{id_prefix}{i}"
+            paper = Paper(
+                arxiv_id=arxiv_id,
+                title_en=f"{title_prefix} {i}",
+                abstract=f"Abstract {i}",
+                paper_date=date(2024, 1, 15),
+                crawled_at=now,
+                pdf_url=f"https://arxiv.org/pdf/{arxiv_id}.pdf",
+            )
+            db_session.add(paper)
+            # Flush so ``paper.id`` exists before the status row references it.
+            db_session.flush()
+            db_session.add(SummaryStatus(paper_id=paper.id, status="pending"))
+        db_session.commit()
+
+    @staticmethod
+    def _worker_session_factory(db_engine):
+        """Return a session factory on the shared in-memory engine for batch workers."""
+        from sqlalchemy.orm import sessionmaker
+
+        return sessionmaker(bind=db_engine, autoflush=False, autocommit=False)
+
+    @pytest.mark.asyncio
+    async def test_batch_multiple_papers(
+        self, db_session, db_engine, mock_pi_output, _patch_paths
+    ):
+        """Three pending papers are all summarised and logged in CrawlLog."""
+        self._seed_pending_papers(db_session, "2401.1234", 3, "Test Paper")
+        worker_sessions = self._worker_session_factory(db_engine)
+
+        with (
+            patch("app.services.summarizer._download_pdf", new_callable=AsyncMock),
+            patch("app.services.summarizer._call_pi", new_callable=AsyncMock, return_value=mock_pi_output),
+        ):
+            result = await summarize_batch(
+                db_session, _session_factory=worker_sessions
+            )
+
+        assert result["status"] == "success"
+        assert result["done"] == 3
+        assert result["failed"] == 0
+
+        # The batch run is recorded in CrawlLog.
+        log = db_session.query(CrawlLog).filter(CrawlLog.task == "summarize").first()
+        assert log is not None
+        assert log.status == "success"
+        assert log.papers_found == 3
+
+    @pytest.mark.asyncio
+    async def test_single_failure_no_block(
+        self, db_session, db_engine, mock_pi_output, _patch_paths
+    ):
+        """One failing paper does not prevent the other from completing."""
+        self._seed_pending_papers(db_session, "2401.5678", 2, "Paper")
+        worker_sessions = self._worker_session_factory(db_engine)
+
+        call_count = 0
+
+        async def _mock_call_pi(meta_path, pdf_path):
+            # The first call times out; every later call succeeds.
+            nonlocal call_count
+            call_count += 1
+            if call_count == 1:
+                raise PiTimeoutError("timeout")
+            return mock_pi_output
+
+        with (
+            patch("app.services.summarizer._download_pdf", new_callable=AsyncMock),
+            patch("app.services.summarizer._call_pi", side_effect=_mock_call_pi),
+        ):
+            result = await summarize_batch(
+                db_session, _session_factory=worker_sessions
+            )
+
+        assert result["done"] == 1
+        assert result["failed"] == 1
+
+    @pytest.mark.asyncio
+    async def test_task_lock_conflict(self, db_session, _patch_paths):
+        """An existing running TaskLock makes the batch report a conflict."""
+        db_session.add(
+            TaskLock(
+                task="summarize",
+                lock_key="batch",
+                status="running",
+                acquired_at=datetime.now(timezone.utc),
+            )
+        )
+        db_session.commit()
+
+        result = await summarize_batch(db_session)
+        assert result["status"] == "conflict"
+
+    @pytest.mark.asyncio
+    async def test_task_lock_released(self, db_session, db_engine, mock_pi_output, _patch_paths):
+        """The TaskLock is marked finished once a batch with real work completes.
+
+        A pending paper is seeded so the batch actually processes something,
+        and the lock list is asserted to be non-empty — otherwise the
+        per-lock assertions below could pass without checking anything.
+        """
+        self._seed_pending_papers(db_session, "2401.9999", 1, "Lock Paper")
+        worker_sessions = self._worker_session_factory(db_engine)
+
+        with (
+            patch("app.services.summarizer._download_pdf", new_callable=AsyncMock),
+            patch("app.services.summarizer._call_pi", new_callable=AsyncMock, return_value=mock_pi_output),
+        ):
+            await summarize_batch(
+                db_session, _session_factory=worker_sessions
+            )
+
+        locks = db_session.query(TaskLock).filter(
+            TaskLock.task == "summarize",
+            TaskLock.lock_key == "batch",
+        ).all()
+        assert locks, "expected summarize_batch to leave a TaskLock row behind"
+        for lock in locks:
+            assert lock.status == "finished"
+            assert lock.released_at is not None
+
+    @pytest.mark.asyncio
+    async def test_batch_empty(self, db_session, _patch_paths):
+        """With no pending papers the batch succeeds with ``total == 0``."""
+        result = await summarize_batch(db_session)
+        assert result["status"] == "success"
+        assert result["total"] == 0
+
+
+# ═══════════════════════════════════════════════════════════════════════
+# Admin 路由鉴权测试
+# ═══════════════════════════════════════════════════════════════════════
+
+
+class TestAdminAuth:
+    """Authentication of the admin routes — HTTP layer only, services mocked."""
+
+    @pytest.fixture
+    def _configured_token(self, monkeypatch, admin_token):
+        """Install ``admin_token`` as ``settings.ADMIN_TOKEN`` for one test.
+
+        ``monkeypatch`` restores the previous value on teardown, replacing the
+        manual save/restore blocks and the duplicated token literal.
+        """
+        import app.config as config_mod
+
+        monkeypatch.setattr(config_mod.settings, "ADMIN_TOKEN", admin_token)
+
+    def test_no_token_returns_401(self, client):
+        """A request without a Bearer token is rejected (401 or 403)."""
+        resp = client.post("/admin/summarize")
+        assert resp.status_code in (401, 403)
+
+    def test_wrong_token_returns_401(self, client):
+        """A request with an incorrect Bearer token returns 401."""
+        resp = client.post(
+            "/admin/summarize",
+            headers={"Authorization": "Bearer wrong-token"},
+        )
+        assert resp.status_code == 401
+
+    def test_correct_token_batch(self, client, admin_headers, _configured_token):
+        """The correct token reaches the (mocked) batch summarizer and returns 200."""
+        with patch("app.routes.admin.summarize_batch", new_callable=AsyncMock) as mock:
+            mock.return_value = {"status": "success", "done": 0, "failed": 0, "total": 0}
+            resp = client.post("/admin/summarize", headers=admin_headers)
+            assert resp.status_code == 200
+            assert resp.json()["status"] == "success"
+
+    def test_single_paper_not_found(self, client, admin_headers, _configured_token):
+        """Summarising an unknown paper returns 404."""
+        with patch(
+            "app.routes.admin.summarize_single",
+            new_callable=AsyncMock,
+            return_value={"status": "not_found", "arxiv_id": "nonexistent.99999"},
+        ):
+            resp = client.post(
+                "/admin/summarize/nonexistent.99999",
+                headers=admin_headers,
+            )
+            assert resp.status_code == 404