From 4b80bd59aa2062cdbc1e2f1584994b9c15a24943 Mon Sep 17 00:00:00 2001 From: txxxxz Date: Tue, 14 Apr 2026 20:58:17 +0800 Subject: [PATCH 1/4] Add structure note workspace and generation flow --- deeptutor/api/main.py | 16 +- deeptutor/api/routers/settings.py | 9 +- deeptutor/api/routers/structure_note.py | 404 ++++ deeptutor/api/routers/system.py | 5 +- deeptutor/services/__init__.py | 3 + deeptutor/services/config/loader.py | 32 +- deeptutor/services/path_service.py | 47 +- deeptutor/services/setup/init.py | 14 +- deeptutor/services/structure_note/__init__.py | 40 + .../services/structure_note/difficulty.py | 64 + .../services/structure_note/generator.py | 571 +++++ .../services/structure_note/image_pipeline.py | 132 ++ deeptutor/services/structure_note/manager.py | 592 ++++++ .../structure_note/markdown_postprocessor.py | 252 +++ deeptutor/services/structure_note/models.py | 184 ++ .../services/structure_note/normalizer.py | 49 + .../services/structure_note/page_index.py | 108 + deeptutor/services/structure_note/planner.py | 125 ++ deeptutor/services/structure_note/renderer.py | 178 ++ deeptutor/services/structure_note/storage.py | 185 ++ .../services/structure_note/tree_builder.py | 205 ++ docs/features/overview.md | 162 ++ docs/guide/data-preparation.md | 185 ++ docs/guide/local-start.md | 190 ++ docs/guide/pre-config.md | 201 ++ docs/guide/troubleshooting.md | 170 ++ docs/index.md | 77 + docs/roadmap.md | 41 + docs/testdoc/structure-note-prd.md | 278 +++ docs/testdoc/structure-note-technical-plan.md | 539 +++++ docs/zh/features/overview.md | 57 + docs/zh/guide/data-preparation.md | 185 ++ docs/zh/guide/local-conda-cursor.md | 56 + docs/zh/guide/local-start.md | 190 ++ docs/zh/guide/pre-config.md | 201 ++ docs/zh/guide/troubleshooting.md | 48 + docs/zh/index.md | 77 + pyproject.toml | 3 + requirements/cli.txt | 1 + requirements/server.txt | 1 + tests/api/test_structure_note_router.py | 325 +++ tests/services/test_path_service.py | 94 +- 
tests/services/test_runtime_storage_guard.py | 11 +- tests/services/test_structure_note_service.py | 373 ++++ web/app/(workspace)/structure-note/page.tsx | 1876 +++++++++++++++++ web/components/sidebar/SidebarShell.tsx | 151 +- web/components/ui/Button.tsx | 51 +- web/lib/latex.ts | 287 ++- web/lib/structure-note-api.ts | 275 +++ web/locales/en/app.json | 115 +- web/locales/zh/app.json | 117 +- web/package-lock.json | 1 + web/scripts/route_budgets.mjs | 135 +- web/tests/e2e/structure-note.audit.ts | 25 + 54 files changed, 9344 insertions(+), 369 deletions(-) create mode 100644 deeptutor/api/routers/structure_note.py create mode 100644 deeptutor/services/structure_note/__init__.py create mode 100644 deeptutor/services/structure_note/difficulty.py create mode 100644 deeptutor/services/structure_note/generator.py create mode 100644 deeptutor/services/structure_note/image_pipeline.py create mode 100644 deeptutor/services/structure_note/manager.py create mode 100644 deeptutor/services/structure_note/markdown_postprocessor.py create mode 100644 deeptutor/services/structure_note/models.py create mode 100644 deeptutor/services/structure_note/normalizer.py create mode 100644 deeptutor/services/structure_note/page_index.py create mode 100644 deeptutor/services/structure_note/planner.py create mode 100644 deeptutor/services/structure_note/renderer.py create mode 100644 deeptutor/services/structure_note/storage.py create mode 100644 deeptutor/services/structure_note/tree_builder.py create mode 100644 docs/features/overview.md create mode 100644 docs/guide/data-preparation.md create mode 100644 docs/guide/local-start.md create mode 100644 docs/guide/pre-config.md create mode 100644 docs/guide/troubleshooting.md create mode 100644 docs/index.md create mode 100644 docs/roadmap.md create mode 100644 docs/testdoc/structure-note-prd.md create mode 100644 docs/testdoc/structure-note-technical-plan.md create mode 100644 docs/zh/features/overview.md create mode 100644 
docs/zh/guide/data-preparation.md create mode 100644 docs/zh/guide/local-conda-cursor.md create mode 100644 docs/zh/guide/local-start.md create mode 100644 docs/zh/guide/pre-config.md create mode 100644 docs/zh/guide/troubleshooting.md create mode 100644 docs/zh/index.md create mode 100644 tests/api/test_structure_note_router.py create mode 100644 tests/services/test_structure_note_service.py create mode 100644 web/app/(workspace)/structure-note/page.tsx create mode 100644 web/lib/structure-note-api.ts create mode 100644 web/tests/e2e/structure-note.audit.ts diff --git a/deeptutor/api/main.py b/deeptutor/api/main.py index ceee8107d..7b4aec318 100644 --- a/deeptutor/api/main.py +++ b/deeptutor/api/main.py @@ -1,9 +1,7 @@ -import logging from contextlib import asynccontextmanager -from pathlib import Path +import logging -from fastapi import FastAPI -from fastapi import HTTPException +from fastapi import FastAPI, HTTPException from fastapi.middleware.cors import CORSMiddleware from fastapi.staticfiles import StaticFiles @@ -107,6 +105,7 @@ async def lifespan(app: FastAPI): try: from deeptutor.services.tutorbot import get_tutorbot_manager + await get_tutorbot_manager().auto_start_bots() except Exception as e: logger.warning(f"Failed to auto-start TutorBots: {e}") @@ -119,6 +118,7 @@ async def lifespan(app: FastAPI): # Stop TutorBots try: from deeptutor.services.tutorbot import get_tutorbot_manager + await get_tutorbot_manager().stop_all() logger.info("TutorBots stopped") except Exception as e: @@ -207,14 +207,15 @@ async def selective_access_log(request, call_next): notebook, plugins_api, question, + question_notebook, sessions, settings, solve, + structure_note, system, tutorbot, unified_ws, vision_solver, - question_notebook, ) # Include routers @@ -226,9 +227,12 @@ async def selective_access_log(request, call_next): app.include_router(co_writer.router, prefix="/api/v1/co_writer", tags=["co_writer"]) app.include_router(notebook.router, prefix="/api/v1/notebook", 
tags=["notebook"]) app.include_router(guide.router, prefix="/api/v1/guide", tags=["guide"]) +app.include_router(structure_note.router, prefix="/api/v1/structure-note", tags=["structure-note"]) app.include_router(memory.router, prefix="/api/v1/memory", tags=["memory"]) app.include_router(sessions.router, prefix="/api/v1/sessions", tags=["sessions"]) -app.include_router(question_notebook.router, prefix="/api/v1/question-notebook", tags=["question-notebook"]) +app.include_router( + question_notebook.router, prefix="/api/v1/question-notebook", tags=["question-notebook"] +) app.include_router(settings.router, prefix="/api/v1/settings", tags=["settings"]) app.include_router(system.router, prefix="/api/v1/system", tags=["system"]) app.include_router(plugins_api.router, prefix="/api/v1/plugins", tags=["plugins"]) diff --git a/deeptutor/api/routers/settings.py b/deeptutor/api/routers/settings.py index 23a26ff7c..fb6bdb6a7 100644 --- a/deeptutor/api/routers/settings.py +++ b/deeptutor/api/routers/settings.py @@ -29,7 +29,14 @@ DEFAULT_SIDEBAR_NAV_ORDER = { "start": ["/", "/history", "/knowledge", "/notebook"], - "learnResearch": ["/question", "/solver", "/guide", "/research", "/co_writer"], + "learnResearch": [ + "/question", + "/solver", + "/guide", + "/structure-note", + "/research", + "/co_writer", + ], } DEFAULT_UI_SETTINGS = { diff --git a/deeptutor/api/routers/structure_note.py b/deeptutor/api/routers/structure_note.py new file mode 100644 index 000000000..7c5677392 --- /dev/null +++ b/deeptutor/api/routers/structure_note.py @@ -0,0 +1,404 @@ +""" +Structure Note API Router +========================= + +Independent workspace for turning PDF/PPT/PPTX course materials into structured notes. 
+""" + +from __future__ import annotations + +from datetime import datetime +import json +from pathlib import Path, PurePosixPath +import shutil +from uuid import uuid4 + +from fastapi import APIRouter, BackgroundTasks, File, Form, HTTPException, UploadFile +from fastapi.responses import StreamingResponse + +from deeptutor.api.utils.task_id_manager import TaskIDManager +from deeptutor.api.utils.task_log_stream import get_task_stream_manager +from deeptutor.logging import get_logger +from deeptutor.services.config import PROJECT_ROOT, load_config_with_main +from deeptutor.services.structure_note import ( + DifficultyLevel, + ExplanationStyleLevel, + JobStatus, + NoteLanguage, + StructureNoteManager, +) +from deeptutor.utils.document_validator import DocumentValidator + +router = APIRouter() +_structure_note_manager: StructureNoteManager | None = None +_kb_base_dir = PROJECT_ROOT / "data" / "knowledge_bases" +_accepted_source_extensions = {".pdf", ".ppt", ".pptx"} + +try: + config = load_config_with_main("main.yaml", PROJECT_ROOT) +except FileNotFoundError: + config = {} +log_dir = config.get("paths", {}).get("user_log_dir") or config.get("logging", {}).get("log_dir") +logger = get_logger("StructureNote", level="INFO", log_dir=log_dir) + + +def get_structure_note_manager() -> StructureNoteManager: + global _structure_note_manager + if _structure_note_manager is None: + _structure_note_manager = StructureNoteManager() + return _structure_note_manager + + +def _build_unique_task_id(task_type: str, task_key_prefix: str) -> str: + task_manager = TaskIDManager.get_instance() + task_key = f"{task_key_prefix}_{datetime.now().isoformat()}_{uuid4().hex[:8]}" + return task_manager.generate_task_id(task_type, task_key) + + +def _emit_log(task_id: str, message: str) -> None: + manager = get_task_stream_manager() + manager.ensure_task(task_id) + manager.emit_log(task_id, message) + logger.info(f"[{task_id}] {message}") + + +def _save_upload(file: UploadFile, target_dir: Path) -> 
tuple[Path, str, int]: + safe_name = DocumentValidator.validate_upload_safety( + file.filename or "upload", + None, + allowed_extensions={".pdf", ".ppt", ".pptx"}, + ) + target_dir.mkdir(parents=True, exist_ok=True) + target_path = target_dir / safe_name + written_bytes = 0 + with open(target_path, "wb") as handle: + for chunk in iter(lambda: file.file.read(8192), b""): + written_bytes += len(chunk) + if written_bytes > DocumentValidator.MAX_FILE_SIZE: + raise HTTPException(status_code=400, detail="Uploaded file exceeds the size limit.") + handle.write(chunk) + + DocumentValidator.validate_upload_safety( + safe_name, + written_bytes, + allowed_extensions={".pdf", ".ppt", ".pptx"}, + ) + return target_path, safe_name, written_bytes + + +def _validate_kb_file_id(file_id: str) -> PurePosixPath: + relative_path = PurePosixPath(file_id) + if ( + relative_path.is_absolute() + or not relative_path.parts + or any(part in {"", ".", ".."} for part in relative_path.parts) + ): + raise HTTPException(status_code=400, detail="Invalid Knowledge Base file id.") + return relative_path + + +def _is_safe_kb_name(kb_name: str) -> bool: + relative_name = PurePosixPath(kb_name) + return ( + not relative_name.is_absolute() + and len(relative_name.parts) == 1 + and all(part not in {"", ".", ".."} for part in relative_name.parts) + ) + + +def _validate_kb_name(kb_name: str) -> str: + if not _is_safe_kb_name(kb_name): + raise HTTPException(status_code=400, detail="Invalid Knowledge Base name.") + return PurePosixPath(kb_name).name + + +def _list_kb_names_readonly() -> list[str]: + kb_names: set[str] = set() + config_path = _kb_base_dir / "kb_config.json" + if config_path.exists(): + try: + payload = json.loads(config_path.read_text(encoding="utf-8")) + knowledge_bases = payload.get("knowledge_bases", {}) + if isinstance(knowledge_bases, dict): + kb_names.update( + str(name) for name in knowledge_bases.keys() if _is_safe_kb_name(str(name)) + ) + except Exception as exc: + 
logger.warning(f"Failed to read Knowledge Base config for Structure Note: {exc}") + + if _kb_base_dir.exists(): + for item in _kb_base_dir.iterdir(): + if not item.is_dir() or item.name.startswith(("__", ".")): + continue + if ( + (item / "raw").exists() + or (item / "llamaindex_storage").exists() + or (item / "rag_storage").exists() + ): + kb_names.add(item.name) + + return sorted(kb_names) + + +def _kb_raw_dir(kb_name: str) -> Path: + safe_kb_name = _validate_kb_name(kb_name) + if safe_kb_name not in _list_kb_names_readonly(): + raise HTTPException(status_code=404, detail="Knowledge Base not found.") + + base_dir = _kb_base_dir.resolve() + kb_dir = (base_dir / safe_kb_name).resolve() + try: + kb_dir.relative_to(base_dir) + except ValueError: + raise HTTPException(status_code=400, detail="Invalid Knowledge Base name.") + return kb_dir / "raw" + + +def _resolve_kb_source_file(kb_name: str, file_id: str) -> Path: + relative_path = _validate_kb_file_id(file_id) + raw_dir = _kb_raw_dir(kb_name).resolve() + source_path = (raw_dir / Path(*relative_path.parts)).resolve() + try: + source_path.relative_to(raw_dir) + except ValueError: + raise HTTPException(status_code=400, detail="Invalid Knowledge Base file id.") + + if not source_path.exists() or not source_path.is_file(): + raise HTTPException(status_code=404, detail="Knowledge Base file not found.") + if source_path.suffix.lower() not in _accepted_source_extensions: + raise HTTPException( + status_code=400, detail="Structure Note accepts PDF, PPT, or PPTX only." 
+ ) + return source_path + + +def _list_kb_source_files() -> list[dict]: + groups: list[dict] = [] + for kb_name in _list_kb_names_readonly(): + raw_dir = _kb_raw_dir(kb_name) + files: list[dict] = [] + if raw_dir.exists(): + for source_path in sorted(raw_dir.rglob("*"), key=lambda item: item.as_posix()): + if not source_path.is_file(): + continue + if source_path.suffix.lower() not in _accepted_source_extensions: + continue + stat = source_path.stat() + file_id = source_path.relative_to(raw_dir).as_posix() + files.append( + { + "file_id": file_id, + "file_name": source_path.name, + "display_path": file_id, + "size_bytes": stat.st_size, + "updated_at": datetime.fromtimestamp(stat.st_mtime).isoformat(), + } + ) + + groups.append({"kb_name": kb_name, "files": files}) + return groups + + +async def _run_structure_note_job(job_id: str, task_id: str) -> None: + stream_manager = get_task_stream_manager() + stream_manager.ensure_task(task_id) + manager = get_structure_note_manager() + artifact = await manager.run_job(job_id, task_id, _emit_log) + if artifact.status == JobStatus.READY: + stream_manager.emit_complete(task_id, "Structure Note completed") + else: + stream_manager.emit_failed(task_id, artifact.error or "Structure Note failed") + + +@router.post("/jobs") +async def create_job( + background_tasks: BackgroundTasks, + file: UploadFile = File(...), + difficulty_level: DifficultyLevel = Form(DifficultyLevel.MEDIUM), + note_language: NoteLanguage = Form(NoteLanguage.ZH), + style_level: ExplanationStyleLevel = Form(ExplanationStyleLevel.MEDIUM), + project_name: str | None = Form(None), +): + manager = get_structure_note_manager() + task_id = _build_unique_task_id("structure_note", file.filename or "upload") + get_task_stream_manager().ensure_task(task_id) + + source_format = Path(file.filename or "").suffix.lower().lstrip(".") + if source_format not in {"pdf", "ppt", "pptx"}: + raise HTTPException( + status_code=400, detail="Structure Note accepts PDF, PPT, or PPTX 
only." + ) + + job_id = f"structure_note_{datetime.utcnow().strftime('%Y%m%d_%H%M%S')}_{uuid4().hex[:8]}" + job_dirs = manager.storage.ensure_job_dirs(job_id) + source_path, safe_name, _ = _save_upload(file, job_dirs["source"]) + + target_project_name = ( + project_name.strip() if project_name and project_name.strip() else "Local Uploads" + ) + try: + artifact = manager.create_job( + file_name=safe_name, + source_format=source_format, + difficulty_level=difficulty_level, + note_language=note_language, + style_level=style_level, + source_path=source_path, + task_id=task_id, + job_id=job_id, + project_name=target_project_name, + note_title=Path(safe_name).stem, + source_kind="upload", + source_ref={"file_name": safe_name}, + ) + except ValueError as exc: + raise HTTPException(status_code=400, detail=str(exc)) + _emit_log(task_id, f"Created Structure Note job for `{safe_name}`.") + background_tasks.add_task(_run_structure_note_job, artifact.job_id, task_id) + return manager.serialize_job(artifact) + + +@router.get("/jobs") +async def list_jobs(): + manager = get_structure_note_manager() + return {"jobs": [manager.serialize_job(job) for job in manager.list_jobs()]} + + +@router.get("/projects") +async def list_projects(): + manager = get_structure_note_manager() + return {"projects": [project.model_dump(mode="json") for project in manager.list_projects()]} + + +@router.post("/projects") +async def create_project(name: str = Form(...)): + manager = get_structure_note_manager() + try: + project = manager.create_project(name) + except ValueError as exc: + raise HTTPException(status_code=400, detail=str(exc)) + return project.model_dump(mode="json") + + +@router.post("/projects/{project_name}/rename") +async def rename_project(project_name: str, new_name: str = Form(...)): + manager = get_structure_note_manager() + try: + project = manager.rename_project(project_name, new_name) + except FileNotFoundError: + raise HTTPException(status_code=404, detail="Project not found.") 
+ except ValueError as exc: + raise HTTPException(status_code=400, detail=str(exc)) + return project.model_dump(mode="json") + + +@router.delete("/projects/{project_name}") +async def delete_project(project_name: str): + manager = get_structure_note_manager() + try: + deleted_job_ids = manager.delete_project(project_name) + except FileNotFoundError: + raise HTTPException(status_code=404, detail="Project not found.") + except ValueError as exc: + raise HTTPException(status_code=400, detail=str(exc)) + return {"deleted_job_ids": deleted_job_ids} + + +@router.get("/kb/files") +async def list_knowledge_base_source_files(): + return {"knowledge_bases": _list_kb_source_files()} + + +@router.post("/jobs/from-kb") +async def create_job_from_knowledge_base( + background_tasks: BackgroundTasks, + kb_name: str = Form(...), + file_id: str = Form(...), + difficulty_level: DifficultyLevel = Form(DifficultyLevel.MEDIUM), + note_language: NoteLanguage = Form(NoteLanguage.ZH), + style_level: ExplanationStyleLevel = Form(ExplanationStyleLevel.MEDIUM), + project_name: str | None = Form(None), +): + source_file = _resolve_kb_source_file(kb_name, file_id) + safe_name = DocumentValidator.validate_upload_safety( + source_file.name, + source_file.stat().st_size, + allowed_extensions=_accepted_source_extensions, + ) + source_format = source_file.suffix.lower().lstrip(".") + + manager = get_structure_note_manager() + task_id = _build_unique_task_id("structure_note", f"{kb_name}_{safe_name}") + get_task_stream_manager().ensure_task(task_id) + + job_id = f"structure_note_{datetime.utcnow().strftime('%Y%m%d_%H%M%S')}_{uuid4().hex[:8]}" + job_dirs = manager.storage.ensure_job_dirs(job_id) + snapshot_path = job_dirs["source"] / safe_name + shutil.copy2(source_file, snapshot_path) + + target_project_name = project_name.strip() if project_name and project_name.strip() else kb_name + try: + artifact = manager.create_job( + file_name=safe_name, + source_format=source_format, + 
difficulty_level=difficulty_level, + note_language=note_language, + style_level=style_level, + source_path=snapshot_path, + task_id=task_id, + job_id=job_id, + project_name=target_project_name, + note_title=Path(file_id).stem, + source_kind="knowledge_base", + source_ref={ + "kb_name": kb_name, + "file_id": file_id, + "file_name": source_file.name, + }, + ) + except ValueError as exc: + raise HTTPException(status_code=400, detail=str(exc)) + _emit_log( + task_id, f"Created Structure Note job for `{safe_name}` from Knowledge Base `{kb_name}`." + ) + background_tasks.add_task(_run_structure_note_job, artifact.job_id, task_id) + return manager.serialize_job(artifact) + + +@router.get("/jobs/{job_id}") +async def get_job(job_id: str): + manager = get_structure_note_manager() + try: + return manager.serialize_job(manager.get_job(job_id)) + except FileNotFoundError: + raise HTTPException(status_code=404, detail="Structure Note job not found") + + +@router.post("/jobs/{job_id}/retry") +async def retry_job(job_id: str, background_tasks: BackgroundTasks): + manager = get_structure_note_manager() + try: + artifact = manager.get_job(job_id) + except FileNotFoundError: + raise HTTPException(status_code=404, detail="Structure Note job not found") + + if artifact.status != JobStatus.FAILED: + raise HTTPException(status_code=409, detail="Only failed jobs can be retried.") + + task_id = _build_unique_task_id("structure_note_retry", job_id) + get_task_stream_manager().ensure_task(task_id) + artifact = manager.update_status(artifact, JobStatus.QUEUED, error=None, task_id=task_id) + _emit_log(task_id, f"Retrying Structure Note job `{artifact.file_name}`.") + background_tasks.add_task(_run_structure_note_job, artifact.job_id, task_id) + return manager.serialize_job(artifact) + + +@router.get("/tasks/{task_id}/stream") +async def stream_task(task_id: str): + manager = get_task_stream_manager() + manager.ensure_task(task_id) + return StreamingResponse( + manager.stream(task_id), + 
media_type="text/event-stream", + headers={"Cache-Control": "no-cache", "X-Accel-Buffering": "no"}, + ) diff --git a/deeptutor/api/routers/system.py b/deeptutor/api/routers/system.py index bfe061b05..0463a78fa 100644 --- a/deeptutor/api/routers/system.py +++ b/deeptutor/api/routers/system.py @@ -52,6 +52,7 @@ async def get_runtime_topology(): ], "isolated_subsystems": [ {"router": "guide", "mode": "independent_subsystem"}, + {"router": "structure_note", "mode": "independent_subsystem"}, {"router": "co_writer", "mode": "independent_subsystem"}, {"router": "plugins_api", "mode": "playground_transport"}, ], @@ -292,7 +293,9 @@ async def test_search_connection(): ) except ValueError as e: - return TestResponse(success=False, message=f"Search configuration error: {e!s}", error=str(e)) + return TestResponse( + success=False, message=f"Search configuration error: {e!s}", error=str(e) + ) except Exception as e: response_time = (time.time() - start_time) * 1000 return TestResponse( diff --git a/deeptutor/services/__init__.py b/deeptutor/services/__init__.py index 167b90c3e..75e938001 100644 --- a/deeptutor/services/__init__.py +++ b/deeptutor/services/__init__.py @@ -50,6 +50,7 @@ "rag", "prompt", "search", + "structure_note", "setup", "session", "config", @@ -71,6 +72,8 @@ def __getattr__(name: str): return importlib.import_module(f"{__name__}.search") if name == "setup": return importlib.import_module(f"{__name__}.setup") + if name == "structure_note": + return importlib.import_module(f"{__name__}.structure_note") if name == "session": return importlib.import_module(f"{__name__}.session") if name == "config": diff --git a/deeptutor/services/config/loader.py b/deeptutor/services/config/loader.py index 30e46f996..08bf5cab6 100644 --- a/deeptutor/services/config/loader.py +++ b/deeptutor/services/config/loader.py @@ -23,12 +23,19 @@ # .parent.parent.parent.parent = DeepTutor/ (project root) PROJECT_ROOT = Path(__file__).resolve().parent.parent.parent.parent 
+_DEFAULT_MAIN_CONFIG: dict[str, Any] = { + "system": {"language": "en"}, + "logging": {"level": "WARNING", "save_to_file": True, "console_output": True}, + "tools": {"run_code": {}}, +} + def get_runtime_settings_dir(project_root: Path | None = None) -> Path: """Return the canonical runtime settings directory under ``data/user/settings``.""" root = project_root or PROJECT_ROOT return root / "data" / "user" / "settings" + def _deep_merge(base: dict[str, Any], override: dict[str, Any]) -> dict[str, Any]: """ Deep merge two dictionaries, values in override will override values in base @@ -74,6 +81,7 @@ def _inject_runtime_paths(config: dict[str, Any]) -> dict[str, Any]: "user_log_dir": str(path_service.get_logs_dir()), "performance_log_dir": str(path_service.get_logs_dir() / "performance"), "guide_output_dir": str(path_service.get_guide_dir()), + "structure_note_output_dir": str(path_service.get_structure_note_dir()), "question_output_dir": str(path_service.get_chat_feature_dir("deep_question")), "research_output_dir": str(path_service.get_research_dir()), "research_reports_dir": str(path_service.get_research_reports_dir()), @@ -87,6 +95,14 @@ async def _load_yaml_file_async(file_path: Path) -> dict[str, Any]: return await asyncio.to_thread(_load_yaml_file, file_path) +def _load_main_config(project_root: Path) -> dict[str, Any]: + settings_dir = get_runtime_settings_dir(project_root) + main_path = settings_dir / "main.yaml" + if main_path.exists(): + return _load_yaml_file(main_path) + return _DEFAULT_MAIN_CONFIG.copy() + + def resolve_config_path( config_file: str, project_root: Path | None = None, @@ -108,8 +124,7 @@ def resolve_config_path( if config_path.exists(): return config_path, False raise FileNotFoundError( - f"Configuration file not found: {config_file} " - f"(expected under {settings_dir})" + f"Configuration file not found: {config_file} (expected under {settings_dir})" ) @@ -127,8 +142,12 @@ def load_config_with_main(config_file: str, project_root: Path 
| None = None) -> if project_root is None: project_root = PROJECT_ROOT + base_config = _load_main_config(project_root) + if config_file == "main.yaml": + return _inject_runtime_paths(base_config) + config_path, _ = resolve_config_path(config_file, project_root) - return _inject_runtime_paths(_load_yaml_file(config_path)) + return _inject_runtime_paths(_deep_merge(base_config, _load_yaml_file(config_path))) async def load_config_with_main_async( @@ -149,8 +168,13 @@ async def load_config_with_main_async( if project_root is None: project_root = PROJECT_ROOT + base_config = _load_main_config(project_root) + if config_file == "main.yaml": + return _inject_runtime_paths(base_config) + config_path, _ = resolve_config_path(config_file, project_root) - return _inject_runtime_paths(await _load_yaml_file_async(config_path)) + module_config = await _load_yaml_file_async(config_path) + return _inject_runtime_paths(_deep_merge(base_config, module_config)) def get_path_from_config(config: dict[str, Any], path_key: str, default: str = None) -> str: diff --git a/deeptutor/services/path_service.py b/deeptutor/services/path_service.py index c3f7cd2b4..15f99a8b0 100644 --- a/deeptutor/services/path_service.py +++ b/deeptutor/services/path_service.py @@ -13,6 +13,7 @@ ├── notebook/ ├── co-writer/ ├── guide/ + ├── structure_note/ └── chat/ ├── chat/ ├── deep_solve/ @@ -32,6 +33,7 @@ "research", "co-writer", "guide", + "structure_note", "run_code_workspace", "logs", "math_animator", @@ -51,6 +53,7 @@ "notebook", "co-writer", "guide", + "structure_note", "chat", ] @@ -68,6 +71,7 @@ class PathService: "math_animator": ("chat", "math_animator"), "co-writer": ("co-writer", None), "guide": ("guide", None), + "structure_note": ("structure_note", None), "run_code_workspace": ("chat", "_detached_code_execution"), } _PRIVATE_SUFFIXES = {".json", ".sqlite", ".db", ".md", ".yaml", ".yml", ".py", ".log"} @@ -128,17 +132,32 @@ def is_public_output_path(self, path: str | Path) -> bool: if not 
candidate.is_file(): return False - if candidate.suffix.lower() in self._PRIVATE_SUFFIXES: + parts = relative.parts + suffix = candidate.suffix.lower() + if len(parts) >= 5 and parts[:2] == ("workspace", "structure_note"): + if parts[3] == "final" and suffix in {".pdf", ".md"}: + return True + if parts[3] == "images" and suffix in {".png", ".jpg", ".jpeg", ".webp", ".gif"}: + return True + + if suffix in self._PRIVATE_SUFFIXES: return False - parts = relative.parts if parts[:3] == ("workspace", "co-writer", "audio"): return True - if len(parts) >= 5 and parts[:3] == ("workspace", "chat", "deep_solve") and "artifacts" in parts[4:]: + if ( + len(parts) >= 5 + and parts[:3] == ("workspace", "chat", "deep_solve") + and "artifacts" in parts[4:] + ): return True - if len(parts) >= 5 and parts[:3] == ("workspace", "chat", "math_animator") and "artifacts" in parts[4:]: + if ( + len(parts) >= 5 + and parts[:3] == ("workspace", "chat", "math_animator") + and "artifacts" in parts[4:] + ): return True if len(parts) >= 5 and parts[:2] == ("workspace", "chat") and "code_runs" in parts[3:]: @@ -183,9 +202,16 @@ def get_session_workspace(self, feature: str, session_id: str) -> Path: return session_root / session_id def _resolve_feature_root(self, feature: str) -> Path: - if feature in {"chat", "deep_solve", "deep_question", "deep_research", "math_animator", "_detached_code_execution"}: + if feature in { + "chat", + "deep_solve", + "deep_question", + "deep_research", + "math_animator", + "_detached_code_execution", + }: return self.get_chat_feature_dir(feature) # type: ignore[arg-type] - if feature in {"memory", "notebook", "co-writer", "guide"}: + if feature in {"memory", "notebook", "co-writer", "guide", "structure_note"}: return self.get_workspace_feature_dir(feature) # type: ignore[arg-type] raise ValueError(f"Unknown workspace feature: {feature}") @@ -224,6 +250,7 @@ def get_memory_dir(self) -> Path: target = new_dir / f.name if not target.exists(): import shutil + 
shutil.copy2(f, target) return new_dir @@ -272,6 +299,12 @@ def get_guide_dir(self) -> Path: def get_guide_session_file(self, session_id: str) -> Path: return self.get_guide_dir() / f"session_{session_id}.json" + def get_structure_note_dir(self) -> Path: + return self.get_workspace_feature_dir("structure_note") + + def get_structure_note_job_dir(self, job_id: str) -> Path: + return self.get_structure_note_dir() / job_id + def get_run_code_workspace_dir(self) -> Path: return self.get_chat_feature_dir("_detached_code_execution") @@ -314,7 +347,7 @@ def ensure_all_directories(self) -> None: self.ensure_memory_dir() self.ensure_notebook_dir() self.get_logs_dir().mkdir(parents=True, exist_ok=True) - for feature in ("co-writer", "guide"): + for feature in ("co-writer", "guide", "structure_note"): self.get_workspace_feature_dir(feature).mkdir(parents=True, exist_ok=True) for feature in ( "chat", diff --git a/deeptutor/services/setup/init.py b/deeptutor/services/setup/init.py index 7feecc8ce..0d21470b9 100644 --- a/deeptutor/services/setup/init.py +++ b/deeptutor/services/setup/init.py @@ -22,7 +22,14 @@ "sidebar_description": "✨ Data Intelligence Lab @ HKU", "sidebar_nav_order": { "start": ["/", "/history", "/knowledge", "/notebook"], - "learnResearch": ["/question", "/solver", "/guide", "/research", "/co_writer"], + "learnResearch": [ + "/question", + "/solver", + "/guide", + "/structure-note", + "/research", + "/co_writer", + ], }, } @@ -120,7 +127,7 @@ def init_user_directories(project_root: Path | None = None) -> None: This function uses lazy initialization - directories are created on-demand when files are saved, rather than pre-creating all directories at startup. - + Only essential configuration files (like settings/interface.json) are created at startup if they don't exist. 
@@ -137,6 +144,7 @@ def init_user_directories(project_root: Path | None = None) -> None: ├── memory/ ├── co-writer/ ├── guide/ + ├── structure_note/ └── chat/ ├── chat/ ├── deep_solve/ @@ -160,7 +168,7 @@ def init_user_directories(project_root: Path | None = None) -> None: def _ensure_essential_settings(path_service) -> None: """ Ensure essential settings files exist. - + This is the minimal initialization needed at startup. All other directories are created on-demand when files are saved. """ diff --git a/deeptutor/services/structure_note/__init__.py b/deeptutor/services/structure_note/__init__.py new file mode 100644 index 000000000..2b2e7d614 --- /dev/null +++ b/deeptutor/services/structure_note/__init__.py @@ -0,0 +1,40 @@ +from .difficulty import DifficultyPreset, get_difficulty_preset +from .manager import StructureNoteManager +from .models import ( + CitationEntry, + DifficultyLevel, + DocumentPlan, + ExplanationStyleLevel, + GenerationChunk, + ImagePlaceholder, + JobStatus, + NoteLanguage, + PageIndexPage, + SectionEvidence, + SectionPlan, + SectionTreeNode, + StructureNoteArtifact, + StructureNoteProject, +) +from .storage import StructureNoteStorage + +__all__ = [ + "CitationEntry", + "DifficultyLevel", + "DifficultyPreset", + "DocumentPlan", + "ExplanationStyleLevel", + "GenerationChunk", + "ImagePlaceholder", + "JobStatus", + "NoteLanguage", + "PageIndexPage", + "SectionEvidence", + "SectionPlan", + "SectionTreeNode", + "StructureNoteArtifact", + "StructureNoteManager", + "StructureNoteProject", + "StructureNoteStorage", + "get_difficulty_preset", +] diff --git a/deeptutor/services/structure_note/difficulty.py b/deeptutor/services/structure_note/difficulty.py new file mode 100644 index 000000000..ad7cc3b8e --- /dev/null +++ b/deeptutor/services/structure_note/difficulty.py @@ -0,0 +1,64 @@ +from __future__ import annotations + +from dataclasses import dataclass + +from .models import DifficultyLevel + + +@dataclass(frozen=True) +class DifficultyPreset: 
+ level: DifficultyLevel + page_window: int + depth_instruction: str + compression_instruction: str + placeholder_purpose: str + + +PRESETS: dict[DifficultyLevel, DifficultyPreset] = { + DifficultyLevel.SIMPLE: DifficultyPreset( + level=DifficultyLevel.SIMPLE, + page_window=10, + depth_instruction=( + "Simple controls how much to cover: keep only the core thread, key concepts, " + "essential conclusions, and any indispensable bridge needed to understand them. " + "Short does not mean shallow." + ), + compression_instruction=( + "Compress by deleting repeated background, template transitions, low-information summaries, " + "and meta commentary. Preserve precise definitions, key mechanisms, critical formulas or " + "arguments, and the shortest logical bridge between ideas." + ), + placeholder_purpose="key_figure", + ), + DifficultyLevel.MEDIUM: DifficultyPreset( + level=DifficultyLevel.MEDIUM, + page_window=10, + depth_instruction=( + "Medium controls how much to cover: include the main knowledge points and the core logic chain " + "needed for a normal classroom handout." + ), + compression_instruction=( + "Compress by merging duplicated examples and background while retaining the main concepts, " + "mechanisms, evidence, and topic-to-topic reasoning." + ), + placeholder_purpose="supporting_figure", + ), + DifficultyLevel.DETAILED: DifficultyPreset( + level=DifficultyLevel.DETAILED, + page_window=6, + depth_instruction=( + "Detailed controls how much to cover: preserve a fuller knowledge structure, including " + "intermediate steps, boundary cases, supporting examples, and derivation or argument details " + "when they are present in the evidence." + ), + compression_instruction=( + "Compress only low-value repetition and boilerplate. Keep the complete conceptual chain, " + "important qualifications, examples, mechanisms, and source-supported derivation details." 
+ ), + placeholder_purpose="detailed_figure", + ), +} + + +def get_difficulty_preset(level: DifficultyLevel) -> DifficultyPreset: + return PRESETS[level] diff --git a/deeptutor/services/structure_note/generator.py b/deeptutor/services/structure_note/generator.py new file mode 100644 index 000000000..a43d125e6 --- /dev/null +++ b/deeptutor/services/structure_note/generator.py @@ -0,0 +1,571 @@ +from __future__ import annotations + +from collections.abc import Iterable +import re + +from deeptutor.services.llm import complete as llm_complete + +from .difficulty import DifficultyPreset +from .markdown_postprocessor import normalize_structure_note_markdown +from .models import ( + DifficultyLevel, + DocumentPlan, + ExplanationStyleLevel, + GenerationChunk, + NoteLanguage, + PageIndexPage, + SectionEvidence, + SectionPlan, + SectionTreeNode, +) + + +def _pages_by_number(pages: Iterable[PageIndexPage]) -> dict[int, PageIndexPage]: + return {page.page_number: page for page in pages} + + +def build_generation_chunks( + pages: list[PageIndexPage], + sections: list[SectionTreeNode], + preset: DifficultyPreset, + document_plan: DocumentPlan | None = None, +) -> list[GenerationChunk]: + chunks: list[GenerationChunk] = [] + chunk_index = 1 + + if document_plan and document_plan.outline: + section_lookup = {section.section_id: section for section in document_plan.outline} + tree_lookup = {section.section_id: section for section in sections} + ordered_plans = [ + section_lookup[section_id] + for section_id in document_plan.section_order + if section_id in section_lookup + ] + for plan in ordered_plans: + page_numbers = plan.page_numbers + evidence = plan.evidence + tree_node = tree_lookup.get(plan.section_id) + if tree_node and tree_node.child_ids: + child_starts = [ + tree_lookup[child_id].page_start + for child_id in tree_node.child_ids + if child_id in tree_lookup + ] + if child_starts: + overview_end = min(plan.page_end, min(child_starts) - 1) + page_numbers = 
list(range(plan.page_start, overview_end + 1)) + if not page_numbers: + page_numbers = [plan.page_start] + evidence = [ + item for item in plan.evidence if item.page_number in set(page_numbers) + ] + if not page_numbers: + continue + chunks.append( + _chunk_from_plan(plan, chunk_index, page_numbers=page_numbers, evidence=evidence) + ) + chunk_index += 1 + elif sections: + ordered_sections = sorted( + sections, key=lambda item: (item.page_start, item.level, item.section_id) + ) + for section in ordered_sections: + page_numbers = list(range(section.page_start, section.page_end + 1)) + if not page_numbers: + continue + chunks.append( + GenerationChunk( + chunk_id=f"chunk-{chunk_index:03d}", + section_id=section.section_id, + section_title=section.title, + section_path=section.path or [section.title], + section_summary=section.summary, + heading_level=max(2, min(section.level, 5)), + page_start=page_numbers[0], + page_end=page_numbers[-1], + page_numbers=page_numbers, + ) + ) + chunk_index += 1 + else: + for start in range(1, len(pages) + 1, preset.page_window): + window = list(range(start, min(start + preset.page_window, len(pages) + 1))) + title = f"Pages {window[0]}-{window[-1]}" if len(window) > 1 else f"Page {window[0]}" + chunks.append( + GenerationChunk( + chunk_id=f"chunk-{chunk_index:03d}", + section_title=title, + section_path=[title], + page_start=window[0], + page_end=window[-1], + page_numbers=window, + ) + ) + chunk_index += 1 + + return chunks + + +def _chunk_from_plan( + plan: SectionPlan, + chunk_index: int, + *, + page_numbers: list[int] | None = None, + evidence: list[SectionEvidence] | None = None, +) -> GenerationChunk: + resolved_pages = page_numbers or plan.page_numbers + return GenerationChunk( + chunk_id=f"chunk-{chunk_index:03d}", + section_id=plan.section_id, + section_title=plan.title, + section_path=plan.section_path or [plan.title], + section_summary=plan.summary, + heading_level=max(2, min(plan.level, 5)), + page_start=resolved_pages[0], 
+ page_end=resolved_pages[-1], + page_numbers=resolved_pages, + evidence=evidence if evidence is not None else plan.evidence, + dependencies=plan.dependencies, + ) + + +def _build_page_context( + page_lookup: dict[int, PageIndexPage], + page_numbers: list[int], + evidence: list[SectionEvidence], +) -> str: + parts: list[str] = [] + evidence_lookup = {item.page_number: item for item in evidence} + for page_number in page_numbers: + page = page_lookup.get(page_number) + if not page: + continue + evidence_item = evidence_lookup.get(page_number) + excerpt = evidence_item.excerpt if evidence_item else page.text.strip() + if len(excerpt) > 1800: + excerpt = f"{excerpt[:1800]}\n..." + title_candidates = ( + evidence_item.title_candidates + if evidence_item + else [candidate.text for candidate in page.title_candidates[:5]] + ) + image_candidate_ids = ( + evidence_item.image_candidate_ids + if evidence_item + else [candidate.candidate_id for candidate in page.image_candidates[:8]] + ) + metadata = [] + if title_candidates: + metadata.append(f"title candidates: {title_candidates}") + if image_candidate_ids: + metadata.append(f"image candidates: {image_candidate_ids}") + suffix = f"\n({'; '.join(metadata)})" if metadata else "" + parts.append(f"[Page {page_number}]{suffix}\n{excerpt}") + return "\n\n".join(parts) + + +def _fallback_markdown( + chunk: GenerationChunk, page_lookup: dict[int, PageIndexPage], language: str +) -> str: + heading = "#" * max(2, min(chunk.heading_level, 5)) + title = " / ".join(chunk.section_path) + source_range = ( + f"Pages {chunk.page_start}-{chunk.page_end}" + if chunk.page_start != chunk.page_end + else f"Page {chunk.page_start}" + ) + if language == "zh": + intro = f"本节根据第 {chunk.page_start}-{chunk.page_end} 页内容整理。" + summary_label = "本节小结" + source_label = "来源线索" + empty = "该页范围未提取到可用文本。" + else: + intro = f"This section synthesizes the material from {source_range.lower()}." 
+ summary_label = "Section Summary" + source_label = "Source Notes" + empty = "No extractable text was found for this section range." + source_notes: list[str] = [] + for page_number in chunk.page_numbers: + page = page_lookup.get(page_number) + if not page or not page.text.strip(): + continue + excerpt = page.text.strip().replace("\n", " ") + if len(excerpt) > 360: + excerpt = f"{excerpt[:360]}..." + source_notes.append(f"- Page {page_number}: {excerpt}") + if not source_notes: + source_notes.append(f"- {empty}") + summary = chunk.section_summary or empty + return ( + f"{heading} {title}\n\n" + f"{intro}\n\n" + f"### {source_label}\n\n" + + "\n".join(source_notes) + + f"\n\n> **{summary_label}:** {summary}\n" + ) + + +def _strip_markdown_fence(content: str) -> str: + match = re.fullmatch( + r"\s*```(?:markdown)?\s*(.*?)\s*```\s*", content, flags=re.DOTALL | re.IGNORECASE + ) + return match.group(1).strip() if match else content.strip() + + +def _document_outline(document_plan: DocumentPlan | None) -> str: + if not document_plan: + return "" + lines: list[str] = [] + for section in document_plan.outline: + indent = " " * max(0, section.level - 2) + page_range = ( + f"pages {section.page_start}-{section.page_end}" + if section.page_start != section.page_end + else f"page {section.page_start}" + ) + lines.append(f"{indent}- {section.title} ({page_range}): {section.summary}") + return "\n".join(lines) + + +def _language_name(language: str) -> str: + if language == NoteLanguage.ZH.value: + return "Chinese" + if language == NoteLanguage.EN.value: + return "English" + return language + + +def _style_instruction(style_level: ExplanationStyleLevel, language: str) -> str: + if language == NoteLanguage.ZH.value: + if style_level == ExplanationStyleLevel.LOW: + return ( + "Low 只控制怎么讲:科普式讲解,强调直观、易懂、低门槛,减少术语和公式负担。" + "不要减少本节按 depth 要覆盖的核心内容。" + ) + if style_level == ExplanationStyleLevel.HIGH: + return ( + "High 只控制怎么讲:学术讲义风格,定义更精确,边界更清楚,逻辑链更严格," + 
"强调机制、论证链和术语精度。理工/数学/计算机可保留关键公式、推导、矩阵、定理或算法机制;" + "生物/医学保留机制链路、因果过程和术语定义;社科/人文保留概念辨析、理论框架和论证结构。" + "High 的本质是 rigor,不是强行造公式。" + ) + return ( + "Medium 只控制怎么讲:标准课堂讲义风格,兼顾清晰度、完整性和一定理论性," + "不要改变 depth 决定的覆盖范围。" + ) + + if style_level == ExplanationStyleLevel.LOW: + return ( + "Low controls how to explain: popular-science style, intuitive, approachable, and low-friction, " + "with less terminology and formula burden. Do not reduce the content coverage selected by depth." + ) + if style_level == ExplanationStyleLevel.HIGH: + return ( + "High controls how to explain: academic lecture-note style with precise definitions, clear concept " + "boundaries, strict logic, mechanisms, argument chains, and terminology precision. For STEM, math, " + "CS, or engineering, preserve key formulas, derivations, matrices, theorems, or algorithm mechanisms " + "when supported. For biology or medicine, preserve mechanism chains, causal processes, and definitions. " + "For social sciences or humanities, preserve conceptual distinctions, theoretical frameworks, and " + "argument structure. High means rigor; do not invent formulas." + ) + return ( + "Medium controls how to explain: standard classroom handout style, balancing clarity, completeness, " + "and moderate theoretical density without changing the depth coverage." + ) + + +def _depth_label(level: DifficultyLevel) -> str: + return { + DifficultyLevel.SIMPLE: "Simple", + DifficultyLevel.MEDIUM: "Medium", + DifficultyLevel.DETAILED: "Detailed", + }[level] + + +def _style_label(style_level: ExplanationStyleLevel) -> str: + return { + ExplanationStyleLevel.LOW: "Low", + ExplanationStyleLevel.MEDIUM: "Medium", + ExplanationStyleLevel.HIGH: "High", + }[style_level] + + +def _transition_excerpt(markdown: str, limit: int = 800) -> str: + excerpt = markdown.strip() + if len(excerpt) <= limit: + return excerpt + return f"{excerpt[:limit].rstrip()}..." 
+ + +def _clean_transition_markdown(content: str) -> str: + cleaned = normalize_structure_note_markdown(_strip_markdown_fence(content)) + lines = [line.strip() for line in cleaned.splitlines() if line.strip()] + normalized_lines: list[str] = [] + for line in lines: + line = re.sub(r"^(?:>\s*)+", "", line).strip() + line = re.sub(r"^(?:[-*+]|\d+[.)])\s+", "", line).strip() + if line: + normalized_lines.append(line) + return " ".join(normalized_lines).strip() + + +def _transition_style_instruction(style_level: ExplanationStyleLevel) -> str: + if style_level == ExplanationStyleLevel.LOW: + return "LOW: intuitive, simple explanation" + if style_level == ExplanationStyleLevel.HIGH: + return "HIGH: emphasize logical necessity, limitation, or theoretical gap" + return "MEDIUM: standard lecture explanation (default)" + + +def _minimal_transition_fallback(previous: GenerationChunk, current: GenerationChunk) -> str: + return f"{previous.section_title} leads naturally to {current.section_title}." + + +async def generate_transition_markdown( + previous: GenerationChunk, + current: GenerationChunk, + *, + language: str, + style_level: ExplanationStyleLevel, + document_plan: DocumentPlan | None = None, +) -> str: + outline = _document_outline(document_plan) + prompt = ( + "Write a short transition paragraph for a lecture-style note.\n\n" + "Goal:\n" + "Connect the previous section to the current section in a natural, knowledge-driven way.\n\n" + "Requirements:\n" + "- 1-3 sentences ONLY\n" + "- Do NOT use template phrases like:\n" + ' "上一部分...", "接下来...", "本节将..."\n' + "- Do NOT mention slides or pages\n" + "- Explain the logical bridge:\n" + " 1. what the previous section established\n" + " 2. what is still missing or limited\n" + " 3. 
why the current section naturally follows\n" + "- Write like a human lecture note, not a system connector\n" + "- No bullet points\n" + "- Output plain Markdown paragraph only\n\n" + "Style:\n" + "- LOW: intuitive, simple explanation\n" + "- MEDIUM: standard lecture explanation (default)\n" + "- HIGH: emphasize logical necessity, limitation, or theoretical gap\n" + f"Selected style: {_transition_style_instruction(style_level)}\n\n" + f"Language:\n{_language_name(language)}\n\n" + f"Document Outline:\n{outline or '(not provided)'}\n\n" + "Previous Section:\n" + f"Title: {previous.section_title}\n" + f"Summary: {previous.section_summary}\n" + f"Excerpt: {_transition_excerpt(previous.markdown)}\n\n" + "Current Section:\n" + f"Title: {current.section_title}\n" + f"Summary: {current.section_summary}\n" + f"Excerpt: {_transition_excerpt(current.markdown)}\n" + ) + try: + response = await llm_complete( + prompt=prompt, + system_prompt=( + "You write concise connective paragraphs for online lecture notes. " + "Use the given section excerpts to explain the knowledge flow without using a fixed template." 
+ ), + temperature=0.45, + ) + cleaned = _clean_transition_markdown(response) + return cleaned or _minimal_transition_fallback(previous, current) + except Exception: + return _minimal_transition_fallback(previous, current) + + +def _combination_instruction( + depth_level: DifficultyLevel, + style_level: ExplanationStyleLevel, + language: str, +) -> str: + if language == NoteLanguage.ZH.value: + matrix = { + (DifficultyLevel.SIMPLE, ExplanationStyleLevel.LOW): ( + "Simple + Low:短篇幅、低门槛、科普化。只讲最核心内容,用直觉化表达帮助快速入门。" + ), + (DifficultyLevel.SIMPLE, ExplanationStyleLevel.MEDIUM): ( + "Simple + Medium:短篇幅、标准课堂风格。只保留核心知识骨架,但表述清晰、正常、不泛化。" + ), + (DifficultyLevel.SIMPLE, ExplanationStyleLevel.HIGH): ( + "Simple + High:短篇幅、高密度、学术型核心讲义。只讲最重要内容,但保留严谨定义、关键机制、" + "关键公式或关键论证的作用说明。这是 short but dense,不是 short and shallow。" + ), + (DifficultyLevel.MEDIUM, ExplanationStyleLevel.LOW): ( + "Medium + Low:中等篇幅、科普风格。覆盖主要知识点,但仍以直观解释为主,减少抽象负担。" + ), + (DifficultyLevel.MEDIUM, ExplanationStyleLevel.MEDIUM): ( + "Medium + Medium:中等篇幅、标准课堂讲义。作为默认模式,兼顾覆盖面、逻辑和可读性。" + ), + (DifficultyLevel.MEDIUM, ExplanationStyleLevel.HIGH): ( + "Medium + High:中等篇幅、学术课堂风格。覆盖主要知识点,同时保留较强理论解释和关键数学、机制或论证说明。" + ), + (DifficultyLevel.DETAILED, ExplanationStyleLevel.LOW): ( + "Detailed + Low:长篇幅、低门槛。讲得更全、更慢、更细,但仍以易懂为优先,不强行学术化。" + ), + (DifficultyLevel.DETAILED, ExplanationStyleLevel.MEDIUM): ( + "Detailed + Medium:长篇幅、完整课堂讲义。比较全面,适合复习和系统整理。" + ), + (DifficultyLevel.DETAILED, ExplanationStyleLevel.HIGH): ( + "Detailed + High:长篇幅、学术讲义/课程笔记风格。完整覆盖,强理论解释,并保留材料支持的必要推导、公式或严谨论证。" + ), + } + return matrix[(depth_level, style_level)] + + matrix = { + (DifficultyLevel.SIMPLE, ExplanationStyleLevel.LOW): ( + "Simple + Low: short, low-barrier, popular-science explanation. Cover only the core ideas " + "and use intuitive language for fast entry-level understanding." + ), + (DifficultyLevel.SIMPLE, ExplanationStyleLevel.MEDIUM): ( + "Simple + Medium: short standard classroom note. 
Keep the core knowledge skeleton, but explain it clearly " + "without flattening it into a vague summary." + ), + (DifficultyLevel.SIMPLE, ExplanationStyleLevel.HIGH): ( + "Simple + High: short, dense, academic core note. Cover only the most important material while preserving " + "precise definitions, key mechanisms, and the role of any essential formula or argument. This is short " + "but dense, not short and shallow." + ), + (DifficultyLevel.MEDIUM, ExplanationStyleLevel.LOW): ( + "Medium + Low: medium length, popular-science style. Cover the main knowledge points with intuitive " + "explanations and a lighter abstraction burden." + ), + (DifficultyLevel.MEDIUM, ExplanationStyleLevel.MEDIUM): ( + "Medium + Medium: medium length standard classroom note. This is the default balance of coverage, " + "logic, and readability." + ), + (DifficultyLevel.MEDIUM, ExplanationStyleLevel.HIGH): ( + "Medium + High: medium length academic classroom note. Cover the main knowledge points while preserving " + "stronger theoretical explanation and key mathematical, mechanistic, or argumentative structure." + ), + (DifficultyLevel.DETAILED, ExplanationStyleLevel.LOW): ( + "Detailed + Low: long, low-barrier explanation. Cover more material slowly and carefully while keeping " + "accessibility ahead of academic density." + ), + (DifficultyLevel.DETAILED, ExplanationStyleLevel.MEDIUM): ( + "Detailed + Medium: long, complete classroom note for review and systematic organization." + ), + (DifficultyLevel.DETAILED, ExplanationStyleLevel.HIGH): ( + "Detailed + High: long academic lecture note. Complete coverage with strong theoretical explanation and " + "source-supported derivations, formulas, or rigorous arguments when appropriate." 
+ ), + } + return matrix[(depth_level, style_level)] + + +def _prompt_contract( + preset: DifficultyPreset, + style_level: ExplanationStyleLevel, + language: str, +) -> str: + if language == NoteLanguage.ZH.value: + return ( + "Parameter contract:\n" + f"- Explanation Depth = {_depth_label(preset.level)},只控制“讲多少”:{preset.depth_instruction}\n" + f"- Lecture Style Level = {_style_label(style_level)},只控制“怎么讲”:{_style_instruction(style_level, language)}\n" + f"- 组合语义:{_combination_instruction(preset.level, style_level, language)}\n" + "Compression policy:\n" + f"- {preset.compression_instruction}\n" + "- 优先删除:模板过渡、重复背景、空泛总结、“这一部分讲什么”的元描述、低信息量套话。\n" + "- 优先保留:核心概念、关键机制、关键公式或关键论证、关键推导桥梁句、方法之间为什么衔接的逻辑。\n" + ) + + return ( + "Parameter contract:\n" + f"- Explanation Depth = {_depth_label(preset.level)} controls only how much to cover: {preset.depth_instruction}\n" + f"- Lecture Style Level = {_style_label(style_level)} controls only how to explain: {_style_instruction(style_level, language)}\n" + f"- Combination meaning: {_combination_instruction(preset.level, style_level, language)}\n" + "Compression policy:\n" + f"- {preset.compression_instruction}\n" + "- Delete first: template transitions, repeated background, vague summaries, meta descriptions of what the section covers, and low-information filler.\n" + "- Preserve first: core concepts, key mechanisms, essential formulas or arguments, derivation bridge sentences, and the logic explaining why methods or ideas connect.\n" + ) + + +async def generate_chunk_markdown( + chunk: GenerationChunk, + pages: list[PageIndexPage], + preset: DifficultyPreset, + language: str = "en", + style_level: ExplanationStyleLevel = ExplanationStyleLevel.MEDIUM, + document_plan: DocumentPlan | None = None, +) -> str: + page_lookup = _pages_by_number(pages) + context = _build_page_context(page_lookup, chunk.page_numbers, chunk.evidence) + if not context.strip(): + return _fallback_markdown(chunk, page_lookup, language) + + heading = "#" * 
max(2, min(chunk.heading_level, 5)) + prompt = ( + f"Write one Markdown-first study-note section in {_language_name(language)}.\n" + f"The final note content itself must be in {_language_name(language)}; this is independent of UI language.\n" + "Return Markdown only. Write a real online lecture note section, not a page digest, slide script, " + "summary expansion, or fixed template.\n" + f"Section path: {' > '.join(chunk.section_path)}\n" + f"Page range: {chunk.page_start}-{chunk.page_end}\n" + f"Section summary: {chunk.section_summary}\n" + f"Required heading: {heading} {' / '.join(chunk.section_path)}\n" + f"{_prompt_contract(preset, style_level, language)}\n" + f"Document outline:\n{_document_outline(document_plan)}\n\n" + "Requirements:\n" + f"- Start exactly with the required Markdown heading.\n" + "- Organize by the knowledge thread of this section: what problem/concept is being explained, what mechanism or argument makes it work, and why the ideas connect.\n" + "- Do not average-compress every page. Select evidence according to the depth/style contract above.\n" + '- Do not write page-by-page explanations, presentation speech, or template phrases such as "this section introduces".\n' + "- Use natural explanatory paragraphs as the main body. Lists, tables, and callouts are supporting material only.\n" + "- Use ### subheadings only when they reflect real conceptual turns, not a fixed Definition/Example/Summary template.\n" + "- When a formula, theorem, algorithm, mechanism, causal chain, or argument is essential, explain the problem it solves, why it is introduced, and what role it plays in the method.\n" + "- For formulas or algorithmic updates, do not merely quote the expression. 
When the evidence supports it, derive it step by step from the preceding definition, objective, constraint, or mechanism; otherwise explain the missing derivation assumption clearly.\n" + "- For algorithms, identify the input/state/objective/update, why each update is shaped that way, and how the update reduces the original problem.\n" + "- For mechanisms, explain the chain from condition to process to consequence, including the point where the mechanism changes the outcome.\n" + "- For High style, increase rigor through precise definitions, boundaries, mechanisms, and argument quality; do not force formulas for non-mathematical material.\n" + "- Use numbered lists for algorithms, procedures, or causal sequences." + "- End with a short section summary callout that states the knowledge takeaway, not a generic recap.\n" + "- Markdown math contract: inline math must use `$...$`; display math and multi-step derivations must use `$$...$$` on their own lines.\n" + "- Never use unsupported wrappers such as `\\(...\\)` or `\\[...\\]`, and never mix wrappers like `$$\\(...\\)$$`.\n" + "- For function names, API names, code-like expressions, or pseudocode in prose, use backticks such as `f(x)` or `softmax(x)`, not math delimiters.\n" + "- Keep grounding traceable by mentioning source page ranges only when it clarifies evidence.\n\n" + "- Use bold sparingly for key concepts, mechanism names, theorem names, algorithm names, and likely confusion points. Do not overuse bold. Prefer 1–3 bold phrases per paragraph and never bold full sentences." + "- When appropriate, briefly point out one common misunderstanding, confusion, or misuse of the concept, and clarify it directly." + f"Section-grounded evidence:\n{context}" + ) + + try: + response = await llm_complete( + prompt=prompt, + system_prompt=( + "You turn a PageIndex-style section plan and page evidence into coherent online lecture notes. " + "You never produce slide narration or page-by-page commentary." 
+ ), + temperature=0.35, + ) + cleaned = normalize_structure_note_markdown(_strip_markdown_fence(response)) + return cleaned if cleaned else _fallback_markdown(chunk, page_lookup, language) + except Exception: + return _fallback_markdown(chunk, page_lookup, language) + + +def inject_image_placeholders( + chunks: list[GenerationChunk], + pages: list[PageIndexPage], + purpose: str, +) -> list[GenerationChunk]: + page_lookup = _pages_by_number(pages) + for chunk in chunks: + image_pages = [ + page_number + for page_number in chunk.page_numbers + if page_lookup.get(page_number) and page_lookup[page_number].image_candidates + ] + if not image_pages: + continue + page_hint = image_pages[0] + placeholder_id = f"{chunk.chunk_id}-image-1" + token = f"[[IMAGE_PLACEHOLDER:{placeholder_id}:{page_hint}:{purpose}]]" + if token not in chunk.markdown: + chunk.markdown = f"{chunk.markdown.rstrip()}\n\n{token}\n" + chunk.placeholder_ids.append(placeholder_id) + return chunks diff --git a/deeptutor/services/structure_note/image_pipeline.py b/deeptutor/services/structure_note/image_pipeline.py new file mode 100644 index 000000000..6c2532087 --- /dev/null +++ b/deeptutor/services/structure_note/image_pipeline.py @@ -0,0 +1,132 @@ +from __future__ import annotations + +from pathlib import Path +import re + +from .models import CitationEntry, GenerationChunk, ImagePlaceholder, PageIndexPage + +_PLACEHOLDER_RE = re.compile( + r"\[\[IMAGE_PLACEHOLDER:(?P[^:\]]+):(?P\d+):(?P[^\]]+)\]\]" +) + + +def _pages_map(pages: list[PageIndexPage]) -> dict[int, PageIndexPage]: + return {page.page_number: page for page in pages} + + +def _figure_caption(chunk: GenerationChunk, page_number: int | None, language: str) -> str: + topic = (chunk.section_summary or chunk.section_title).strip() + if len(topic) > 120: + topic = f"{topic[:120].rstrip()}..." 
+ if language == "zh": + source = f"第 {page_number} 页" if page_number else "对应页" + return ( + f"图示来源:{source}。该图对应本节“{chunk.section_title}”的核心内容:" + f"{topic or '结构、过程或关键例子'}" + ) + source = f"page {page_number}" if page_number else "the source page" + return ( + f"Figure from {source}. It supports the explanation of {chunk.section_title} by showing " + f"{topic or 'the structure, process, or key example'} discussed in the section." + ) + + +def _render_page_crop( + pdf_path: Path, page_number: int, output_path: Path, clip: list[float] | None = None +) -> None: + import fitz + + document = fitz.open(pdf_path) + try: + page = document[page_number - 1] + rect = fitz.Rect(clip) if clip else page.rect + pix = page.get_pixmap(matrix=fitz.Matrix(2, 2), clip=rect, alpha=False) + pix.save(output_path) + finally: + document.close() + + +def process_images( + chunks: list[GenerationChunk], + pages: list[PageIndexPage], + pdf_path: Path, + images_dir: Path, + source_file: str, + language: str = "en", +) -> tuple[list[GenerationChunk], list[ImagePlaceholder], list[CitationEntry]]: + images_dir.mkdir(parents=True, exist_ok=True) + page_lookup = _pages_map(pages) + placeholders: list[ImagePlaceholder] = [] + citations: list[CitationEntry] = [] + + for chunk in chunks: + if not chunk.placeholder_ids: + continue + + def replace(match: re.Match[str]) -> str: + placeholder_id = match.group("placeholder_id") + page_hint = int(match.group("page_hint")) + purpose = match.group("purpose") + candidates = [] + for page_number in chunk.page_numbers: + page = page_lookup.get(page_number) + if not page: + continue + candidates.extend(page.image_candidates) + + placeholder = ImagePlaceholder( + placeholder_id=placeholder_id, + chunk_id=chunk.chunk_id, + page_hint=page_hint, + purpose=purpose, + ) + + image_name = f"{placeholder_id}.png" + image_path = images_dir / image_name + markdown_image_path = f"images/{image_name}" + + try: + if len(candidates) == 1: + candidate = candidates[0] + 
_render_page_crop(pdf_path, candidate.page_number, image_path, candidate.bbox) + placeholder.status = "filled" + placeholder.image_path = markdown_image_path + placeholder.resolved_page = candidate.page_number + placeholder.resolved_region = candidate.bbox + else: + fallback_page = page_hint if page_hint in page_lookup else chunk.page_start + _render_page_crop(pdf_path, fallback_page, image_path, None) + placeholder.status = "fallback_page" + placeholder.image_path = markdown_image_path + placeholder.resolved_page = fallback_page + placeholder.resolved_region = None + + placeholders.append(placeholder) + citations.append( + CitationEntry( + citation_id=f"cite-{placeholder_id}", + section_path=chunk.section_path, + page_start=chunk.page_start, + page_end=chunk.page_end, + source_file=source_file, + source_kind="image", + image_page=placeholder.resolved_page, + image_region=placeholder.resolved_region, + excerpt=purpose, + ) + ) + caption = _figure_caption(chunk, placeholder.resolved_page, language) + return f"![{purpose}]({markdown_image_path})\n\n*{caption}*" + except Exception as exc: + placeholder.status = "fallback_text" + placeholder.error = str(exc) + placeholders.append(placeholder) + return ( + "> Figure reference unavailable for this page range." 
+ if language != "zh" + else "> 当前页范围的图片引用暂不可用。" + ) + + chunk.markdown = _PLACEHOLDER_RE.sub(replace, chunk.markdown) + + return chunks, placeholders, citations diff --git a/deeptutor/services/structure_note/manager.py b/deeptutor/services/structure_note/manager.py new file mode 100644 index 000000000..b4cd9bc8c --- /dev/null +++ b/deeptutor/services/structure_note/manager.py @@ -0,0 +1,592 @@ +from __future__ import annotations + +from datetime import datetime +from pathlib import Path +from typing import Any, Literal +import uuid + +from deeptutor.logging import get_logger + +from .difficulty import get_difficulty_preset +from .generator import ( + build_generation_chunks, + generate_chunk_markdown, + generate_transition_markdown, + inject_image_placeholders, +) +from .image_pipeline import process_images +from .markdown_postprocessor import normalize_structure_note_markdown +from .models import ( + CitationEntry, + DifficultyLevel, + DocumentPlan, + ExplanationStyleLevel, + GenerationChunk, + JobStatus, + NoteLanguage, + PageIndexPage, + SectionTreeNode, + StructureNoteArtifact, + StructureNoteProject, +) +from .normalizer import normalize_to_pdf +from .page_index import build_page_index +from .planner import build_document_plan +from .renderer import render_pdf +from .storage import StructureNoteStorage +from .tree_builder import build_section_tree + + +class StructureNoteManager: + def __init__(self, storage: StructureNoteStorage | None = None): + self.storage = storage or StructureNoteStorage() + self.logger = get_logger("StructureNote") + + def _normalize_project_name(self, project_name: str | None) -> str: + normalized = (project_name or "").strip() + if not normalized: + raise ValueError("Project name is required.") + if "/" in normalized or "\\" in normalized: + raise ValueError("Project name cannot contain path separators.") + return normalized + + def _artifact_project_name(self, artifact: StructureNoteArtifact) -> str: + return artifact.project_name 
or artifact.source_ref.get("kb_name") or "Local Uploads" + + def list_projects(self) -> list[StructureNoteProject]: + projects_by_name: dict[str, StructureNoteProject] = { + self._normalize_project_name(project.name): project + for project in self.storage.read_projects() + } + for artifact in self.list_jobs(): + project_name = self._artifact_project_name(artifact) + existing = projects_by_name.get(project_name) + if existing is None: + projects_by_name[project_name] = StructureNoteProject( + name=project_name, + created_at=artifact.created_at, + updated_at=artifact.updated_at, + ) + elif artifact.updated_at > existing.updated_at: + existing.updated_at = artifact.updated_at + return sorted(projects_by_name.values(), key=lambda item: item.name.lower()) + + def create_project(self, project_name: str) -> StructureNoteProject: + name = self._normalize_project_name(project_name) + projects = {project.name: project for project in self.list_projects()} + if name in projects: + raise ValueError(f"Project already exists: {name}") + timestamp = self.storage.new_timestamp() + project = StructureNoteProject(name=name, created_at=timestamp, updated_at=timestamp) + projects[name] = project + self.storage.write_projects(sorted(projects.values(), key=lambda item: item.name.lower())) + return project + + def ensure_project(self, project_name: str) -> StructureNoteProject: + name = self._normalize_project_name(project_name) + for project in self.list_projects(): + if project.name == name: + return project + return self.create_project(name) + + def rename_project(self, old_name: str, new_name: str) -> StructureNoteProject: + old_project_name = self._normalize_project_name(old_name) + new_project_name = self._normalize_project_name(new_name) + if old_project_name == new_project_name: + self.ensure_project(new_project_name) + return next( + project for project in self.list_projects() if project.name == new_project_name + ) + + projects = {project.name: project for project in 
self.list_projects()} + if old_project_name not in projects: + raise FileNotFoundError(f"Project not found: {old_project_name}") + if new_project_name in projects: + raise ValueError(f"Project already exists: {new_project_name}") + + renamed = projects.pop(old_project_name) + renamed.name = new_project_name + renamed.updated_at = self.storage.new_timestamp() + projects[new_project_name] = renamed + + for artifact in self.list_jobs(): + if self._artifact_project_name(artifact) != old_project_name: + continue + artifact.project_name = new_project_name + self.storage.touch_updated_at(artifact) + self.storage.write_artifact(artifact) + + self.storage.write_projects(sorted(projects.values(), key=lambda item: item.name.lower())) + return renamed + + def delete_project(self, project_name: str) -> list[str]: + name = self._normalize_project_name(project_name) + projects = {project.name: project for project in self.list_projects()} + if name not in projects: + raise FileNotFoundError(f"Project not found: {name}") + + deleted_job_ids: list[str] = [] + for artifact in self.list_jobs(): + if self._artifact_project_name(artifact) != name: + continue + deleted_job_ids.append(artifact.job_id) + self.storage.delete_job_dir(artifact.job_id) + + projects.pop(name, None) + self.storage.write_projects(sorted(projects.values(), key=lambda item: item.name.lower())) + return deleted_job_ids + + def create_job( + self, + file_name: str, + source_format: str, + difficulty_level: DifficultyLevel, + note_language: NoteLanguage, + style_level: ExplanationStyleLevel, + source_path: Path, + task_id: str, + job_id: str | None = None, + project_name: str | None = None, + note_title: str | None = None, + source_kind: Literal["upload", "knowledge_base"] = "upload", + source_ref: dict[str, str] | None = None, + ) -> StructureNoteArtifact: + job_id = job_id or ( + f"structure_note_{datetime.utcnow().strftime('%Y%m%d_%H%M%S')}_{uuid.uuid4().hex[:8]}" + ) + self.storage.ensure_job_dirs(job_id) + 
inferred_title = Path(file_name).stem or file_name + if project_name: + project_name = self.ensure_project(project_name).name + artifact = StructureNoteArtifact( + job_id=job_id, + file_name=file_name, + source_format=source_format, + difficulty_level=difficulty_level, + note_language=note_language, + style_level=style_level, + project_name=project_name, + note_title=note_title or inferred_title, + source_kind=source_kind, + source_ref=source_ref or {}, + status=JobStatus.QUEUED, + source_path=str(source_path), + task_id=task_id, + retry_state=None, + error=None, + created_at=self.storage.new_timestamp(), + updated_at=self.storage.new_timestamp(), + ) + return self.storage.write_artifact(artifact) + + def list_jobs(self) -> list[StructureNoteArtifact]: + return self.storage.list_artifacts() + + def get_job(self, job_id: str) -> StructureNoteArtifact: + return self.storage.read_artifact(job_id) + + def update_status( + self, + artifact: StructureNoteArtifact, + status: JobStatus, + *, + error: str | None = None, + retry_state: str | None = None, + task_id: str | None = None, + ) -> StructureNoteArtifact: + artifact.status = status + artifact.error = error + artifact.retry_state = retry_state + if task_id is not None: + artifact.task_id = task_id + self.storage.touch_updated_at(artifact) + return self.storage.write_artifact(artifact) + + def serialize_job(self, artifact: StructureNoteArtifact) -> dict[str, Any]: + citations: list[dict[str, Any]] = [] + if artifact.citation_manifest_path and Path(artifact.citation_manifest_path).exists(): + citations = self.storage.read_json(Path(artifact.citation_manifest_path)) + section_tree = self._load_section_tree_payload(artifact.section_tree_path) + return { + "job_id": artifact.job_id, + "file_name": artifact.file_name, + "status": artifact.status.value, + "source_format": artifact.source_format, + "difficulty_level": artifact.difficulty_level.value, + "note_language": artifact.note_language.value, + "style_level": 
artifact.style_level.value, + "project_name": artifact.project_name, + "note_title": artifact.note_title, + "source_kind": artifact.source_kind, + "source_ref": artifact.source_ref, + "final_pdf_url": self.storage.output_url_for(artifact.final_pdf_path), + "rendered_markdown_url": self.storage.output_url_for(artifact.rendered_markdown_path), + "asset_base_url": self.storage.output_url_for( + self.storage.get_job_dir(artifact.job_id) + ), + "sections": section_tree, + "citations": citations, + "retry_available": artifact.status == JobStatus.FAILED, + "error": artifact.error, + "task_id": artifact.task_id, + "created_at": artifact.created_at, + "updated_at": artifact.updated_at, + } + + async def run_job(self, job_id: str, task_id: str, emit_log) -> StructureNoteArtifact: + artifact = self.get_job(job_id) + artifact = self.update_status(artifact, JobStatus.QUEUED, error=None, task_id=task_id) + job_dirs = self.storage.ensure_job_dirs(job_id) + language = artifact.note_language.value + preset = get_difficulty_preset(artifact.difficulty_level) + style_level = artifact.style_level + + try: + emit_log(task_id, "Preparing Structure Note job.") + + normalized_pdf_path = job_dirs["normalized"] / "normalized.pdf" + artifact = self.update_status( + artifact, JobStatus.NORMALIZING, retry_state=JobStatus.NORMALIZING.value + ) + if artifact.normalized_pdf_path and Path(artifact.normalized_pdf_path).exists(): + normalized_pdf_path = Path(artifact.normalized_pdf_path) + emit_log(task_id, "Reusing normalized PDF.") + else: + emit_log(task_id, "Normalizing source file to PDF.") + normalized_pdf_path = normalize_to_pdf( + Path(artifact.source_path), job_dirs["normalized"] + ) + artifact.normalized_pdf_path = str(normalized_pdf_path) + self.storage.write_artifact(artifact) + + page_index_path = job_dirs["index"] / "page_index.json" + artifact = self.update_status( + artifact, JobStatus.INDEXING, retry_state=JobStatus.INDEXING.value + ) + if artifact.page_index_path and 
Path(artifact.page_index_path).exists(): + emit_log(task_id, "Reusing existing page index.") + page_index = [ + PageIndexPage.model_validate(item) + for item in self.storage.read_json(Path(artifact.page_index_path)) + ] + else: + emit_log(task_id, "Building page-level index.") + page_index = build_page_index(normalized_pdf_path) + artifact.page_index_path = str( + self.storage.write_json( + page_index_path, + [page.model_dump(mode="json") for page in page_index], + ) + ) + self.storage.write_artifact(artifact) + + section_tree_path = job_dirs["index"] / "section_tree.json" + artifact = self.update_status( + artifact, JobStatus.PLANNING, retry_state=JobStatus.PLANNING.value + ) + if artifact.section_tree_path and Path(artifact.section_tree_path).exists(): + emit_log(task_id, "Reusing section tree.") + section_tree = [ + SectionTreeNode.model_validate(item) + for item in self.storage.read_json(Path(artifact.section_tree_path)) + ] + else: + emit_log(task_id, "Deriving section tree.") + section_tree = await build_section_tree( + page_index, preset.page_window, language=language + ) + artifact.section_tree_path = str( + self.storage.write_json( + section_tree_path, + [node.model_dump(mode="json") for node in section_tree], + ) + ) + self.storage.write_artifact(artifact) + + document_plan_path = job_dirs["index"] / "document_plan.json" + if artifact.document_plan_path and Path(artifact.document_plan_path).exists(): + emit_log(task_id, "Reusing document-level plan.") + document_plan = DocumentPlan.model_validate( + self.storage.read_json(Path(artifact.document_plan_path)) + ) + else: + emit_log(task_id, "Building document-level section plan.") + document_plan = build_document_plan( + page_index, + section_tree, + document_title=artifact.file_name, + language=language, + ) + artifact.document_plan_path = str( + self.storage.write_json( + document_plan_path, + document_plan.model_dump(mode="json"), + ) + ) + self.storage.write_artifact(artifact) + + chunks_path = 
job_dirs["chunks"] / "generation_chunks.json" + artifact = self.update_status( + artifact, JobStatus.GENERATING, retry_state=JobStatus.GENERATING.value + ) + if artifact.generation_chunks_path and Path(artifact.generation_chunks_path).exists(): + emit_log(task_id, "Reusing generated chunks.") + chunks = [ + GenerationChunk.model_validate(item) + for item in self.storage.read_json(Path(artifact.generation_chunks_path)) + ] + else: + emit_log(task_id, "Generating section-level Markdown notes.") + chunks = build_generation_chunks( + page_index, + section_tree, + preset, + document_plan=document_plan, + ) + for chunk in chunks: + chunk.markdown = await generate_chunk_markdown( + chunk, + page_index, + preset, + language=language, + style_level=style_level, + document_plan=document_plan, + ) + chunks = inject_image_placeholders(chunks, page_index, preset.placeholder_purpose) + artifact.generation_chunks_path = str( + self.storage.write_json( + chunks_path, + [chunk.model_dump(mode="json") for chunk in chunks], + ) + ) + self.storage.write_artifact(artifact) + + image_state_path = job_dirs["chunks"] / "image_fill_state.json" + artifact = self.update_status( + artifact, + JobStatus.PROCESSING_IMAGES, + retry_state=JobStatus.PROCESSING_IMAGES.value, + ) + if artifact.rendered_markdown_path and Path(artifact.rendered_markdown_path).exists(): + emit_log(task_id, "Reusing rendered markdown after image processing.") + rendered_path = Path(artifact.rendered_markdown_path) + markdown_text = normalize_structure_note_markdown( + rendered_path.read_text(encoding="utf-8") + ) + rendered_path.write_text(markdown_text, encoding="utf-8") + image_citations = self._load_image_citations(artifact.image_fill_state_path) + else: + emit_log(task_id, "Resolving figure placeholders.") + chunks, placeholders, image_citations = process_images( + chunks, + page_index, + normalized_pdf_path, + job_dirs["images"], + artifact.file_name, + language=language, + ) + self.storage.write_json( + 
chunks_path, + [chunk.model_dump(mode="json") for chunk in chunks], + ) + artifact.image_fill_state_path = str( + self.storage.write_json( + image_state_path, + { + "placeholders": [item.model_dump(mode="json") for item in placeholders], + "image_citations": [ + item.model_dump(mode="json") for item in image_citations + ], + }, + ) + ) + transition_map = await self._build_transition_map( + chunks, + language=language, + style_level=style_level, + document_plan=document_plan, + ) + markdown_text = normalize_structure_note_markdown( + self._compose_markdown( + artifact, + chunks, + language, + transition_map=transition_map, + ) + ) + artifact.rendered_markdown_path = str( + self.storage.write_text(job_dirs["final"] / "rendered.md", markdown_text) + ) + self.storage.write_artifact(artifact) + + artifact = self.update_status( + artifact, JobStatus.RENDERING, retry_state=JobStatus.RENDERING.value + ) + citations = self._build_text_citations(chunks, artifact.file_name) + citations.extend(image_citations) + emit_log(task_id, "Rendering final PDF.") + final_pdf_path, citation_path = render_pdf( + markdown_text, + title=artifact.file_name, + citation_entries=citations, + job_dir=job_dirs["job"], + final_dir=job_dirs["final"], + ) + artifact.final_pdf_path = str(final_pdf_path) + artifact.citation_manifest_path = str(citation_path) + artifact = self.update_status( + artifact, JobStatus.READY, retry_state=JobStatus.READY.value + ) + self.storage.apply_retention_policy(artifact) + emit_log(task_id, "Structure Note is ready.") + return artifact + except Exception as exc: + self.logger.error(f"Structure Note job failed: {exc}", exc_info=True) + emit_log(task_id, f"Structure Note failed: {exc}") + return self.update_status( + artifact, + JobStatus.FAILED, + error=str(exc), + retry_state=artifact.status.value, + ) + + def _compose_markdown( + self, + artifact: StructureNoteArtifact, + chunks: list[GenerationChunk], + language: str, + *, + transition_map: dict[str, str] | None = 
None, + ) -> str: + heading = self._compose_markdown_heading(artifact, chunks, language) + sections: list[str] = [] + previous_major: GenerationChunk | None = None + for chunk in chunks: + if not chunk.markdown.strip(): + continue + if chunk.heading_level <= 2: + if previous_major is not None: + transition = (transition_map or {}).get(chunk.section_id or chunk.chunk_id, "") + if transition.strip(): + sections.append(transition.strip()) + previous_major = chunk + sections.append( + f'\n\n{chunk.markdown.strip()}' + ) + return f"{heading}\n\n" + "\n\n".join(sections) + + async def _build_transition_map( + self, + chunks: list[GenerationChunk], + *, + language: str, + style_level: ExplanationStyleLevel, + document_plan: DocumentPlan | None, + ) -> dict[str, str]: + transition_map: dict[str, str] = {} + previous_major: GenerationChunk | None = None + for chunk in chunks: + if not chunk.markdown.strip() or chunk.heading_level > 2: + continue + if previous_major is not None: + key = chunk.section_id or chunk.chunk_id + transition_map[key] = await generate_transition_markdown( + previous_major, + chunk, + language=language, + style_level=style_level, + document_plan=document_plan, + ) + previous_major = chunk + return transition_map + + def _compose_markdown_heading( + self, + artifact: StructureNoteArtifact, + chunks: list[GenerationChunk], + language: str, + ) -> str: + if language == "zh": + lines = [ + f"# {artifact.file_name}", + "", + f"> 结构化讲义。难度:`{artifact.difficulty_level.value}`。", + "", + "## 讲义目录", + ] + for chunk in chunks: + page_range = ( + f"第 {chunk.page_start}-{chunk.page_end} 页" + if chunk.page_start != chunk.page_end + else f"第 {chunk.page_start} 页" + ) + indent = " " * max(0, chunk.heading_level - 2) + lines.append(f"{indent}- {chunk.section_title}({page_range})") + lines.append("") + return "\n".join(lines) + + lines = [ + f"# {artifact.file_name}", + "", + f"> Structured lecture note. 
Difficulty: `{artifact.difficulty_level.value}`.", + "", + "## Lecture Outline", + ] + for chunk in chunks: + page_range = ( + f"pages {chunk.page_start}-{chunk.page_end}" + if chunk.page_start != chunk.page_end + else f"page {chunk.page_start}" + ) + indent = " " * max(0, chunk.heading_level - 2) + lines.append(f"{indent}- {chunk.section_title} ({page_range})") + lines.append("") + return "\n".join(lines) + + def _build_text_citations( + self, chunks: list[GenerationChunk], source_file: str + ) -> list[CitationEntry]: + citations: list[CitationEntry] = [] + for chunk in chunks: + evidence_excerpt = " ".join( + item.excerpt for item in chunk.evidence if item.excerpt + ).strip() + excerpt = evidence_excerpt or chunk.markdown.replace("\n", " ").strip() + if len(excerpt) > 240: + excerpt = f"{excerpt[:240]}..." + citations.append( + CitationEntry( + citation_id=f"cite-{chunk.chunk_id}", + section_path=chunk.section_path, + page_start=chunk.page_start, + page_end=chunk.page_end, + source_file=source_file, + source_kind="text", + excerpt=excerpt or None, + ) + ) + return citations + + def _load_section_tree_payload(self, section_tree_path: str | None) -> list[dict[str, Any]]: + if not section_tree_path: + return [] + path = Path(section_tree_path) + if not path.exists(): + return [] + payload = self.storage.read_json(path) + if not isinstance(payload, list): + return [] + return [item for item in payload if isinstance(item, dict)] + + def _load_image_citations(self, image_fill_state_path: str | None) -> list[CitationEntry]: + if not image_fill_state_path: + return [] + state_path = Path(image_fill_state_path) + if not state_path.exists(): + return [] + payload = self.storage.read_json(state_path) + return [ + CitationEntry.model_validate(item) + for item in payload.get("image_citations", []) + if isinstance(item, dict) + ] diff --git a/deeptutor/services/structure_note/markdown_postprocessor.py b/deeptutor/services/structure_note/markdown_postprocessor.py new file mode 
100644
index 000000000..f39b92a4d
--- /dev/null
+++ b/deeptutor/services/structure_note/markdown_postprocessor.py
@@ -0,0 +1,252 @@
+from __future__ import annotations
+
+from collections.abc import Callable
+from dataclasses import dataclass
+import re
+
+_FENCE_RE = re.compile(r"(```[\s\S]*?```|~~~[\s\S]*?~~~)")
+_INLINE_CODE_RE = re.compile(r"`[^`\n]+`")
+_BRACKET_BLOCK_RE = re.compile(r"\\\[([\s\S]*?)\\\]")
+_PAREN_INLINE_RE = re.compile(r"\\\(([\s\S]*?)\\\)")
+_SINGLE_DOLLAR_RE = re.compile(r"(?<!\$)\$(?!\$)([^$\n]+?)(?<!\$)\$(?!\$)")
+_DOUBLE_DOLLAR_RE = re.compile(r"\$\$([\s\S]+?)\$\$")
+_LATEX_ENV_RE = re.compile(r"\\begin\{([A-Za-z]+\*?)\}([\s\S]*?)\\end\{\1\}")
+_MATH_SIGNAL_RE = re.compile(
+    r"(\\[A-Za-z]+|[=<>^_{}]|[+\-*/]\s*[A-Za-z0-9]|[A-Za-z0-9]\s*[+\-*/]|"
+    r"[≤≥≈≠→←×÷±∈∉∪∩∞∑∫√])"
+)
+_CODE_LIKE_CALL_RE = re.compile(r"^[A-Za-z_][\w.]*\([A-Za-z0-9_.,\s:'\"-]*\)$")
+
+
+@dataclass(frozen=True)
+class MarkdownValidationResult:
+    warnings: list[str]
+
+    @property
+    def ok(self) -> bool:
+        return not self.warnings
+
+
+def normalize_structure_note_markdown(markdown_text: str) -> str:
+    """Normalize Structure Note Markdown for the current online/PDF renderers.
+
+    The Structure Note render path uses remark-math/KaTeX online and a PDF
+    fallback renderer. Both paths expect inline math as ``$...$`` and display
+    math as ``$$...$$``. This pass converts unsupported wrappers, repairs common
+    mixed wrappers, and keeps code-like calls as inline code.
+ """ + + if not markdown_text: + return "" + + parts = _split_fenced_code(markdown_text) + normalized = [ + part if is_fence else _normalize_non_fenced_markdown(part) for is_fence, part in parts + ] + return re.sub(r"\n{3,}", "\n\n", "".join(normalized)).strip() + "\n" + + +def validate_renderer_compatible_markdown(markdown_text: str) -> MarkdownValidationResult: + warnings: list[str] = [] + for is_fence, part in _split_fenced_code(markdown_text): + if is_fence: + continue + protected, _restore = _protect_inline_code(part) + if re.search(r"\\[\(\)\[\]]", protected): + warnings.append("Unsupported LaTeX wrapper remains after normalization.") + if _has_inline_double_dollar(protected): + warnings.append("Inline double-dollar math remains after normalization.") + warnings.extend(_dangling_math_delimiter_warnings(protected)) + for kind, expression in _iter_math_expressions(protected): + warnings.extend(_validate_math_expression(expression, kind)) + return MarkdownValidationResult(warnings=warnings) + + +def _split_fenced_code(markdown_text: str) -> list[tuple[bool, str]]: + parts: list[tuple[bool, str]] = [] + last = 0 + for match in _FENCE_RE.finditer(markdown_text): + if match.start() > last: + parts.append((False, markdown_text[last : match.start()])) + parts.append((True, match.group(0))) + last = match.end() + if last < len(markdown_text): + parts.append((False, markdown_text[last:])) + return parts or [(False, markdown_text)] + + +def _protect_inline_code(text: str) -> tuple[str, Callable[[str], str]]: + protected: list[str] = [] + + def stash(match: re.Match[str]) -> str: + protected.append(match.group(0)) + return f"\u0000CODE{len(protected) - 1}\u0000" + + def restore(value: str) -> str: + for index, original in enumerate(protected): + value = value.replace(f"\u0000CODE{index}\u0000", original) + return value + + return _INLINE_CODE_RE.sub(stash, text), restore + + +def _normalize_non_fenced_markdown(text: str) -> str: + protected, restore = 
_protect_inline_code(text) + normalized = _LATEX_ENV_RE.sub(lambda match: _display_math(_latex_env_body(match)), protected) + normalized = _BRACKET_BLOCK_RE.sub(lambda match: _display_math(match.group(1)), normalized) + normalized = _PAREN_INLINE_RE.sub( + lambda match: _inline_math_replacement(match.group(1)), normalized + ) + normalized = _DOUBLE_DOLLAR_RE.sub(lambda match: _display_math(match.group(1)), normalized) + normalized = _SINGLE_DOLLAR_RE.sub( + lambda match: _single_dollar_replacement(match.group(1)), normalized + ) + return restore(normalized) + + +def _latex_env_body(match: re.Match[str]) -> str: + env_name = match.group(1).rstrip("*") + body = match.group(2).strip() + if env_name in {"align", "gather", "multline"}: + return f"\\begin{{aligned}}\n{body}\n\\end{{aligned}}" + return body + + +def _single_dollar_replacement(expression: str) -> str: + expression = _clean_math_expression(expression) + if _is_code_like_expression(expression): + return f"`{expression}`" + if _looks_like_math_expression(expression): + return _inline_math(expression) + return f"${expression}$" + + +def _inline_math_replacement(expression: str) -> str: + expression = _clean_math_expression(expression) + if _is_code_like_expression(expression): + return f"`{expression}`" + return _inline_math(expression) + + +def _inline_math(expression: str) -> str: + body = _clean_math_expression(expression) + return f"${body}$" if body else "" + + +def _display_math(expression: str) -> str: + body = _clean_math_expression(expression) + return f"\n\n$$\n{body}\n$$\n\n" if body else "" + + +def _clean_math_expression(expression: str) -> str: + body = expression.strip() + changed = True + while changed: + changed = False + for opener, closer in (("\\(", "\\)"), ("\\[", "\\]"), ("$$", "$$"), ("$", "$")): + if ( + body.startswith(opener) + and body.endswith(closer) + and len(body) > len(opener) + len(closer) + ): + body = body[len(opener) : len(body) - len(closer)].strip() + changed = True + body 
= re.sub(r"\n{3,}", "\n\n", body) + return body + + +def _is_code_like_expression(expression: str) -> bool: + if "\\" in expression or "\n" in expression: + return False + if any(symbol in expression for symbol in ("=", "^", "_", "<", ">", "+", "*", "/", "|")): + return False + return bool(_CODE_LIKE_CALL_RE.fullmatch(expression.strip())) + + +def _looks_like_math_expression(expression: str) -> bool: + expr = expression.strip() + if not expr: + return False + if _MATH_SIGNAL_RE.search(expr): + return True + return bool(re.fullmatch(r"[A-Za-z](?:_[A-Za-z0-9]+)?|[A-Za-z]\d*", expr)) + + +def _has_inline_double_dollar(text: str) -> bool: + for match in _DOUBLE_DOLLAR_RE.finditer(text): + before = text[: match.start()].rsplit("\n", 1)[-1].strip() + after = text[match.end() :].split("\n", 1)[0].strip() + if before or after: + return True + return False + + +def _iter_math_expressions(text: str) -> list[tuple[str, str]]: + expressions: list[tuple[str, str]] = [] + display_spans: list[tuple[int, int]] = [] + for match in _DOUBLE_DOLLAR_RE.finditer(text): + expressions.append(("display", match.group(1).strip())) + display_spans.append((match.start(), match.end())) + + def is_inside_display(match: re.Match[str]) -> bool: + return any(start <= match.start() and match.end() <= end for start, end in display_spans) + + for match in _SINGLE_DOLLAR_RE.finditer(text): + if not is_inside_display(match): + expressions.append(("inline", match.group(1).strip())) + return expressions + + +def _validate_math_expression(expression: str, kind: str) -> list[str]: + warnings: list[str] = [] + body = expression.strip() + if not body: + warnings.append(f"Empty {kind} math expression.") + return warnings + if "\\(" in body or "\\)" in body or "\\[" in body or "\\]" in body: + warnings.append(f"Unsupported LaTeX wrapper remains inside {kind} math.") + if "$" in body: + warnings.append(f"Nested dollar delimiter remains inside {kind} math.") + if not _balanced_braces(body, "{", "}"): + 
+        warnings.append(f"Unbalanced braces in {kind} math: {body[:80]}")
+    if not _balanced_braces(body, "(", ")"):
+        warnings.append(f"Unbalanced parentheses in {kind} math: {body[:80]}")
+    if not _balanced_braces(body, "[", "]"):
+        warnings.append(f"Unbalanced brackets in {kind} math: {body[:80]}")
+    return warnings
+
+
+def _balanced_braces(value: str, opener: str, closer: str) -> bool:
+    depth = 0
+    escaped = False
+    for char in value:
+        if escaped:
+            escaped = False
+            continue
+        if char == "\\":
+            escaped = True
+            continue
+        if char == opener:
+            depth += 1
+        elif char == closer:
+            depth -= 1
+            if depth < 0:
+                return False
+    return depth == 0
+
+
+def _dangling_math_delimiter_warnings(text: str) -> list[str]:
+    warnings: list[str] = []
+    without_display = _DOUBLE_DOLLAR_RE.sub("", text)
+    for line in without_display.splitlines():
+        scan = re.sub(r"\\\$", "", line)
+        scan = re.sub(r"\$\d+(?:[.,]\d+)?", "", scan)
+        single_dollars = [match.start() for match in re.finditer(r"(?<!\$)\$(?!\$)", scan)]
+        if len(single_dollars) % 2 == 1:
+            warnings.append(f"Dangling inline math delimiter: {line.strip()[:80]}")
+    return warnings
diff --git a/deeptutor/services/structure_note/normalizer.py b/deeptutor/services/structure_note/normalizer.py
new file mode 100644
--- /dev/null
+++ b/deeptutor/services/structure_note/normalizer.py
@@ -0,0 +1,49 @@
+from __future__ import annotations
+
+from pathlib import Path
+import shutil
+import subprocess
+
+
+class NormalizationError(RuntimeError):
+    """Raised when a Structure Note source file cannot be normalized to PDF."""
+
+
+def normalize_to_pdf(source_path: Path, output_dir: Path) -> Path:
+    output_dir.mkdir(parents=True, exist_ok=True)
+    suffix = source_path.suffix.lower()
+    target_pdf = output_dir / "normalized.pdf"
+
+    if suffix == ".pdf":
+        shutil.copy2(source_path, target_pdf)
+        return target_pdf
+
+    if suffix not in {".ppt", ".pptx"}:
+        raise NormalizationError(f"Unsupported file type for Structure Note: {suffix}")
+
+    soffice = shutil.which("soffice")
+    if not soffice:
+        raise NormalizationError(
+            "LibreOffice is required for PPT/PPTX uploads. Install `soffice` and retry."
+ ) + + command = [ + soffice, + "--headless", + "--convert-to", + "pdf", + "--outdir", + str(output_dir), + str(source_path), + ] + result = subprocess.run(command, capture_output=True, text=True, check=False) + if result.returncode != 0: + stderr = result.stderr.strip() or result.stdout.strip() or "Unknown conversion error" + raise NormalizationError(f"Failed to convert PPT/PPTX to PDF: {stderr}") + + converted_pdf = output_dir / f"{source_path.stem}.pdf" + if not converted_pdf.exists(): + raise NormalizationError("LibreOffice reported success but did not produce a PDF output.") + + converted_pdf.replace(target_pdf) + return target_pdf diff --git a/deeptutor/services/structure_note/page_index.py b/deeptutor/services/structure_note/page_index.py new file mode 100644 index 000000000..be559f920 --- /dev/null +++ b/deeptutor/services/structure_note/page_index.py @@ -0,0 +1,108 @@ +from __future__ import annotations + +from pathlib import Path +import re +from statistics import median + +from .models import ImageCandidate, PageIndexPage, TextBlock, TitleCandidate + +_HEADING_PATTERN = re.compile(r"^(\d+([.\-]\d+)*|[IVXLC]+|[A-Z])[\).:\s-]") + + +def _bbox_list(bbox: tuple[float, float, float, float] | list[float]) -> list[float]: + return [float(value) for value in bbox] + + +def build_page_index(pdf_path: Path) -> list[PageIndexPage]: + try: + import fitz + except ImportError as exc: # pragma: no cover - dependency is runtime-required + raise RuntimeError("PyMuPDF is required for Structure Note indexing.") from exc + + pages: list[PageIndexPage] = [] + document = fitz.open(pdf_path) + try: + for page_index, page in enumerate(document, start=1): + raw = page.get_text("dict") + blocks: list[TextBlock] = [] + title_candidates: list[TitleCandidate] = [] + image_candidates: list[ImageCandidate] = [] + font_sizes: list[float] = [] + max_font_size = 0.0 + + for block in raw.get("blocks", []): + block_type = int(block.get("type", 0)) + bbox = _bbox_list(block.get("bbox", [0, 
0, 0, 0])) + if block_type == 1: + width = float(bbox[2] - bbox[0]) + height = float(bbox[3] - bbox[1]) + page_area = max(page.rect.width * page.rect.height, 1.0) + image_candidates.append( + ImageCandidate( + candidate_id=f"img-{page_index}-{len(image_candidates) + 1}", + page_number=page_index, + bbox=bbox, + width=width, + height=height, + area_ratio=(width * height) / page_area, + ) + ) + continue + + lines = block.get("lines", []) + for line in lines: + spans = line.get("spans", []) + text = "".join(str(span.get("text", "")) for span in spans).strip() + if not text: + continue + span_sizes = [float(span.get("size", 0.0) or 0.0) for span in spans] + line_font_size = max(span_sizes) if span_sizes else None + if line_font_size: + font_sizes.extend(span_sizes) + max_font_size = max(max_font_size, line_font_size) + line_bbox = _bbox_list(line.get("bbox", bbox)) + blocks.append( + TextBlock( + text=text, + bbox=line_bbox, + font_size=line_font_size, + ) + ) + + size_median = median(font_sizes) if font_sizes else 0.0 + top_threshold = page.rect.height * 0.45 + for block in blocks: + font_size = block.font_size or 0.0 + heading_like = bool(_HEADING_PATTERN.match(block.text)) + large_enough = font_size >= max(size_median + 1.5, max_font_size * 0.82, 11.5) + near_top = block.bbox[1] <= top_threshold + if len(block.text) > 160: + continue + if not (heading_like or (large_enough and near_top)): + continue + title_candidates.append( + TitleCandidate( + text=block.text, + page_number=page_index, + bbox=block.bbox, + font_size=font_size or None, + score=round((font_size or 0.0) + (3 if heading_like else 0), 3), + ) + ) + + page_text = "\n".join(block.text for block in blocks).strip() + pages.append( + PageIndexPage( + page_number=page_index, + width=float(page.rect.width), + height=float(page.rect.height), + text=page_text, + text_blocks=blocks, + title_candidates=title_candidates, + image_candidates=image_candidates, + ) + ) + finally: + document.close() + + return pages 
diff --git a/deeptutor/services/structure_note/planner.py b/deeptutor/services/structure_note/planner.py new file mode 100644 index 000000000..3e7de795b --- /dev/null +++ b/deeptutor/services/structure_note/planner.py @@ -0,0 +1,125 @@ +from __future__ import annotations + +import re + +from .models import DocumentPlan, PageIndexPage, SectionEvidence, SectionPlan, SectionTreeNode + + +def _clean_text(text: str, limit: int) -> str: + cleaned = re.sub(r"\s+", " ", text).strip() + if len(cleaned) <= limit: + return cleaned + return f"{cleaned[:limit].rstrip()}..." + + +def _page_lookup(pages: list[PageIndexPage]) -> dict[int, PageIndexPage]: + return {page.page_number: page for page in pages} + + +def _section_evidence( + pages: list[PageIndexPage], + page_numbers: list[int], + *, + excerpt_limit: int = 900, +) -> list[SectionEvidence]: + lookup = _page_lookup(pages) + evidence: list[SectionEvidence] = [] + for page_number in page_numbers: + page = lookup.get(page_number) + if not page: + continue + excerpt = _clean_text(page.text, excerpt_limit) + if not excerpt and not page.image_candidates and not page.title_candidates: + continue + evidence.append( + SectionEvidence( + page_number=page_number, + excerpt=excerpt, + title_candidates=[candidate.text for candidate in page.title_candidates[:5]], + image_candidate_ids=[ + candidate.candidate_id for candidate in page.image_candidates[:8] + ], + ) + ) + return evidence + + +def _fallback_summary(evidence: list[SectionEvidence]) -> str: + for item in evidence: + if item.excerpt: + return _clean_text(item.excerpt, 220) + return "" + + +def _build_page_to_sections(sections: list[SectionPlan]) -> dict[str, list[str]]: + mapping: dict[str, list[str]] = {} + for section in sections: + for page_number in section.page_numbers: + mapping.setdefault(str(page_number), []).append(section.section_id) + return mapping + + +def _document_summary(sections: list[SectionPlan], language: str) -> str: + titles = [section.title for section in 
sections[:8]] + if not titles: + return ( + "No extractable section structure was found." + if language != "zh" + else "未提取到可用章节结构。" + ) + joined = " / ".join(titles) + if language == "zh": + return f"本讲义围绕 {joined} 等章节组织内容。" + return f"This note is organized around {joined}." + + +def build_document_plan( + pages: list[PageIndexPage], + sections: list[SectionTreeNode], + *, + document_title: str, + language: str = "en", +) -> DocumentPlan: + """Create the Structure Note planning backbone from the PageIndex-style tree. + + This intentionally stays inside Structure Note. It uses the document tree as the + retrieval surface, then attaches page-grounded evidence for section generation. + """ + + section_plans: list[SectionPlan] = [] + previous_section_id: str | None = None + + for node in sorted(sections, key=lambda item: (item.page_start, item.level, item.section_id)): + page_numbers = list(range(node.page_start, node.page_end + 1)) + evidence = _section_evidence(pages, page_numbers) + summary = node.summary.strip() or _fallback_summary(evidence) + writing_goal = ( + f"Explain {node.title} as a coherent study-note section using pages {node.page_start}-{node.page_end}." 
+ if language != "zh" + else f"基于第 {node.page_start}-{node.page_end} 页,把“{node.title}”写成连贯的学习讲义章节。" + ) + dependencies = [previous_section_id] if previous_section_id else [] + section_plans.append( + SectionPlan( + section_id=node.section_id, + title=node.title, + level=node.level, + section_path=node.path or [node.title], + page_start=node.page_start, + page_end=node.page_end, + page_numbers=page_numbers, + summary=summary, + writing_goal=writing_goal, + dependencies=dependencies, + evidence=evidence, + ) + ) + previous_section_id = node.section_id + + return DocumentPlan( + document_title=document_title, + document_summary=_document_summary(section_plans, language), + outline=section_plans, + section_order=[section.section_id for section in section_plans], + page_to_sections=_build_page_to_sections(section_plans), + ) diff --git a/deeptutor/services/structure_note/renderer.py b/deeptutor/services/structure_note/renderer.py new file mode 100644 index 000000000..0572660e9 --- /dev/null +++ b/deeptutor/services/structure_note/renderer.py @@ -0,0 +1,178 @@ +from __future__ import annotations + +from html import escape +import json +from pathlib import Path +import re + +from .markdown_postprocessor import ( + normalize_structure_note_markdown, + validate_renderer_compatible_markdown, +) +from .models import CitationEntry + +_STYLE = """ +@page { + margin: 20mm 16mm; +} +body { + font-family: "Helvetica", Arial, sans-serif; + color: #202427; + font-size: 11pt; + line-height: 1.65; +} +h1, h2, h3, h4 { + color: #111827; + page-break-after: avoid; + text-wrap: balance; +} +h1 { + font-size: 22pt; + margin-bottom: 8mm; +} +h2 { + font-size: 16pt; + margin-top: 8mm; +} +h3 { + font-size: 13pt; + margin-top: 6mm; +} +p, li { + orphans: 3; + widows: 3; +} +img { + max-width: 100%; + border-radius: 4px; + margin: 6mm 0 2mm; +} +figure, table, pre { + page-break-inside: avoid; +} +code { + background: #f3f4f6; + padding: 0.1rem 0.25rem; + border-radius: 3px; +} +.math-inline 
{ + font-family: "Courier New", monospace; + background: #f9fafb; + border-radius: 3px; + padding: 0.05rem 0.2rem; +} +blockquote { + border-left: 3px solid #d1d5db; + color: #4b5563; + padding-left: 12px; + margin-left: 0; +} +.math-block { + display: block; + margin: 4mm 0; + padding: 3mm 4mm; + background: #f9fafb; + border: 1px solid #e5e7eb; + border-radius: 4px; + overflow-wrap: anywhere; +} +.math-block pre { + margin: 0; + white-space: pre-wrap; + font-family: "Courier New", monospace; + font-size: 10pt; + line-height: 1.45; + background: transparent; +} +""" + + +class RenderError(RuntimeError): + pass + + +_MATH_BLOCK_RE = re.compile(r"(? str: + parts: list[str] = [] + last = 0 + for match in _FENCE_RE.finditer(markdown_text): + if match.start() > last: + parts.append(_render_math_in_non_fenced_text(markdown_text[last : match.start()])) + parts.append(match.group(0)) + last = match.end() + if last < len(markdown_text): + parts.append(_render_math_in_non_fenced_text(markdown_text[last:])) + return "".join(parts) + + +def _render_math_in_non_fenced_text(markdown_text: str) -> str: + def replace_display(match: re.Match[str]) -> str: + expression = match.group(1).strip() + if not expression: + return "" + return f'\n\n
{escape(expression)}
\n\n' + + def replace_inline(match: re.Match[str]) -> str: + expression = match.group(1).strip() + if not expression: + return "" + return f'{escape(expression)}' + + rendered = _MATH_BLOCK_RE.sub(replace_display, markdown_text) + return _MATH_INLINE_RE.sub(replace_inline, rendered) + + +def render_pdf( + markdown_text: str, + title: str, + citation_entries: list[CitationEntry], + job_dir: Path, + final_dir: Path, +) -> tuple[Path, Path]: + try: + from markdown import markdown + except ImportError as exc: # pragma: no cover - runtime dependency + raise RenderError( + "The `markdown` package is required for Structure Note rendering." + ) from exc + + try: + from weasyprint import HTML + except ImportError as exc: + raise RenderError( + "WeasyPrint is required for Structure Note PDF export. Install `weasyprint` and retry." + ) from exc + + markdown_text = normalize_structure_note_markdown(markdown_text) + validation = validate_renderer_compatible_markdown(markdown_text) + if not validation.ok: + detail = "; ".join(validation.warnings) + raise RenderError(f"Structure Note Markdown contains unsupported math syntax: {detail}") + + final_dir.mkdir(parents=True, exist_ok=True) + html_ready_markdown = _render_math_for_pdf(markdown_text) + html_body = markdown(html_ready_markdown, extensions=["extra", "fenced_code", "tables", "toc"]) + html = ( + "" + f"{title}" + "" + f"{html_body}" + ) + + pdf_path = final_dir / "final.pdf" + HTML(string=html, base_url=str(job_dir)).write_pdf(str(pdf_path)) + + citation_path = final_dir / "citation_manifest.json" + with open(citation_path, "w", encoding="utf-8") as handle: + json.dump( + [entry.model_dump(mode="json") for entry in citation_entries], + handle, + ensure_ascii=False, + indent=2, + ) + + return pdf_path, citation_path diff --git a/deeptutor/services/structure_note/storage.py b/deeptutor/services/structure_note/storage.py new file mode 100644 index 000000000..a5d49f0af --- /dev/null +++ 
b/deeptutor/services/structure_note/storage.py @@ -0,0 +1,185 @@ +from __future__ import annotations + +from datetime import datetime +import json +import os +from pathlib import Path +import shutil +from typing import Any + +from deeptutor.services.path_service import PathService, get_path_service + +from .models import StructureNoteArtifact, StructureNoteProject + + +def _utc_now() -> str: + return datetime.utcnow().isoformat() + + +class StructureNoteStorage: + def __init__(self, path_service: PathService | None = None): + self.path_service = path_service or get_path_service() + + def get_root_dir(self) -> Path: + return self.path_service.get_structure_note_dir() + + def get_job_dir(self, job_id: str) -> Path: + return self.path_service.get_structure_note_job_dir(job_id) + + def ensure_job_dirs(self, job_id: str) -> dict[str, Path]: + job_dir = self.get_job_dir(job_id) + dirs = { + "job": job_dir, + "source": job_dir / "source", + "normalized": job_dir / "normalized", + "index": job_dir / "index", + "chunks": job_dir / "chunks", + "images": job_dir / "images", + "final": job_dir / "final", + } + for directory in dirs.values(): + directory.mkdir(parents=True, exist_ok=True) + return dirs + + def artifact_path(self, job_id: str) -> Path: + return self.get_job_dir(job_id) / "artifact.json" + + def projects_path(self) -> Path: + return self.get_root_dir() / "projects.json" + + def write_artifact(self, artifact: StructureNoteArtifact) -> StructureNoteArtifact: + payload = artifact.model_dump(mode="json") + path = self.artifact_path(artifact.job_id) + path.parent.mkdir(parents=True, exist_ok=True) + with open(path, "w", encoding="utf-8") as handle: + json.dump(payload, handle, indent=2, ensure_ascii=False) + return artifact + + def read_artifact(self, job_id: str) -> StructureNoteArtifact: + with open(self.artifact_path(job_id), encoding="utf-8") as handle: + return StructureNoteArtifact.model_validate(json.load(handle)) + + def artifact_exists(self, job_id: str) -> 
bool: + return self.artifact_path(job_id).exists() + + def delete_job_dir(self, job_id: str) -> None: + shutil.rmtree(self.get_job_dir(job_id), ignore_errors=True) + + def list_artifacts(self) -> list[StructureNoteArtifact]: + artifacts: list[StructureNoteArtifact] = [] + root = self.get_root_dir() + if not root.exists(): + return artifacts + for child in root.iterdir(): + if not child.is_dir(): + continue + artifact_path = child / "artifact.json" + if not artifact_path.exists(): + continue + try: + with open(artifact_path, encoding="utf-8") as handle: + artifacts.append(StructureNoteArtifact.model_validate(json.load(handle))) + except Exception: + continue + artifacts.sort(key=lambda item: item.updated_at, reverse=True) + return artifacts + + def read_projects(self) -> list[StructureNoteProject]: + path = self.projects_path() + if not path.exists(): + return [] + try: + with open(path, encoding="utf-8") as handle: + payload = json.load(handle) + except Exception: + return [] + if not isinstance(payload, list): + return [] + projects: list[StructureNoteProject] = [] + for item in payload: + if not isinstance(item, dict): + continue + try: + projects.append(StructureNoteProject.model_validate(item)) + except Exception: + continue + return projects + + def write_projects(self, projects: list[StructureNoteProject]) -> list[StructureNoteProject]: + path = self.projects_path() + path.parent.mkdir(parents=True, exist_ok=True) + with open(path, "w", encoding="utf-8") as handle: + json.dump( + [project.model_dump(mode="json") for project in projects], + handle, + indent=2, + ensure_ascii=False, + ) + return projects + + def write_json(self, path: Path, payload: Any) -> Path: + path.parent.mkdir(parents=True, exist_ok=True) + with open(path, "w", encoding="utf-8") as handle: + json.dump(payload, handle, indent=2, ensure_ascii=False) + return path + + def read_json(self, path: Path) -> Any: + with open(path, encoding="utf-8") as handle: + return json.load(handle) + + def 
write_text(self, path: Path, content: str) -> Path: + path.parent.mkdir(parents=True, exist_ok=True) + path.write_text(content, encoding="utf-8") + return path + + def output_url_for(self, path: str | Path | None) -> str | None: + if not path: + return None + candidate = Path(path).resolve() + root = self.path_service.get_user_root().resolve() + try: + relative = candidate.relative_to(root) + except ValueError: + return None + return f"/api/outputs/{relative.as_posix()}" + + def get_retention_mode(self) -> str: + default_mode = "full" if os.getenv("PYTEST_CURRENT_TEST") else "minimal" + mode = os.getenv("STRUCTURE_NOTE_RETENTION_MODE", default_mode).strip().lower() + return mode if mode in {"full", "minimal"} else default_mode + + def apply_retention_policy(self, artifact: StructureNoteArtifact) -> None: + if self.get_retention_mode() != "minimal": + return + + preserved: set[Path] = {self.artifact_path(artifact.job_id).resolve()} + for candidate in ( + artifact.final_pdf_path, + artifact.citation_manifest_path, + artifact.rendered_markdown_path, + artifact.page_index_path, + artifact.section_tree_path, + artifact.document_plan_path, + artifact.generation_chunks_path, + artifact.image_fill_state_path, + ): + if candidate: + preserved.add(Path(candidate).resolve()) + + for directory_name in ("normalized", "index", "chunks"): + directory = self.get_job_dir(artifact.job_id) / directory_name + if not directory.exists(): + continue + for child in directory.rglob("*"): + if child.is_dir(): + continue + if child.resolve() in preserved: + continue + child.unlink(missing_ok=True) + + def touch_updated_at(self, artifact: StructureNoteArtifact) -> StructureNoteArtifact: + artifact.updated_at = _utc_now() + return artifact + + def new_timestamp(self) -> str: + return _utc_now() diff --git a/deeptutor/services/structure_note/tree_builder.py b/deeptutor/services/structure_note/tree_builder.py new file mode 100644 index 000000000..bcf0121bd --- /dev/null +++ 
b/deeptutor/services/structure_note/tree_builder.py @@ -0,0 +1,205 @@ +from __future__ import annotations + +from collections import defaultdict +import re + +from deeptutor.services.llm import complete as llm_complete +from deeptutor.utils.json_parser import parse_json_response + +from .models import PageIndexPage, SectionTreeNode + + +def _collect_heading_candidates(pages: list[PageIndexPage]) -> list[dict[str, object]]: + grouped: dict[tuple[int, str], dict[str, object]] = {} + for page in pages: + for candidate in page.title_candidates: + key = (candidate.page_number, candidate.text.strip()) + current = grouped.get(key) + payload = { + "page_number": candidate.page_number, + "text": candidate.text.strip(), + "font_size": candidate.font_size, + "score": candidate.score, + } + if current is None or float(payload["score"] or 0.0) > float( + current.get("score") or 0.0 + ): + grouped[key] = payload + candidates = list(grouped.values()) + candidates.sort(key=lambda item: (int(item["page_number"]), -float(item.get("score") or 0.0))) + return candidates[:60] + + +def _clean_excerpt(text: str, limit: int = 520) -> str: + cleaned = re.sub(r"\s+", " ", text).strip() + if len(cleaned) <= limit: + return cleaned + return f"{cleaned[:limit].rstrip()}..." 
+ + +def _page_overviews(pages: list[PageIndexPage], limit: int = 36) -> list[dict[str, object]]: + overviews: list[dict[str, object]] = [] + for page in pages[:limit]: + overviews.append( + { + "page_number": page.page_number, + "heading_candidates": [candidate.text for candidate in page.title_candidates[:5]], + "excerpt": _clean_excerpt(page.text, 480), + "image_count": len(page.image_candidates), + } + ) + return overviews + + +def _summary_from_pages(pages: list[PageIndexPage], page_start: int, page_end: int) -> str: + snippets: list[str] = [] + for page in pages: + if page_start <= page.page_number <= page_end and page.text.strip(): + snippets.append(_clean_excerpt(page.text, 180)) + if len(snippets) >= 2: + break + return " ".join(snippets) + + +def _fallback_sections(pages: list[PageIndexPage], page_window: int) -> list[SectionTreeNode]: + nodes: list[SectionTreeNode] = [] + for index, start in enumerate(range(1, len(pages) + 1, page_window), start=1): + end = min(start + page_window - 1, len(pages)) + title = f"Pages {start}-{end}" if start != end else f"Page {start}" + nodes.append( + SectionTreeNode( + section_id=f"fallback-{index:03d}", + title=title, + level=2, + page_start=start, + page_end=end, + summary=_summary_from_pages(pages, start, end), + path=[title], + ) + ) + return nodes + + +def _coerce_sections( + raw_sections: list[dict[str, object]], total_pages: int +) -> list[dict[str, object]]: + sections: list[dict[str, object]] = [] + seen: set[tuple[int, str]] = set() + for raw in raw_sections: + title = str(raw.get("title", "")).strip() + if not title: + continue + try: + page_start = int(raw.get("page_start", 0)) + except Exception: + continue + if page_start < 1 or page_start > total_pages: + continue + try: + level = int(raw.get("level", 2)) + except Exception: + level = 2 + level = max(2, min(level, 5)) + summary = str(raw.get("summary", "")).strip() + key = (page_start, title) + if key in seen: + continue + seen.add(key) + sections.append( + 
{"title": title, "page_start": page_start, "level": level, "summary": summary} + ) + sections.sort( + key=lambda item: (int(item["page_start"]), int(item["level"]), str(item["title"])) + ) + return sections + + +async def build_section_tree( + pages: list[PageIndexPage], + page_window: int, + language: str = "en", +) -> list[SectionTreeNode]: + total_pages = len(pages) + candidates = _collect_heading_candidates(pages) + if len(candidates) < 2: + return _fallback_sections(pages, page_window) + + prompt = ( + "You are building a PageIndex-style document tree for Structure Note only.\n" + "PageIndex uses a table-of-contents-like hierarchy first, then retrieves by reasoning over that tree. " + "Your task is to infer a stable document-level outline, not page-by-page notes.\n" + "Return JSON only with shape " + '{"sections": [{"title": str, "level": 2-5, "page_start": int, "summary": str}]}\n' + "Rules:\n" + "- Keep the sections in reading order.\n" + "- Use only headings that are strongly supported by the candidates.\n" + "- Use levels 2-5 only.\n" + "- Do not invent page numbers outside the document.\n" + "- Include 3-20 sections depending on the material.\n" + "- Merge repeated slide headers into one section when they represent the same topic.\n" + "- Summaries should describe the section topic in one short sentence.\n" + f"- Output language: {'Chinese' if language == 'zh' else 'English'}.\n\n" + f"Total pages: {total_pages}\n" + f"Heading candidates: {candidates}\n" + f"Page overviews: {_page_overviews(pages)}" + ) + + try: + raw_response = await llm_complete( + prompt=prompt, + system_prompt="You convert page heading candidates into structured JSON.", + temperature=0.1, + ) + parsed = parse_json_response(raw_response, fallback={}) + raw_sections = parsed.get("sections") if isinstance(parsed, dict) else None + if not isinstance(raw_sections, list): + raise ValueError("Missing sections array") + sections = _coerce_sections(raw_sections, total_pages) + except 
Exception: + sections = [] + + if not sections: + return _fallback_sections(pages, page_window) + + nodes: list[SectionTreeNode] = [] + stack: list[SectionTreeNode] = [] + child_map: dict[str, list[str]] = defaultdict(list) + + for index, section in enumerate(sections): + title = str(section["title"]) + page_start = int(section["page_start"]) + level = int(section["level"]) + + while stack and stack[-1].level >= level: + stack.pop() + + parent_id = stack[-1].section_id if stack else None + path = [*stack[-1].path, title] if stack else [title] + node = SectionTreeNode( + section_id=f"section-{index + 1:03d}", + title=title, + level=level, + page_start=page_start, + page_end=page_start, + summary=str(section.get("summary") or ""), + parent_id=parent_id, + path=path, + ) + if parent_id: + child_map[parent_id].append(node.section_id) + nodes.append(node) + stack.append(node) + + for index, node in enumerate(nodes): + next_boundary = total_pages + 1 + for later in nodes[index + 1 :]: + if later.level <= node.level: + next_boundary = later.page_start + break + node.page_end = max(node.page_start, min(total_pages, next_boundary - 1)) + if not node.summary: + node.summary = _summary_from_pages(pages, node.page_start, node.page_end) + + for node in nodes: + node.child_ids = child_map.get(node.section_id, []) + return nodes diff --git a/docs/features/overview.md b/docs/features/overview.md new file mode 100644 index 000000000..d257ccb89 --- /dev/null +++ b/docs/features/overview.md @@ -0,0 +1,162 @@ +# 🏛️ DeepTutor's Framework + +DeepTutor Full-Stack Workflow + +## 💬 User Interface Layer +• **Intuitive Interaction**: Simple bidirectional query-response flow for intuitive interaction. +• **Structured Output**: Structured response generation that organizes complex information into actionable outputs. +• **Dark/Light Mode**: System-wide theme support with automatic system preference detection. 
+• **Collapsible Sidebar**: Compact navigation with icon-only mode for focused learning. + +## 🤖 Intelligent Agent Modules +• **Problem Solving & Assessment**: Step-by-step problem solving and custom assessment generation. +• **Research & Learning**: Deep Research for topic exploration and Guided Learning with visualization. +• **Idea Generation**: Automated and interactive concept development with multi-source insights. + +## 🔧 Tool Integration Layer +• **Information Retrieval**: RAG hybrid retrieval, real-time web search, and academic paper databases. +• **Processing & Analysis**: Python code execution, query item lookup, and PDF parsing for document analysis. +• **Multi-Provider Support**: Flexible LLM providers (OpenAI, Anthropic, Ollama, etc.) and embedding adapters (OpenAI, Jina, Cohere, Ollama, etc.). + +## 🧠 Knowledge & Memory Foundation +• **Knowledge Graph**: Entity-relation mapping for semantic connections and knowledge discovery. +• **Vector Store**: Embedding-based semantic search for intelligent content retrieval. +• **Memory System**: Session state management and citation tracking for contextual continuity. + +--- + +# Key Features of DeepTutor + +## 📚 Massive Document Knowledge Q&A + +• **Smart Knowledge Base**: Upload textbooks, research papers, technical manuals, and domain-specific documents. Build a comprehensive AI-powered knowledge repository for instant access. + +• **Multi-Agent Problem Solving**: Dual-loop reasoning architecture with RAG, web search, paper search, and code execution—delivering step-by-step solutions with precise citations. + +## 🎨 Interactive Learning Visualization + +• **Knowledge Simplification & Explanations**: Transform complex concepts, knowledge, and algorithms into easy-to-understand visual aids, detailed step-by-step breakdowns, and engaging interactive demonstrations. 
+ +• **Personalized Q&A**: Context-aware conversations that adapt to your learning progress, with interactive pages and session-based knowledge tracking. + +## 🎯 Knowledge Reinforcement with Practice Problem Generator + +• **Intelligent Exercise Creation**: Generate targeted quizzes, practice problems, and customized assessments tailored to your current knowledge level and specific learning objectives. + +• **Authentic Exam Simulation**: Upload reference exams to generate practice questions that perfectly match the original style, format, and difficulty—giving you realistic preparation for the actual test. + +## 🔍 Deep Research & Idea Generation + +• **Comprehensive Research & Literature Review**: Conduct in-depth topic exploration with systematic analysis. Identify patterns, connect related concepts across disciplines, and synthesize existing research findings. + +• **Novel Insight Discovery**: Generate structured learning materials and uncover knowledge gaps. Identify promising new research directions through intelligent cross-domain knowledge synthesis. + +--- + + + + + + + + +
+ +### 📚 Massive Document Knowledge Q&A + +Document Q&A demonstration + +Document Q&A and Step-by-Step Problem Solving + + + +### 🎨 Interactive Learning Visualization + +Interactive learning visualization demo + +Interactive AI Learning with Knowledge Visual Explanations + +
+ + + +### 🎯 Knowledge Reinforcement + + + + + + +
+ +Custom question generation demo + +**Custom Questions** +Auto-Validated Practice Questions with Instant Feedback + + + +Mimic exam style questions demo + +**Mimic Questions** +Clone Exam Style for Authentic Practice + +
+ + + +### 🔍 Deep Research & Idea Generation + + + + + + + +
+ +Deep research with web and paper search demo + +**Deep Research** +Web and Paper Search with Literature Review + + + +Automated idea generation demo + +**Automated IdeaGen** +Systematic Brainstorming and Concept Synthesis + + + +Interactive idea generation demo + +**Interactive IdeaGen** +RAG-powered Idea Generation with Multi-Source Insights + +
+ + + +### 🏗️ All-in-One Knowledge System + + + + + + +
+ +Personal knowledge base demo + +**Personal Knowledge Base** +Build and Organize Your Own Knowledge Repository + + + +Personal notebook demo + +**Personal Notebook** +Your Contextual Memory for Learning Sessions + +
diff --git a/docs/guide/data-preparation.md b/docs/guide/data-preparation.md new file mode 100644 index 000000000..7b502b06d --- /dev/null +++ b/docs/guide/data-preparation.md @@ -0,0 +1,185 @@ +# Data Preparation + +DeepTutor provides demo knowledge bases and sample questions to help you get started quickly. + +## Demo Knowledge Bases + +We provide two pre-built knowledge bases on [Google Drive](https://drive.google.com/drive/folders/1iWwfZXiTuQKQqUYb5fGDZjLCeTUP6DA6?usp=sharing): + +### 1. Research Papers Collection + +
+
+ 📄 + 5 Research Papers (20-50 pages each) +
+
+

A curated collection of cutting-edge research papers from our lab, covering the RAG and Agent fields.

+

Included Papers:

+ +

Best for: Research scenarios, broad knowledge coverage

+
+
+ +### 2. Data Science Textbook + +
+
+ 📚 + 8 Chapters, 296 Pages +
+
+

A comprehensive textbook on deep representation learning from UC Berkeley.

+

Source: Deep Representation Learning Book

+

Topics Covered:

+
    +
  • Neural Network Fundamentals
  • +
  • Representation Learning
  • +
  • Deep Learning Architectures
  • +
  • Advanced Topics
  • +
+

Best for: Learning scenarios, deep knowledge coverage

+
+
+ +## Download & Setup + +### Step 1: Download + +Visit our [Google Drive folder](https://drive.google.com/drive/folders/1iWwfZXiTuQKQqUYb5fGDZjLCeTUP6DA6?usp=sharing) and download: + +- `knowledge_bases.zip` - Pre-built knowledge bases with embeddings +- `questions.zip` - Sample questions and usage examples (optional) + +### Step 2: Extract + +Extract the downloaded files into the `data/` directory: + +``` +DeepTutor/ +├── data/ +│ └── knowledge_bases/ +│ ├── research_papers/ # Research papers KB +│ ├── data_science_book/ # Textbook KB +│ └── kb_config.json # Knowledge base config +└── user/ # User data (auto-created) +``` + +### Step 3: Verify + +After extracting, your knowledge bases will be automatically available when you start DeepTutor. + +::: warning Embedding Compatibility +Our demo knowledge bases use `text-embedding-3-large` with `dimensions = 3072`. + +If your embedding model has different dimensions, you'll need to create your own knowledge base instead. +::: + +## Creating Custom Knowledge Bases + +### Supported File Formats + +| Format | Extension | Notes | +|:-------|:----------|:------| +| PDF | `.pdf` | Supports text extraction and layout analysis | +| Text | `.txt` | Plain text files | +| Markdown | `.md` | Markdown with formatting support | + +### Via Web Interface + +1. Navigate to `http://localhost:3782/knowledge` +2. Click **"New Knowledge Base"** +3. Enter a unique name for your knowledge base +4. Upload your documents (single or batch upload) +5. 
Wait for processing to complete + +::: tip Processing Time +- Small documents (< 10 pages): ~1 minute +- Medium documents (10-100 pages): ~5-10 minutes +- Large documents (100+ pages): May take longer +::: + +### Via Command Line + +```bash +# Initialize a new knowledge base with documents +python -m src.knowledge.start_kb init --docs + +# Add documents to existing knowledge base +python -m src.knowledge.add_documents --docs +``` + +## Data Storage Structure + +All user data is stored in the `data/` directory: + +``` +data/ +├── knowledge_bases/ # Knowledge base storage +│ ├── / +│ │ ├── documents/ # Original documents +│ │ ├── chunks/ # Chunked content +│ │ ├── embeddings/ # Vector embeddings +│ │ └── graph/ # Knowledge graph data +└── user/ # User activity data + ├── solve/ # Problem solving results + ├── question/ # Generated questions + ├── research/ # Research reports + ├── notebook/ # Notebook records + └── logs/ # System logs +``` + +--- + +**Next Step:** [Local Installation →](/guide/local-start) + + diff --git a/docs/guide/local-start.md b/docs/guide/local-start.md new file mode 100644 index 000000000..e015eec86 --- /dev/null +++ b/docs/guide/local-start.md @@ -0,0 +1,190 @@ +# Local Installation + +This guide covers manual installation for development or non-Docker environments. + +## Prerequisites + +- **Python 3.10+** — [Download](https://www.python.org/downloads/) +- **Node.js 18+** — [Download](https://nodejs.org/) +- **Git** — [Download](https://git-scm.com/) + +::: tip Windows Users +If you encounter path length errors during installation, enable long path support: + +```cmd +reg add "HKLM\SYSTEM\CurrentControlSet\Control\FileSystem" /v LongPathsEnabled /t REG_DWORD /d 1 /f +``` + +Restart your terminal after running this command. 
+::: + +## Step 1: Set Up Virtual Environment + +Choose one of the following options: + +::: code-group + +```bash [Conda (Recommended)] +# Create environment +conda create -n deeptutor python=3.10 + +# Activate environment +conda activate deeptutor +``` + +```bash [venv] +# Create environment +python -m venv venv + +# Activate (Windows) +venv\Scripts\activate + +# Activate (macOS/Linux) +source venv/bin/activate +``` + +::: + +## Step 2: Install Dependencies + +### Option A: Automated Installation (Recommended) + +```bash +# Using Python script +python scripts/install_all.py + +# Or using shell script (macOS/Linux) +bash scripts/install_all.sh +``` + +### Option B: Manual Installation + +```bash +# Install Python dependencies +pip install -r requirements.txt + +# Install Node.js dependencies +npm install --prefix web +``` + +::: warning Common Issues +If you see `npm: command not found`: + +```bash +# Using Conda +conda install -c conda-forge nodejs + +# Or install from https://nodejs.org/ +``` +::: + +## Step 3: Configure Environment + +Make sure you have completed the [Pre-Configuration](/guide/pre-config) steps: + +1. ✅ Created `.env` file with your API keys +2. ✅ (Optional) Customized `config/agents.yaml` +3. ✅ (Optional) Downloaded demo knowledge bases + +## Step 4: Launch Application + +### Start Web Interface (Recommended) + +```bash +python scripts/start_web.py +``` + +This starts both the **frontend** (Next.js) and **backend** (FastAPI) servers. 
+ +### Alternative: CLI Interface Only + +```bash +python scripts/start.py +``` + +### Access URLs + +| Service | URL | Description | +|:---:|:---|:---| +| **Frontend** | http://localhost:3782 | Main web interface | +| **API Docs** | http://localhost:8001/docs | Interactive API documentation | + +## Advanced: Start Services Separately + +For development, you may want to run frontend and backend separately: + +### Backend (FastAPI) + +```bash +python src/api/run_server.py + +# Or with uvicorn directly +uvicorn src.api.main:app --host 0.0.0.0 --port 8001 --reload +``` + +### Frontend (Next.js) + +First, create `web/.env.local`: + +```bash +NEXT_PUBLIC_API_BASE=http://localhost:8001 +``` + +Then start the development server: + +```bash +cd web +npm install +npm run dev -- -p 3782 +``` + +## Stopping the Service + +Press `Ctrl+C` in the terminal to stop the service. + +::: warning Port Still in Use? +If you see "port already in use" after pressing Ctrl+C: + +**macOS/Linux:** +```bash +lsof -i :8001 +kill -9 +``` + +**Windows:** +```bash +netstat -ano | findstr :8001 +taskkill /PID /F +``` +::: + +## Troubleshooting + +### Backend fails to start + +**Checklist:** +- Confirm Python version >= 3.10: `python --version` +- Confirm all dependencies installed: `pip install -r requirements.txt` +- Check if port 8001 is in use +- Verify `.env` file configuration + +### Frontend cannot connect to backend + +**Solutions:** +1. Confirm backend is running: visit http://localhost:8001/docs +2. Check browser console for error messages +3. 
Create `web/.env.local` with: + ```bash + NEXT_PUBLIC_API_BASE=http://localhost:8001 + ``` + +### WebSocket connection fails + +**Checklist:** +- Confirm backend is running +- Check firewall settings +- Verify WebSocket URL format: `ws://localhost:8001/api/v1/...` + +--- + +**Next Step:** [Docker Deployment →](/guide/docker-start) diff --git a/docs/guide/pre-config.md b/docs/guide/pre-config.md new file mode 100644 index 000000000..4056263c6 --- /dev/null +++ b/docs/guide/pre-config.md @@ -0,0 +1,201 @@ +# Pre-Configuration + +Before starting DeepTutor, you need to complete the following setup steps. + +## 1. Clone Repository + +```bash +git clone https://github.com/HKUDS/DeepTutor.git +cd DeepTutor +``` + +## 2. Environment Variables Setup + +Create your `.env` file from the template: + +```bash +cp .env.example .env +``` + +Then edit the `.env` file with your API keys: + +```bash +# ============================================================================ +# Server Configuration +# ============================================================================ +BACKEND_PORT=8001 # Backend API port +FRONTEND_PORT=3782 # Frontend web port + +# For remote/LAN access - set to your server's IP address +# NEXT_PUBLIC_API_BASE=http://192.168.1.100:8001 + +# ============================================================================ +# LLM (Large Language Model) Configuration - Required +# ============================================================================ +LLM_BINDING=openai # Provider: openai, anthropic, azure_openai, ollama, etc. +LLM_MODEL=gpt-4o # Model name: gpt-4o, deepseek-chat, claude-3-5-sonnet, etc. 
+LLM_HOST=https://api.openai.com/v1 # API endpoint URL +LLM_API_KEY=your_api_key # Your LLM API key + +# ============================================================================ +# Embedding Model Configuration - Required for Knowledge Base +# ============================================================================ +EMBEDDING_BINDING=openai # Provider type +EMBEDDING_MODEL=text-embedding-3-large # Embedding model name +EMBEDDING_DIMENSION=3072 # Must match model dimensions +EMBEDDING_HOST=https://api.openai.com/v1 # API endpoint +EMBEDDING_API_KEY=your_api_key # Embedding API key + +# ============================================================================ +# Web Search Configuration - Optional +# ============================================================================ +SEARCH_PROVIDER=perplexity # Options: perplexity, tavily, serper, jina, exa, baidu +SEARCH_API_KEY=your_search_api_key # API key for search provider +``` + +### Environment Variables Reference + +| Variable | Required | Description | +|:---|:---:|:---| +| `LLM_MODEL` | **Yes** | Model name (e.g., `gpt-4o`, `deepseek-chat`) | +| `LLM_API_KEY` | **Yes** | Your LLM API key | +| `LLM_HOST` | **Yes** | API endpoint URL | +| `EMBEDDING_MODEL` | **Yes** | Embedding model name | +| `EMBEDDING_DIMENSION` | **Yes** | Must match model output dimensions | +| `EMBEDDING_API_KEY` | **Yes** | Embedding API key | +| `EMBEDDING_HOST` | **Yes** | Embedding API endpoint | +| `BACKEND_PORT` | No | Backend port (default: `8001`) | +| `FRONTEND_PORT` | No | Frontend port (default: `3782`) | +| `NEXT_PUBLIC_API_BASE` | No | Set for remote/LAN access | +| `SEARCH_PROVIDER` | No | Web search provider | +| `SEARCH_API_KEY` | No | Search API key | + +### Supported LLM Providers + +| Provider | `LLM_BINDING` Value | Notes | +|:---------|:--------------------|:------| +| OpenAI | `openai` | GPT-4o, GPT-4, GPT-3.5 | +| Anthropic | `anthropic` | Claude 3.5, Claude 3 | +| Azure OpenAI | `azure_openai` | Enterprise 
deployments | +| Ollama | `ollama` | Local models | +| DeepSeek | `deepseek` | DeepSeek-V3, DeepSeek-R1 | +| Groq | `groq` | Fast inference | +| OpenRouter | `openrouter` | Multi-model gateway | +| Google Gemini | `gemini` | OpenAI-compatible mode | + +### Supported Embedding Providers + +| Provider | `EMBEDDING_BINDING` Value | Notes | +|:---------|:--------------------------|:------| +| OpenAI | `openai` | text-embedding-3-large/small | +| Azure OpenAI | `azure_openai` | Enterprise deployments | +| Jina AI | `jina` | jina-embeddings-v3 | +| Cohere | `cohere` | embed-v3 series | +| Ollama | `ollama` | Local embedding models | +| LM Studio | `lm_studio` | Local inference server | +| HuggingFace | `huggingface` | OpenAI-compatible endpoints | + +## 3. Configuration Files + +DeepTutor uses two YAML configuration files for customization: + +### `config/agents.yaml` - Agent Parameters + +This file controls LLM parameters for each module: + +```yaml +# Solve Module - Problem solving agents +solve: + temperature: 0.3 + max_tokens: 8192 + +# Research Module - Deep research agents +research: + temperature: 0.5 + max_tokens: 12000 + +# Question Module - Question generation agents +question: + temperature: 0.7 + max_tokens: 4096 + +# Guide Module - Learning guidance agents +guide: + temperature: 0.5 + max_tokens: 16192 + +# IdeaGen Module - Idea generation agents +ideagen: + temperature: 0.7 + max_tokens: 4096 + +# CoWriter Module - Collaborative writing agents +co_writer: + temperature: 0.7 + max_tokens: 4096 +``` + +### `config/main.yaml` - System Settings + +This file controls paths, tools, and module-specific settings: + +```yaml +# System language +system: + language: en + +# Data paths +paths: + user_data_dir: ./data/user + knowledge_bases_dir: ./data/knowledge_bases + +# Tool configuration +tools: + rag_tool: + kb_base_dir: ./data/knowledge_bases + default_kb: ai_textbook + run_code: + workspace: ./data/user/run_code_workspace + web_search: + enabled: true + 
query_item: + enabled: true + max_results: 5 + +# Module-specific settings +research: + researching: + execution_mode: series # "series" or "parallel" + max_iterations: 5 + enable_rag_hybrid: true + enable_paper_search: true + enable_web_search: true +``` + +> **Tip:** For most users, the default configuration works well. Only modify these files if you need specific customizations. + +## 4. Knowledge Base Preparation (Optional) + +You can use our pre-built demo knowledge bases to get started quickly. + +### Download Demo Knowledge Bases + +Download from [Google Drive](https://drive.google.com/drive/folders/1iWwfZXiTuQKQqUYb5fGDZjLCeTUP6DA6?usp=sharing) and extract into the `data/` directory. + +::: info Important +The demo knowledge bases use `text-embedding-3-large` with `dimensions = 3072`. Make sure your embedding model has matching dimensions. +::: + +### Create Your Own Knowledge Base + +After launching DeepTutor: + +1. Navigate to `http://localhost:3782/knowledge` +2. Click **"New Knowledge Base"** +3. Enter a unique name +4. Upload PDF/TXT/MD files +5. Monitor progress in the terminal + +--- + +**Next Step:** [Data Preparation →](/guide/data-preparation) diff --git a/docs/guide/troubleshooting.md b/docs/guide/troubleshooting.md new file mode 100644 index 000000000..37803c3ff --- /dev/null +++ b/docs/guide/troubleshooting.md @@ -0,0 +1,170 @@ +# ❓ FAQ + +## Backend fails to start? + +**Checklist** +- Confirm Python version >= 3.10 +- Confirm all dependencies installed: `pip install -r requirements.txt` +- Check if port 8001 is in use (configurable in `config/main.yaml`) +- Check `.env` file configuration + +**Solutions** +- **Change port**: Edit `config/main.yaml` server.backend_port +- **Check logs**: Review terminal error messages + +--- + +## Port occupied after Ctrl+C? + +**Problem** + +After pressing Ctrl+C during a running task (e.g., deep research), restarting shows "port already in use" error. 
+ +**Cause** + +Ctrl+C sometimes only terminates the frontend process while the backend continues running in the background. + +**Solution** + +```bash +# macOS/Linux +kill -9 $(lsof -t -i :8001) + +# Windows +netstat -ano | findstr :8001 +taskkill /PID /F +``` + +Then restart the service with `python scripts/start_web.py`. + +--- + +## npm: command not found error? + +**Problem** + +Running `scripts/start_web.py` shows `npm: command not found` or exit status 127. + +**Checklist** +- Check if npm is installed: `npm --version` +- Check if Node.js is installed: `node --version` +- Confirm conda environment is activated (if using conda) + +**Solutions** +```bash +# Option A: Using Conda (Recommended) +conda install -c conda-forge nodejs + +# Option B: Using Official Installer +# Download from https://nodejs.org/ + +# Option C: Using nvm +nvm install 18 +nvm use 18 +``` + +**Verify Installation** +```bash +node --version # Should show v18.x.x or higher +npm --version # Should show version number +``` + +--- + +## Frontend cannot connect to backend? + +**Checklist** +- Confirm backend is running (visit `http://localhost:8001/docs`) +- Check browser console for error messages + +**Solution** + +Create `.env.local` in `web` directory: + +```bash +NEXT_PUBLIC_API_BASE=http://localhost:8001 +``` + +--- + +## WebSocket connection fails? + +**Checklist** +- Confirm backend is running +- Check firewall settings +- Confirm WebSocket URL is correct + +**Solution** +- **Check backend logs** +- **Confirm URL format**: `ws://localhost:8001/api/v1/...` + +--- + +## Where are module outputs stored? 
+ +| Module | Output Path | +|:---:|:---| +| Solve | `data/user/solve/solve_YYYYMMDD_HHMMSS/` | +| Question | `data/user/question/question_YYYYMMDD_HHMMSS/` | +| Research | `data/user/research/reports/` | +| Interactive IdeaGen | `data/user/co-writer/` | +| Notebook | `data/user/notebook/` | +| Guide | `data/user/guide/session_{session_id}.json` | +| Logs | `data/user/logs/` | + +--- + +## How to add a new knowledge base? + +**Web Interface** +1. Visit `http://localhost:3782/knowledge` +2. Click "New Knowledge Base" +3. Enter knowledge base name +4. Upload PDF/TXT/MD documents +5. System will process documents in background + +**CLI** +```bash +python -m src.knowledge.start_kb init --docs +``` + +--- + +## How to incrementally add documents to existing KB? + +**CLI (Recommended)** +```bash +python -m src.knowledge.add_documents --docs +``` + +**Benefits** +- Only processes new documents, saves time and API costs +- Automatically merges with existing knowledge graph +- Preserves all existing data + +--- + +## Numbered items extraction failed with uvloop.Loop error? + +**Problem** + +When initializing a knowledge base, you may encounter this error: +```text +ValueError: Can't patch loop of type +``` + +This occurs because Uvicorn uses `uvloop` event loop by default, which is incompatible with `nest_asyncio`. + +**Solution** + +Use one of the following methods to extract numbered items: + +```bash +# Option 1: Using the shell script (recommended) +./scripts/extract_numbered_items.sh + +# Option 2: Direct Python command +python src/knowledge/extract_numbered_items.py --kb --base-dir ./data/knowledge_bases +``` + +This will extract numbered items (Definitions, Theorems, Equations, etc.) from your knowledge base without reinitializing it. 
diff --git a/docs/index.md b/docs/index.md new file mode 100644 index 000000000..3e892b379 --- /dev/null +++ b/docs/index.md @@ -0,0 +1,77 @@ +--- +layout: home + +hero: + name: "DeepTutor" + text: "Your AI Learning Companion" + tagline: Transform any document into an interactive learning experience with multi-agent intelligence + image: + src: /logo.png + alt: DeepTutor + actions: + - theme: brand + text: Get Started → + link: /guide/pre-config + - theme: alt + text: GitHub + link: https://github.com/HKUDS/DeepTutor + +features: + - icon: 📚 + title: Massive Document Q&A + details: Upload textbooks, papers, and manuals. Build AI-powered knowledge repositories with RAG and knowledge graph integration. + - icon: 🧠 + title: Smart Problem Solving + details: Dual-loop reasoning architecture with multi-agent collaboration, delivering step-by-step solutions with precise citations. + - icon: 🎯 + title: Practice Generator + details: Generate custom quizzes based on your knowledge base, or mimic real exam styles for authentic practice. + - icon: 🎓 + title: Guided Learning + details: Personalized learning paths with interactive visualizations and adaptive explanations. + - icon: 🔬 + title: Deep Research + details: Systematic topic exploration with web search, paper retrieval, and literature synthesis. + - icon: 💡 + title: Idea Generation + details: AI-assisted brainstorming with knowledge extraction and multi-stage filtering. +--- + +## Why DeepTutor? 
+ +- **Deep Understanding** — Not just answers, but guided learning journeys with visual explanations +- **Multi-Modal Support** — PDF, LaTeX, images, code execution, and more +- **Knowledge Graph** — Semantic connections powered by LightRAG for better comprehension +- **All-in-One Platform** — Problem solving, question generation, research, and idea generation in one place + + diff --git a/docs/roadmap.md b/docs/roadmap.md new file mode 100644 index 000000000..c0e530452 --- /dev/null +++ b/docs/roadmap.md @@ -0,0 +1,41 @@ +# Roadmap + +Our vision for DeepTutor's future development. + +## ✅ Recently Completed (v0.4.0) + +- [x] **RAG Module Decoupling** — Modular RAG architecture with provider-agnostic interface + - Currently supports RAG-Anything (MinerU + LightRAG) + - More backends coming soon +- [x] **Multi-Provider Support** — Expanded LLM and Embedding provider options + - LLM: OpenAI, Anthropic, Azure, Ollama, Groq, OpenRouter, DeepSeek, Gemini + - Embedding: OpenAI, Jina, Cohere, Ollama, LM Studio, HuggingFace +- [x] **Dark Mode** — System-wide dark/light theme support +- [x] **Environment Configuration** — Unified `.env` based configuration + +## 🚀 Planned Features + +- [ ] **Deepcoding from Idea Generation** — Transform research ideas into working prototypes +- [ ] **Personalized Memory** — Adapt tutoring style based on user learning history +- [ ] **Additional RAG Backends** — LlamaIndex, ChromaDB, Pinecone integration +- [ ] **More Embedding Adapters** — Voyage AI, Mixedbread, local transformers + +## 💭 Under Consideration + +- Multi-language support +- Mobile-friendly interface +- Collaborative learning features +- Voice interaction support +- Faster frontend framework + +## 🤝 Community Requests + +Have a feature idea? We'd love to hear it! 
+ +- Open a [Feature Request](https://github.com/HKUDS/DeepTutor/issues/new?template=feature_request.yml) +- Join the discussion on existing proposals +- Check our [GitHub Discussions](https://github.com/HKUDS/DeepTutor/discussions) + +--- + +⭐ **Star the repo** to follow our future updates! diff --git a/docs/testdoc/structure-note-prd.md b/docs/testdoc/structure-note-prd.md new file mode 100644 index 000000000..6557dd096 --- /dev/null +++ b/docs/testdoc/structure-note-prd.md @@ -0,0 +1,278 @@ +# Structure Note 产品需求文档(PRD) + +## Title + +Structure Note: 基于 PageIndex 的课件/教材结构化讲义工作区 + +## Summary + +新增一个独立的 `Structure Note` 工作区。用户上传 `PDF` 或 `PPT/PPTX` 后,系统先统一归一化为 PDF,再基于新增的 `PageIndex` 构建页级结构树,按章节与页范围分段生成详细讲义,并通过图片占位、定位、切图和回填补全图文内容,最终输出一份带引用来源的可读 PDF。用户可在生成前选择三档讲解难度:简单、中等(默认)、复杂。 + +## Existing Requirements And Current State + +DeepTutor 当前已具备相邻能力,但缺少本功能所需的页级结构层: + +- 知识库主干已统一到 `llamaindex`,`lightrag` 只是兼容别名 +- 当前文档导入以整文抽取和向量检索为主,没有稳定的页级索引或章节树 +- `Guided Learning` 已有独立工作区、session、分页状态和后台生成机制,可作为工作区组织方式参考 +- `Notebook` 适合保存文本记录,不适合作为 PDF 最终产物主模型 +- 上传校验允许 `ppt/pptx`,但 RAG 文件路由当前并不真正支持它们进入主流程 + +## Problem Statement + +DeepTutor 目前没有一个面向课件和教材的“逐页、详细、可回溯”的结构化讲义产物。 + +这带来两个明显缺口: + +1. 学生无法获得接近逐字稿的图文讲义,用于跟课、补漏和课后复习 +2. 
教师无法将现有 PPT 快速转换为可直接讲授的 Script,仍需自行整理讲稿 + +现有知识库能力偏向检索,不足以支撑页级结构、章节树、图片回填和最终 PDF 产出。 + +## Repo Context + +- 该功能应是独立工作区,而不是 `Knowledge Hub` 的附属按钮,也不是 `Guided Learning` 的变种 +- 该功能不应建立在 LightRAG 上,而应新增 `PageIndex` 结构层 +- 当前 repo 没有现成 `PageIndex` 实现,需要新增核心服务 +- 该功能会跨后端 router、任务流、路径管理、前端工作区和 PDF 导出,更适合进入 core,并以实验性工作区首发 + +## Target Users + +- 学生:跟课、补漏、课后复习 +- 教师:PPT 转 Script,减轻备课负担 +- 研发与测试:验证引用、图片回填和恢复流程 + +## Goals + +- 提供独立的 `Structure Note` 工作区 +- 支持 `PDF + PPT/PPTX` 上传 +- 将 PPT/PPTX 先归一化为 PDF +- 基于 `PageIndex` 生成页级结构树,而非整文向量块 +- 采用章节树加分段生成策略,降低 lost-in-the-middle 风险 +- 支持简单 / 中等 / 复杂三档讲解难度,其中中等为默认 +- 输出最终可读 PDF,并附带引用来源 +- 在后端保留中间状态、图片回填和续跑能力,用于测试和恢复 + +## Non-Goals + +- 不替换现有 `Knowledge Hub` 主流程 +- 不把最终产物首发建模为 Notebook 主记录类型 +- 不在首发覆盖 DOCX、图片 OCR、音频转录等更多素材 +- 不向前端暴露占位符、象限定位、切图调试细节 +- 不要求 CLI / SDK 首发同步支持 + +## Proposed Solution + +新增 `Structure Note` 工作区,采用独立 router、manager、artifact 存储与前端页面。 + +### 主流程 + +1. 用户上传 `PDF` 或 `PPT/PPTX` +2. 若为 PPT/PPTX,先通过转换适配器归一化为 PDF +3. 对 PDF 执行 `PageIndex`,输出逐页文本、页码、标题候选、图像候选区域 +4. 构建多级章节树,优先覆盖二级到五级结构 +5. 以章节树为主线,按约 10 页窗口分段生成讲义;`复杂讲解` 可自动缩小为 5-8 页窗口 +6. 首轮文本生成时插入图片占位符,并记录对应页码范围 +7. 图像流水线识别占位符,执行“页定位 -> 象限定位 -> 切图 -> 回填” +8. 将最终内容渲染为 PDF,并生成 `citation_manifest.json` +9. 
前端展示最终 PDF、下载入口和引用来源列表 + +### Difficulty Model + +#### simple + +- 定位:科普型、入门型 +- 目标:讲清关键词、定义、核心知识和结论 +- 风格:少推理、少展开、少旁支 +- 篇幅:最短 + +#### medium + +- 定位:默认档,接近正常课堂讲解密度 +- 目标:概念、重点、基础逻辑链讲清楚 +- 风格:细致但不过度展开 +- 篇幅:中等 + +#### detailed + +- 定位:最完整档 +- 目标:尽量展开所有内容,包括推理、过程、细节和隐含连接 +- 风格:最详细 +- 篇幅:最长 +- 特殊策略:自动缩小页窗口,以换取生成稳定性 + +## Scope In + +- 独立工作区 +- PDF 与 PPT/PPTX 上传 +- PPT/PPTX -> PDF 归一化 +- `PageIndex` 服务层 +- 章节树生成 +- 按页范围分段生成 +- 三档难度控制 +- 图片占位、定位、切图、回填 +- 最终 PDF 导出 +- 引用来源展示 +- 后端中间状态持久化与续跑 + +## Scope Out + +- 与知识库检索结果的双向联动 +- Notebook 一键保存 PDF +- 用户手动编辑章节树 +- 多文档自动合并成一本总讲义 +- CLI / SDK 首发接口 +- 高级版式编辑器 + +## UX Or Interaction Notes + +- 工作区形态采用“上传 -> 配置 -> 处理中 -> 查看结果” +- 上传页提供: + - 文件选择 + - 难度选择器:简单 / 中等(默认) / 复杂 +- 结果页仅展示: + - 最终 PDF 预览或下载 + - 本次难度档位 + - 引用来源列表 + - 失败后的重试入口 +- 不向用户展示内部中间态和 agent 细节 + +## Technical Considerations + +- `PageIndex` 是新增结构服务,不是新的 RAG provider +- 用户可见主产物是 PDF;后端内部仍保留中间 JSON / Markdown / render state +- 内部 artifact 至少包含: + - `source_file` + - `normalized_pdf_path` + - `difficulty_level` + - `page_index` + - `section_tree` + - `generation_chunks` + - `image_fill_state` + - `final_pdf_path` + - `citation_manifest` +- 引用来源至少应包含: + - 章节路径 + - 页码范围 + - 原始 PDF 页 + - 图像来源页 +- `detailed` 模式应允许更长耗时和更小页窗口,以换取稳定性 + +## Impacted Areas Of The Repo + +- 新增 backend router:`deeptutor/api/routers/structure_note.py` +- 新增服务目录:`deeptutor/services/structure_note/` +- 扩展路径管理:`deeptutor/services/path_service.py` +- 复用任务流与日志广播模式:`deeptutor/api/routers/knowledge.py` +- 新增前端页面:`web/app/(workspace)/structure-note/page.tsx` +- 更新工作区导航与文档 + +## Acceptance Criteria + +- 用户可在独立工作区上传 PDF 并生成最终 PDF 讲义 +- 用户可上传 PPT/PPTX,系统会先转换为 PDF 再进入同一流程 +- 系统基于页级结构和章节树分段生成,而不是整文一次性生成 +- 用户可选择三档难度;未选择时默认为中等 +- 三档难度的结果在覆盖密度和篇幅上有明显差异 +- 最终结果可回溯到页码范围,并在前端展示引用来源 +- 图片可通过占位符 -> 定位 -> 切图 -> 回填进入最终结果 +- 生成中断后可在后端基于中间状态续跑 +- 不影响现有 `Knowledge Hub`、`Notebook`、`Guided Learning` + +## Success Metrics + +- 任务成功率 +- 平均生成时长 +- 页码引用正确率 +- 图片回填成功率 +- 三档难度的用户使用分布 +- 学生复习场景下的二次打开率 +- 教师上传后导出率 + +## 
Rollout And Compatibility + +- 以独立工作区、实验性功能首发 +- 完全 opt-in,不替换现有知识库主行为 +- 中间状态保留策略做成可配置项,测试环境默认开启,生产环境可裁剪 +- 若 PPT 转 PDF 或 `PageIndex` 失败,应给出明确错误并允许重试 + +## Risks And Mitigations + +### PageIndex 质量不稳定 + +- 风险:树生成失败或页级抽取噪声过大 +- 缓解:树失败时回退为按页段生成,保证主流程可用 + +### PPT 转 PDF 兼容性不足 + +- 风险:不同模板、字体或复杂动画导致转换异常 +- 缓解:转换器做成可替换 adapter;首发默认使用 LibreOffice + +### simple 过度压缩 + +- 风险:为追求短篇幅丢失关键上下文 +- 缓解:强制保留关键词、定义、结论和最小解释链 + +### detailed 成本和耗时过高 + +- 风险:长文档生成时间和成本显著上升 +- 缓解:缩小页窗口并启用缓存和续跑 + +### 图片定位不准 + +- 风险:四象限粗定位与真实图像区域偏差较大 +- 缓解:定位失败时允许整页截图回退 + +## Maintainer Fit + +该功能适合进入 core,但建议以实验性工作区首发。它直接服务于 DeepTutor 的“材料 -> 学习产物”主线,需要复用上传、任务流、前端工作区和路径管理;若做成外置 plugin,会让产品入口、状态管理和文件处理都变得割裂。 + +## Alternatives Considered + +- 挂在 `Knowledge Hub` 下:不选,因为它不是普通 KB 初始化副产物 +- 复用 `Guided Learning`:不选,因为其主产物是交互页面,不是最终 PDF 讲义 +- 只保存最终 PDF,不保留中间状态:不选,因为测试、恢复和图片回填都会变差 +- 基于 LightRAG 扩展:不选,因为当前主干不走这条路径,且需求核心是页级结构 + +## Docs And Test Impact + +- README 增加 `Structure Note` 工作区说明 +- docs 增加支持格式、难度档位、生成流程、引用来源说明 +- 后端测试覆盖: + - PPT/PPTX 归一化 + - `PageIndex` + - 章节树生成 + - 难度分层 + - 引用页码 + - 图片回填 + - 续跑恢复 +- 前端测试覆盖: + - 上传与难度选择 + - 处理中状态 + - 最终 PDF 展示 + - 引用来源展示 + +## Open Questions + +- 最终 PDF 是否需要内嵌引用附录,还是只在前端展示完整 citation +- 生产环境中间状态保留多久 +- 是否允许下载 `PDF + citation manifest` 打包结果 + +## Assumptions + +- 首发是 web-first +- 最终用户产物是 PDF +- 后端保留中间状态仅用于测试、恢复和内部验证 +- `medium` 为默认档位 +- `detailed` 可接受更长生成时延和更高成本 + +## Decision Log + +- 入口:独立工作区 +- 素材:PDF + PPT/PPTX +- 归一化:PPT/PPTX 先转 PDF +- 结构底座:新增 `PageIndex` +- 用户可见产物:最终 PDF +- 前端:只展示结果与引用 +- 后端:保留中间状态、图片回填和续跑 +- 难度:简单 / 中等(默认) / 复杂 diff --git a/docs/testdoc/structure-note-technical-plan.md b/docs/testdoc/structure-note-technical-plan.md new file mode 100644 index 000000000..be0af868d --- /dev/null +++ b/docs/testdoc/structure-note-technical-plan.md @@ -0,0 +1,539 @@ +# Structure Note 详细技术计划 + +## 1. 
背景与决策 + +### 1.1 目标 + +在 DeepTutor 中新增一个独立的 `Structure Note` 工作区,将用户上传的课件或教材转成可阅读、可回溯的结构化 PDF 讲义。 + +### 1.2 已锁定决策 + +- 工作区独立存在,不挂在 `Knowledge Hub` 或 `Guided Learning` 下 +- 首发真实支持 `PDF + PPT/PPTX` +- `PPT/PPTX -> PDF` 由服务端通过 `headless LibreOffice` 实现 +- 结构底座为新增的 `PageIndex`,不接入现有 `llamaindex` provider +- 最终用户产物是 PDF +- 引用只在前端结果页侧栏展示,不强行内嵌到 PDF 中 +- 中间状态保留采用环境可配策略 +- 难度固定为 `simple / medium / detailed`,默认 `medium` + +### 1.3 与现有能力的关系 + +- 复用 `knowledge` 路由中的任务流、SSE 日志和后台任务模式 +- 参考 `guide` 工作区的 session / manager 组织方式 +- 不复用 Notebook 作为主产物容器 +- 不影响现有 RAG 搜索、聊天和 Guided Learning + +## 2. 端到端数据流 + +### 2.1 主流程 + +1. 前端上传文件并提交难度参数 +2. 后端创建 `job_id`,生成 artifact 目录结构 +3. 后端执行素材归一化: + - PDF:直接进入下一阶段 + - PPT/PPTX:使用 `soffice --headless --convert-to pdf` 转为 PDF +4. 后端执行 `PageIndex`: + - 逐页抽文本 + - 渲染页图缩略信息 + - 识别标题候选 + - 记录图像候选区域 +5. 后端构建章节树: + - 规则层抽标题候选 + - LLM 将候选标准化为 2-5 级结构 + - 输出节点与页码范围映射 +6. 后端分段生成正文: + - 按章节树与页范围切块 + - 每块调用 LLM 生成 Markdown 讲义正文 + - 同步输出页码范围与图片占位符 +7. 后端执行图片流水线: + - 识别占位符 + - 生成页号映射 + - 通过定位 Agent 选择象限 + - 通过切图执行器生成图片资源 + - 回填 Markdown / render model +8. 后端渲染最终 PDF 与 `citation_manifest.json` +9. 前端结果页读取任务详情、PDF 地址与 citation 清单 + +### 2.2 阶段与状态 + +统一任务状态: + +- `queued` +- `normalizing` +- `indexing` +- `planning` +- `generating` +- `processing_images` +- `rendering` +- `ready` +- `failed` + +### 2.3 失败与续跑原则 + +- 若素材归一化失败,任务直接失败,不进入后续阶段 +- 若 `PageIndex` 失败,任务失败;后续重试从 `normalize` 后的 PDF 继续 +- 若章节树生成失败,可回退到按页段生成 +- 若图片定位或切图失败,不阻塞整份文档,可对该占位符降级为整页截图或文本标注 +- `retry` 优先复用已存在中间态,而不是重新上传文件 + +## 3. 
后端模块拆分 + +### 3.1 新增目录 + +建议新增: + +- `deeptutor/api/routers/structure_note.py` +- `deeptutor/services/structure_note/` + +### 3.2 服务子模块 + +建议按以下模块拆分: + +#### `models.py` + +定义内部类型: + +- `DifficultyLevel` +- `JobStatus` +- `StructureNoteArtifact` +- `PageIndexPage` +- `SectionTreeNode` +- `GenerationChunk` +- `CitationEntry` +- `ImagePlaceholder` + +#### `storage.py` + +负责: + +- 生成 artifact 目录 +- 读写 `artifact.json` +- 路径组装 +- 环境化保留策略清理 + +#### `normalizer.py` + +负责: + +- 判断输入格式 +- 调用 LibreOffice 完成 PPT/PPTX -> PDF 转换 +- 输出标准 PDF 路径 +- 提供依赖缺失时的明确错误消息 + +#### `page_index.py` + +负责: + +- 使用 PyMuPDF 逐页抽文本 +- 记录页码、页尺寸、文本块信息 +- 渲染页面基础图像信息 +- 提取标题候选与图像候选区域 + +#### `tree_builder.py` + +负责: + +- 规则层标题候选提取 +- 调用 LLM 将候选标准化为 2-5 级章节树 +- 建立 `section -> page range` 映射 +- 失败时回退到按页段生成 + +#### `difficulty.py` + +负责三档难度 preset: + +- 输出长度预算 +- 输出风格约束 +- 页窗口大小 +- 术语解释深度 +- 推理展开深度 + +#### `generator.py` + +负责: + +- 根据树结构切分 generation chunks +- 生成 Markdown 正文 +- 注入页码范围标签 +- 生成图片占位符 + +#### `image_pipeline.py` + +负责: + +- 占位符扫描 +- 页号映射 +- 调用定位 Agent 得到页与象限 +- 将象限转换为 PyMuPDF crop box +- 切图并写入 `images/` +- 回填到 Markdown / render model + +#### `renderer.py` + +负责: + +- Markdown -> HTML +- HTML -> PDF(WeasyPrint) +- citation manifest 输出 + +#### `manager.py` + +负责: + +- 任务编排 +- 状态流转 +- 后台续跑 +- 对 router 提供统一接口 + +### 3.3 PathService 扩展 + +在 `deeptutor/services/path_service.py` 中增加 `structure_note` 工作区路径支持,最终目录落到: + +`data/user/workspace/structure_note//` + +固定目录结构: + +- `source/` +- `normalized/` +- `index/` +- `chunks/` +- `images/` +- `final/` +- `artifact.json` + +## 4. 
API 与类型 + +### 4.1 对外接口 + +#### `POST /api/v1/structure-note/jobs` + +用途:创建任务 +请求:`multipart/form-data` + +- `file`: 上传文件 +- `difficulty_level`: `simple | medium | detailed` + +行为: + +- 验证格式 +- 创建 `job_id` +- 写入源文件 +- 启动后台任务 +- 返回任务基础信息与 task stream 标识 + +#### `GET /api/v1/structure-note/jobs` + +用途:获取工作区历史列表 +返回最少字段: + +- `job_id` +- `file_name` +- `difficulty_level` +- `status` +- `created_at` +- `updated_at` + +#### `GET /api/v1/structure-note/jobs/{job_id}` + +用途:获取任务详情 +返回最少字段: + +- `job_id` +- `status` +- `source_format` +- `difficulty_level` +- `final_pdf_path` +- `citation_manifest_summary` +- `retry_available` + +#### `POST /api/v1/structure-note/jobs/{job_id}/retry` + +用途:失败任务续跑 +行为: + +- 读取 `artifact.json` +- 检查上次成功阶段 +- 从最近可复用阶段继续执行 + +#### `GET /api/v1/structure-note/tasks/{task_id}/stream` + +用途:SSE 任务流 +复用 `knowledge` 的日志和状态推送模式 + +### 4.2 内部 artifact 结构 + +`artifact.json` 至少包含: + +- `job_id` +- `source_format` +- `difficulty_level` +- `source_path` +- `normalized_pdf_path` +- `page_index_path` +- `section_tree_path` +- `generation_chunks_path` +- `citation_manifest_path` +- `final_pdf_path` +- `status` +- `retry_state` +- `created_at` +- `updated_at` + +### 4.3 Citation 类型 + +每条 citation 至少包含: + +- `citation_id` +- `section_path` +- `page_start` +- `page_end` +- `source_file` +- `source_kind` +- `image_page` +- `image_region` + +其中: + +- `source_kind` 仅允许 `text` 或 `image` +- `image_page` / `image_region` 仅在图像引用时填写 + +## 5. 前端工作区设计 + +### 5.1 页面结构 + +新页面建议为: + +`web/app/(workspace)/structure-note/page.tsx` + +### 5.2 三个核心面板 + +#### 上传与配置 + +- 文件选择 +- 难度切换: + - 简单 + - 中等(默认) + - 复杂 +- `detailed` 旁边增加一条轻量提示:生成时间更长 + +#### 处理中 + +- 阶段文本 +- 进度条 +- 错误提示 +- 重试按钮 + +#### 结果页 + +- PDF 预览 +- 下载按钮 +- citation 侧栏 +- 历史任务入口 + +### 5.3 非目标展示 + +前端明确不展示: + +- 章节树调试信息 +- 图片占位符 +- 四象限判断 +- crop box +- 中间 Markdown +- 中间 JSON + +### 5.4 历史列表字段 + +至少显示: + +- 文件名 +- 难度 +- 状态 +- 创建时间 +- 重新打开结果 + +## 6. 
生成与渲染策略 + +### 6.1 难度预设 + +#### simple + +- 目标:关键词、定义、核心知识、结论 +- 风格:科普型 +- 输出:最短 +- 推理:尽量压缩 +- 页窗口:默认 10 页 + +#### medium + +- 目标:正常课堂讲解 +- 风格:重点解释 + 基础逻辑链 +- 输出:中等 +- 推理:保留基础过程 +- 页窗口:默认 10 页 + +#### detailed + +- 目标:覆盖细节、推理、过程与隐含逻辑 +- 风格:最详细 +- 输出:最长 +- 推理:尽量完整 +- 页窗口:自动缩到 5-8 页 + +### 6.2 章节树生成规则 + +- 优先依据字体大小、位置、编号样式和文本模式抽取标题候选 +- 交给 LLM 做结构归一化,但输出必须约束为 2-5 级节点 +- 若 LLM 输出不可用,回退到按页段分组,而不是阻塞整个流程 + +### 6.3 图片流水线 + +#### 第一步:占位符生成 + +正文生成时输出形如: + +`[[IMAGE_PLACEHOLDER:section_id:page_hint:purpose]]` + +#### 第二步:定位 Agent + +Agent 输出固定格式: + +- 第几页 +- 象限:`left_top | right_top | left_bottom | right_bottom` + +#### 第三步:切图执行 + +根据页面宽高将页面切成四象限: + +- 左上 +- 右上 +- 左下 +- 右下 + +切图执行器只做确定性 crop,不自行做语义判断。 + +#### 第四步:回填 + +回填模块将图片资源路径写回 Markdown 或 render model,再进入最终 PDF 渲染。 + +### 6.4 PDF 渲染 + +- 中间产物使用 Markdown 表达 +- 渲染时先转 HTML,再交给 WeasyPrint 输出 PDF +- 引用不嵌入正文,只保留干净版 PDF +- citation manifest 单独生成 JSON,供前端侧栏展示 + +## 7. 存储与中间态策略 + +### 7.1 存储内容 + +在完整保留模式下,应保存: + +- 原始上传文件 +- 归一化 PDF +- 页级索引 JSON +- 章节树 JSON +- generation chunks JSON +- 图片资源 +- 回填后 Markdown +- citation manifest +- 最终 PDF +- `artifact.json` + +### 7.2 环境化保留策略 + +建议新增环境配置项,例如: + +- `STRUCTURE_NOTE_RETENTION_MODE=full|minimal` + +规则: + +- 测试环境默认 `full` +- 生产环境默认 `minimal` + +`minimal` 至少保留: + +- `artifact.json` +- `final.pdf` +- `citation_manifest.json` + +### 7.3 续跑策略 + +`retry_state` 记录最近成功阶段。续跑时遵循: + +- 已完成 `normalize`:不重复转换 +- 已完成 `page_index`:不重复抽页 +- 已完成 `tree_build`:不重复建树 +- 仅后续阶段失败:从失败阶段继续 + +## 8. 
测试矩阵与实施里程碑 + +### 8.1 单元测试 + +- `PageIndex` 逐页文本提取 +- 空页处理 +- 页码顺序稳定 +- 标题候选抽取规则 +- 树标准化结果满足 2-5 级结构约束 +- 难度 preset 对窗口大小和长度预算的影响 +- 象限到 crop box 的换算 +- 保留策略清理逻辑 + +### 8.2 集成测试 + +- PDF 上传全链路成功,生成 PDF 与 citation manifest +- PPT/PPTX 上传真实走 LibreOffice 转 PDF,再进入后续链路 +- `simple / medium / detailed` 三档输出长度和内容密度有明显差异 +- 图片占位符能被回填 +- 图片失败时能降级或重试 +- 任务中断后 `retry` 会复用中间态,而不是从头重跑 + +### 8.3 前端测试 + +- 上传页能提交文件和难度 +- 处理中状态能接收 SSE 进度 +- 结果页能加载 PDF 和 citation 侧栏 +- 失败任务能触发重试 + +### 8.4 验收样本 + +- 学生教材 PDF:中等模式,结果可读、页码回溯清楚 +- 教师 PPT:复杂模式,细节展开明显更多 +- 简单模式:明显短于中等与复杂,不丢失关键词和核心知识 + +### 8.5 实施里程碑 + +#### M1:文档与骨架 + +- 在 `docs/testdoc/` 落 `PRD + 技术计划` +- 建立路由、artifact 模型、目录结构、SSE 任务流 + +#### M2:素材归一化与 PageIndex + +- 接通 PDF 上传 +- 接通 PPT/PPTX -> PDF 转换 +- 产出页级索引与章节树 + +#### M3:内容生成与三档难度 + +- 接通 chunk 生成 +- 接通难度 preset +- 产出 citation manifest + +#### M4:图片流水线与 PDF 渲染 + +- 接通占位符识别、象限定位、切图回填 +- 接通 Markdown -> HTML -> PDF + +#### M5:前端结果工作区与完整测试 + +- 上传 / 进度 / 结果 / 重试闭环 +- 完成集成测试与验收样本 + +## 9. 实施默认值 + +- 文档落盘格式使用中文 Markdown,不额外导出 PDF 版 PRD / 技术计划 +- `docs/testdoc` 仅作归档,不在文档 sidebar 中额外挂载 +- LibreOffice 是首发必需依赖;环境缺失时,PPT/PPTX 上传失败并返回安装指引 +- 最终 PDF 不内嵌完整引用;完整引用只在前端侧栏和 `citation_manifest.json` 中展示 +- 中间态保留走环境配置:测试环境保留完整中间态,生产环境默认保留 `artifact.json + final.pdf + citation_manifest.json` diff --git a/docs/zh/features/overview.md b/docs/zh/features/overview.md new file mode 100644 index 000000000..dc9d85265 --- /dev/null +++ b/docs/zh/features/overview.md @@ -0,0 +1,57 @@ +# 功能介绍 + +DeepTutor 提供六个专业模块,助力 AI 驱动的学习体验。 + +
+ +## 核心模块 + +| 模块 | 描述 | 文档 | +|:-------|:------------|:--------------| +| 🧠 **智能解题** | 多 Agent 协作解题,双循环推理架构 | [详情 →](https://github.com/HKUDS/DeepTutor#-smart-solver) | +| 🎯 **题目生成** | 自定义测验生成,模拟真实考试风格 | [详情 →](https://github.com/HKUDS/DeepTutor#-question-generator) | +| 🎓 **引导学习** | 个性化学习路径,交互式可视化 | [详情 →](https://github.com/HKUDS/DeepTutor#-guided-learning) | +| 🔬 **深度研究** | 系统化主题探索,动态主题队列 | [详情 →](https://github.com/HKUDS/DeepTutor#-deep-research) | +| 💡 **想法生成** | 自动化研究想法生成,多阶段过滤 | [详情 →](https://github.com/HKUDS/DeepTutor#-automated-ideagen) | +| ✏️ **协作写作** | AI 辅助写作,TTS 语音朗读 | [详情 →](https://github.com/HKUDS/DeepTutor#-interactive-ideagen-co-writer) | + +## 系统架构 + +DeepTutor 架构 + +### 系统层次 + +- **用户界面** — 双向查询响应,结构化输出 +- **Agent 模块** — 各学习任务的专业 AI Agent +- **工具集成** — RAG、网络搜索、论文检索、代码执行 +- **知识基础** — 知识图谱 + 向量存储 + 记忆系统 + +
+ +## 支持的服务商 + +DeepTutor 支持多种 LLM 和 Embedding 服务商: + +::: details LLM 服务商 +- OpenAI (GPT-4o, GPT-4) +- Anthropic (Claude 3.5) +- Azure OpenAI +- DeepSeek +- Groq +- OpenRouter +- Ollama(本地部署) +- Google Gemini +::: + +::: details Embedding 服务商 +- OpenAI +- Jina AI +- Cohere +- Ollama +- LM Studio +- HuggingFace +::: + +--- + +📖 **完整文档**: [GitHub README](https://github.com/HKUDS/DeepTutor) diff --git a/docs/zh/guide/data-preparation.md b/docs/zh/guide/data-preparation.md new file mode 100644 index 000000000..e148c40b1 --- /dev/null +++ b/docs/zh/guide/data-preparation.md @@ -0,0 +1,185 @@ +# 数据准备 + +DeepTutor 提供示例知识库和样例问题,帮助您快速上手。 + +## 示例知识库 + +我们在 [Google Drive](https://drive.google.com/drive/folders/1iWwfZXiTuQKQqUYb5fGDZjLCeTUP6DA6?usp=sharing) 上提供两个预构建的知识库: + +### 1. 研究论文合集 + +
+📄 **5 篇研究论文(每篇 20-50 页)**
+
+来自我们实验室的前沿研究论文精选集,涵盖 RAG 和 Agent 领域。
+
+包含论文:
+
+**适用场景:** 研究场景,广泛知识覆盖
+
+ +### 2. 数据科学教材 + +
+📚 **8 章,296 页**
+
+来自加州大学伯克利分校的综合深度学习教材。
+
+**来源:** Deep Representation Learning Book
+
+涵盖主题:
+
+- 神经网络基础
+- 表示学习
+- 深度学习架构
+- 高级主题
+
+**适用场景:** 学习场景,深度知识挖掘
+
+ +## 下载与设置 + +### 步骤 1:下载 + +访问我们的 [Google Drive 文件夹](https://drive.google.com/drive/folders/1iWwfZXiTuQKQqUYb5fGDZjLCeTUP6DA6?usp=sharing) 并下载: + +- `knowledge_bases.zip` - 包含嵌入的预构建知识库 +- `questions.zip` - 样例问题和使用示例(可选) + +### 步骤 2:解压 + +将下载的文件解压到 `data/` 目录: + +``` +DeepTutor/ +├── data/ +│ └── knowledge_bases/ +│ ├── research_papers/ # 研究论文知识库 +│ ├── data_science_book/ # 教材知识库 +│ └── kb_config.json # 知识库配置 +└── user/ # 用户数据(自动创建) +``` + +### 步骤 3:验证 + +解压后,启动 DeepTutor 时您的知识库将自动可用。 + +::: warning 嵌入兼容性 +我们的示例知识库使用 `text-embedding-3-large`,`dimensions = 3072`。 + +如果您的嵌入模型具有不同的维度,您需要创建自己的知识库。 +::: + +## 创建自定义知识库 + +### 支持的文件格式 + +| 格式 | 扩展名 | 说明 | +|:-------|:----------|:------| +| PDF | `.pdf` | 支持文本提取和版面分析 | +| 文本 | `.txt` | 纯文本文件 | +| Markdown | `.md` | 支持格式化的 Markdown | + +### 通过 Web 界面 + +1. 导航到 `http://localhost:3782/knowledge` +2. 点击 **"New Knowledge Base"** +3. 为您的知识库输入唯一名称 +4. 上传您的文档(单个或批量上传) +5. 等待处理完成 + +::: tip 处理时间 +- 小文档(< 10 页):约 1 分钟 +- 中等文档(10-100 页):约 5-10 分钟 +- 大文档(100+ 页):可能需要更长时间 +::: + +### 通过命令行 + +```bash +# 使用文档初始化新知识库 +python -m src.knowledge.start_kb init --docs + +# 向现有知识库添加文档 +python -m src.knowledge.add_documents --docs +``` + +## 数据存储结构 + +所有用户数据存储在 `data/` 目录中: + +``` +data/ +├── knowledge_bases/ # 知识库存储 +│ ├── / +│ │ ├── documents/ # 原始文档 +│ │ ├── chunks/ # 分块内容 +│ │ ├── embeddings/ # 向量嵌入 +│ │ └── graph/ # 知识图谱数据 +└── user/ # 用户活动数据 + ├── solve/ # 解题结果 + ├── question/ # 生成的题目 + ├── research/ # 研究报告 + ├── notebook/ # 笔记本记录 + └── logs/ # 系统日志 +``` + +--- + +**下一步:** [本地安装 →](/zh/guide/local-start) + + diff --git a/docs/zh/guide/local-conda-cursor.md b/docs/zh/guide/local-conda-cursor.md new file mode 100644 index 000000000..4ff9e5a2f --- /dev/null +++ b/docs/zh/guide/local-conda-cursor.md @@ -0,0 +1,56 @@ +# 本地 Conda 环境(可选) + +仅当你在本机使用 **Cursor/VSCode** 且希望用**专用 conda 环境**时参考,无需所有人统一这样做。 + +## 1. 
让终端识别 conda + +若在 Cursor 终端里出现 `command not found: conda`,多半是集成终端未加载 conda。任选其一: + +**方式 A:当前终端临时启用** + +```bash +source scripts/activate_conda.sh +``` + +**方式 B:长期生效** + +在 `~/.zshrc` 中保留 conda 初始化块(安装 Miniconda/Anaconda 时通常已添加),然后新开终端即可。 + +## 2. 创建项目专用环境 + +```bash +# 先让 conda 可用(若尚未可用) +source scripts/activate_conda.sh + +# 一键创建环境并安装依赖(Python 3.12 + Node 20 + 前端) +bash scripts/setup_conda_env.sh +``` + +环境名为 `deeptutor`。 + +## 3. 在 Cursor 里使用该环境 + +- 已通过 **`.vscode/settings.json`** 指定解释器为: + `~/miniconda3/envs/deeptutor/bin/python` +- 若你用的是 **Anaconda**,请把该文件中的 `miniconda3` 改为 `anaconda3`。 +- 打开 Python 文件时,Cursor 会使用上述解释器;终端里可执行: + + ```bash + conda activate deeptutor + python scripts/start_web.py + ``` + +或直接: + +```bash +bash scripts/run_with_conda.sh +``` + +## 4. 小结 + +| 目的 | 操作 | +|----------------|------| +| 终端里能用 conda | `source scripts/activate_conda.sh` 或配置好 `~/.zshrc` | +| 创建/重建环境 | `bash scripts/setup_conda_env.sh` | +| 用指定环境启动 | `bash scripts/run_with_conda.sh` 或 `conda activate deeptutor && python scripts/start_web.py` | +| 编辑器用该环境 | 已由 `.vscode/settings.json` 指定,无需额外操作 | diff --git a/docs/zh/guide/local-start.md b/docs/zh/guide/local-start.md new file mode 100644 index 000000000..64dee562d --- /dev/null +++ b/docs/zh/guide/local-start.md @@ -0,0 +1,190 @@ +# 本地安装 + +本指南介绍用于开发或非 Docker 环境的手动安装。 + +## 前提条件 + +- **Python 3.10+** — [下载](https://www.python.org/downloads/) +- **Node.js 18+** — [下载](https://nodejs.org/) +- **Git** — [下载](https://git-scm.com/) + +::: tip Windows 用户 +如果在安装过程中遇到路径长度错误,请启用长路径支持: + +```cmd +reg add "HKLM\SYSTEM\CurrentControlSet\Control\FileSystem" /v LongPathsEnabled /t REG_DWORD /d 1 /f +``` + +运行此命令后重启终端。 +::: + +## 步骤 1:设置虚拟环境 + +选择以下选项之一: + +::: code-group + +```bash [Conda(推荐)] +# 创建环境 +conda create -n deeptutor python=3.10 + +# 激活环境 +conda activate deeptutor +``` + +```bash [venv] +# 创建环境 +python -m venv venv + +# 激活 (Windows) +venv\Scripts\activate + +# 激活 (macOS/Linux) +source venv/bin/activate +``` + +::: + +## 步骤 
2:安装依赖 + +### 选项 A:自动安装(推荐) + +```bash +# 使用 Python 脚本 +python scripts/install_all.py + +# 或使用 shell 脚本 (macOS/Linux) +bash scripts/install_all.sh +``` + +### 选项 B:手动安装 + +```bash +# 安装 Python 依赖 +pip install -r requirements.txt + +# 安装 Node.js 依赖 +npm install --prefix web +``` + +::: warning 常见问题 +如果看到 `npm: command not found`: + +```bash +# 使用 Conda +conda install -c conda-forge nodejs + +# 或从 https://nodejs.org/ 安装 +``` +::: + +## 步骤 3:配置环境 + +确保您已完成[预配置](/zh/guide/pre-config)步骤: + +1. ✅ 创建了包含 API 密钥的 `.env` 文件 +2. ✅ (可选)自定义了 `config/agents.yaml` +3. ✅ (可选)下载了示例知识库 + +## 步骤 4:启动应用 + +### 启动 Web 界面(推荐) + +```bash +python scripts/start_web.py +``` + +这将同时启动 **前端**(Next.js)和 **后端**(FastAPI)服务器。 + +### 替代方案:仅 CLI 界面 + +```bash +python scripts/start.py +``` + +### 访问地址 + +| 服务 | URL | 说明 | +|:---:|:---|:---| +| **前端** | http://localhost:3782 | 主 Web 界面 | +| **API 文档** | http://localhost:8001/docs | 交互式 API 文档 | + +## 高级:分别启动服务 + +对于开发,您可能想要分别运行前端和后端: + +### 后端(FastAPI) + +```bash +python src/api/run_server.py + +# 或直接使用 uvicorn +uvicorn src.api.main:app --host 0.0.0.0 --port 8001 --reload +``` + +### 前端(Next.js) + +首先,创建 `web/.env.local`: + +```bash +NEXT_PUBLIC_API_BASE=http://localhost:8001 +``` + +然后启动开发服务器: + +```bash +cd web +npm install +npm run dev -- -p 3782 +``` + +## 停止服务 + +在终端中按 `Ctrl+C` 停止服务。 + +::: warning 端口仍在使用? +如果按 Ctrl+C 后看到"端口已在使用": + +**macOS/Linux:** +```bash +lsof -i :8001 +kill -9 <PID> +``` + +**Windows:** +```bash +netstat -ano | findstr :8001 +taskkill /PID <PID> /F +``` +::: + +## 故障排除 + +### 后端启动失败 + +**检查清单:** +- 确认 Python 版本 >= 3.10:`python --version` +- 确认所有依赖已安装:`pip install -r requirements.txt` +- 检查端口 8001 是否被占用 +- 验证 `.env` 文件配置 + +### 前端无法连接后端 + +**解决方案:** +1. 确认后端正在运行:访问 http://localhost:8001/docs +2. 检查浏览器控制台的错误信息 +3. 
创建 `web/.env.local`: + ```bash + NEXT_PUBLIC_API_BASE=http://localhost:8001 + ``` + +### WebSocket 连接失败 + +**检查清单:** +- 确认后端正在运行 +- 检查防火墙设置 +- 验证 WebSocket URL 格式:`ws://localhost:8001/api/v1/...` + +--- + +**下一步:** [Docker 部署 →](/zh/guide/docker-start) diff --git a/docs/zh/guide/pre-config.md b/docs/zh/guide/pre-config.md new file mode 100644 index 000000000..5708c2b8f --- /dev/null +++ b/docs/zh/guide/pre-config.md @@ -0,0 +1,201 @@ +# 预配置 + +在启动 DeepTutor 之前,您需要完成以下设置步骤。 + +## 1. 克隆仓库 + +```bash +git clone https://github.com/HKUDS/DeepTutor.git +cd DeepTutor +``` + +## 2. 环境变量配置 + +从模板创建 `.env` 文件: + +```bash +cp .env.example .env +``` + +然后编辑 `.env` 文件,填入您的 API 密钥: + +```bash +# ============================================================================ +# 服务器配置 +# ============================================================================ +BACKEND_PORT=8001 # 后端 API 端口 +FRONTEND_PORT=3782 # 前端 Web 端口 + +# 远程/局域网访问 - 设置为您服务器的 IP 地址 +# NEXT_PUBLIC_API_BASE=http://192.168.1.100:8001 + +# ============================================================================ +# LLM (大语言模型) 配置 - 必填 +# ============================================================================ +LLM_BINDING=openai # 提供商: openai, anthropic, azure_openai, ollama 等 +LLM_MODEL=gpt-4o # 模型名: gpt-4o, deepseek-chat, claude-3-5-sonnet 等 +LLM_HOST=https://api.openai.com/v1 # API 端点 URL +LLM_API_KEY=your_api_key # 您的 LLM API 密钥 + +# ============================================================================ +# 嵌入模型配置 - 知识库必填 +# ============================================================================ +EMBEDDING_BINDING=openai # 提供商类型 +EMBEDDING_MODEL=text-embedding-3-large # 嵌入模型名称 +EMBEDDING_DIMENSION=3072 # 必须与模型维度匹配 +EMBEDDING_HOST=https://api.openai.com/v1 # API 端点 +EMBEDDING_API_KEY=your_api_key # 嵌入 API 密钥 + +# ============================================================================ +# 网络搜索配置 - 可选 +# ============================================================================ 
+SEARCH_PROVIDER=perplexity # 选项: perplexity, tavily, serper, jina, exa, baidu +SEARCH_API_KEY=your_search_api_key # 搜索提供商的 API 密钥 +``` + +### 环境变量参考 + +| 变量 | 必填 | 说明 | +|:---|:---:|:---| +| `LLM_MODEL` | **是** | 模型名称 (如 `gpt-4o`, `deepseek-chat`) | +| `LLM_API_KEY` | **是** | 您的 LLM API 密钥 | +| `LLM_HOST` | **是** | API 端点 URL | +| `EMBEDDING_MODEL` | **是** | 嵌入模型名称 | +| `EMBEDDING_DIMENSION` | **是** | 必须与模型输出维度匹配 | +| `EMBEDDING_API_KEY` | **是** | 嵌入 API 密钥 | +| `EMBEDDING_HOST` | **是** | 嵌入 API 端点 | +| `BACKEND_PORT` | 否 | 后端端口 (默认: `8001`) | +| `FRONTEND_PORT` | 否 | 前端端口 (默认: `3782`) | +| `NEXT_PUBLIC_API_BASE` | 否 | 设置用于远程/局域网访问 | +| `SEARCH_PROVIDER` | 否 | 网络搜索提供商 | +| `SEARCH_API_KEY` | 否 | 搜索 API 密钥 | + +### 支持的 LLM 提供商 + +| 提供商 | `LLM_BINDING` 值 | 说明 | +|:---------|:--------------------|:------| +| OpenAI | `openai` | GPT-4o, GPT-4, GPT-3.5 | +| Anthropic | `anthropic` | Claude 3.5, Claude 3 | +| Azure OpenAI | `azure_openai` | 企业部署 | +| Ollama | `ollama` | 本地模型 | +| DeepSeek | `deepseek` | DeepSeek-V3, DeepSeek-R1 | +| Groq | `groq` | 快速推理 | +| OpenRouter | `openrouter` | 多模型网关 | +| Google Gemini | `gemini` | OpenAI 兼容模式 | + +### 支持的嵌入提供商 + +| 提供商 | `EMBEDDING_BINDING` 值 | 说明 | +|:---------|:--------------------------|:------| +| OpenAI | `openai` | text-embedding-3-large/small | +| Azure OpenAI | `azure_openai` | 企业部署 | +| Jina AI | `jina` | jina-embeddings-v3 | +| Cohere | `cohere` | embed-v3 系列 | +| Ollama | `ollama` | 本地嵌入模型 | +| LM Studio | `lm_studio` | 本地推理服务器 | +| HuggingFace | `huggingface` | OpenAI 兼容端点 | + +## 3. 
配置文件 + +DeepTutor 使用两个 YAML 配置文件进行自定义: + +### `config/agents.yaml` - Agent 参数 + +此文件控制每个模块的 LLM 参数: + +```yaml +# 解题模块 - 问题求解 agents +solve: + temperature: 0.3 + max_tokens: 8192 + +# 研究模块 - 深度研究 agents +research: + temperature: 0.5 + max_tokens: 12000 + +# 题目模块 - 题目生成 agents +question: + temperature: 0.7 + max_tokens: 4096 + +# 引导模块 - 学习引导 agents +guide: + temperature: 0.5 + max_tokens: 16192 + +# 灵感生成模块 - 想法生成 agents +ideagen: + temperature: 0.7 + max_tokens: 4096 + +# 协作写作模块 - 协作写作 agents +co_writer: + temperature: 0.7 + max_tokens: 4096 +``` + +### `config/main.yaml` - 系统设置 + +此文件控制路径、工具和模块特定设置: + +```yaml +# 系统语言 +system: + language: en + +# 数据路径 +paths: + user_data_dir: ./data/user + knowledge_bases_dir: ./data/knowledge_bases + +# 工具配置 +tools: + rag_tool: + kb_base_dir: ./data/knowledge_bases + default_kb: ai_textbook + run_code: + workspace: ./data/user/run_code_workspace + web_search: + enabled: true + query_item: + enabled: true + max_results: 5 + +# 模块特定设置 +research: + researching: + execution_mode: series # "series" 或 "parallel" + max_iterations: 5 + enable_rag_hybrid: true + enable_paper_search: true + enable_web_search: true +``` + +> **提示:** 对于大多数用户,默认配置已经足够好用。只有在需要特定自定义时才修改这些文件。 + +## 4. 知识库准备(可选) + +您可以使用我们预构建的示例知识库来快速开始。 + +### 下载示例知识库 + +从 [Google Drive](https://drive.google.com/drive/folders/1iWwfZXiTuQKQqUYb5fGDZjLCeTUP6DA6?usp=sharing) 下载并解压到 `data/` 目录。 + +::: info 重要提示 +示例知识库使用 `text-embedding-3-large`,`dimensions = 3072`。请确保您的嵌入模型具有匹配的维度。 +::: + +### 创建您自己的知识库 + +启动 DeepTutor 后: + +1. 导航到 `http://localhost:3782/knowledge` +2. 点击 **"New Knowledge Base"** +3. 输入唯一的名称 +4. 上传 PDF/TXT/MD 文件 +5. 
在终端中监控进度 + +--- + +**下一步:** [数据准备 →](/zh/guide/data-preparation) diff --git a/docs/zh/guide/troubleshooting.md b/docs/zh/guide/troubleshooting.md new file mode 100644 index 000000000..4bccdce0d --- /dev/null +++ b/docs/zh/guide/troubleshooting.md @@ -0,0 +1,48 @@ +# 常见问题 + +快速解决常见问题。 + +## 启动问题 + +| 问题 | 解决方案 | +|:--------|:---------| +| 后端启动失败 | 检查 Python ≥ 3.10,验证 `.env` 配置 | +| `npm: command not found` | 安装 Node.js: `conda install -c conda-forge nodejs` | +| 端口已被占用 | 终止进程:`lsof -i :8001` → `kill -9 <PID>` | + +## 连接问题 + +| 问题 | 解决方案 | +|:--------|:---------| +| 前端无法连接后端 | 确认后端运行在 http://localhost:8001 | +| WebSocket 连接失败 | 检查防火墙,确认 `ws://localhost:8001/api/v1/...` 格式 | +| 远程访问失败 | 在 `.env` 中设置 `NEXT_PUBLIC_API_BASE=http://your-ip:8001` | + +## Docker 问题 + +| 问题 | 解决方案 | +|:--------|:---------| +| 云端前端无法连接 | 设置 `NEXT_PUBLIC_API_BASE_EXTERNAL=https://your-server:8001` | +| 架构不匹配 | 使用 `uname -m` 检查:AMD64 用 `:latest`,ARM 用 `:latest-arm64` | + +## 知识库问题 + +| 问题 | 解决方案 | +|:--------|:---------| +| 处理卡住 | 检查终端日志,验证 API 密钥 | +| `uvloop.Loop` 错误 | 运行:`./scripts/extract_numbered_items.sh <file>` | + +## 终止后台进程 + +```bash +# macOS/Linux +lsof -i :8001 && kill -9 <PID> + +# Windows +netstat -ano | findstr :8001 +taskkill /PID <PID> /F +``` + +--- + +📖 **完整 FAQ**: [GitHub README](https://github.com/HKUDS/DeepTutor#-faq) diff --git a/docs/zh/index.md b/docs/zh/index.md new file mode 100644 index 000000000..5cf53712c --- /dev/null +++ b/docs/zh/index.md @@ -0,0 +1,77 @@ +--- +layout: home + +hero: + name: "DeepTutor" + text: "你的 AI 学习伙伴" + tagline: 将任何文档转化为多智能体驱动的互动学习体验 + image: + src: /logo.png + alt: DeepTutor + actions: + - theme: brand + text: 快速开始 → + link: /zh/guide/pre-config + - theme: alt + text: GitHub + link: https://github.com/HKUDS/DeepTutor + +features: + - icon: 📚 + title: 海量文档问答 + details: 上传教材、论文和手册,构建基于 RAG 和知识图谱的 AI 知识库。 + - icon: 🧠 + title: 智能解题 + details: 双循环推理架构配合多智能体协作,提供带有精准文档引用的逐步解答。 + - icon: 🎯 + title: 题目生成 + details: 基于知识库生成自定义测验,或模拟真实考试风格进行练习。 + - icon: 🎓 + title: 引导学习 + details: 
个性化学习路径,配合交互式可视化和自适应讲解。 + - icon: 🔬 + title: 深度研究 + details: 系统化主题探索,整合网络搜索、论文检索和文献综合。 + - icon: 💡 + title: 灵感生成 + details: AI 辅助头脑风暴,知识提取与多阶段筛选。 +--- + +## 为什么选择 DeepTutor? + +- **深度理解** — 不只是答案,而是带有可视化讲解的引导式学习之旅 +- **多模态支持** — PDF、LaTeX、图片、代码执行等全面支持 +- **知识图谱** — 基于 LightRAG 的语义连接,实现更好的理解 +- **一站式平台** — 解题、题目生成、研究、灵感生成集于一体 + + diff --git a/pyproject.toml b/pyproject.toml index 1b608155e..9080f5289 100644 --- a/pyproject.toml +++ b/pyproject.toml @@ -16,6 +16,7 @@ dependencies = [ "python-dotenv>=1.0.0", "PyYAML>=6.0", "jinja2>=3.1.0", + "Markdown>=3.6", "openai>=1.30.0", "tiktoken>=0.5.0", "aiohttp>=3.9.4", @@ -45,6 +46,7 @@ server = [ "uvicorn[standard]>=0.24.0", "websockets>=12.0", "python-multipart>=0.0.6", + "WeasyPrint>=62.0", ] math-animator = ["manim>=0.19.0"] all = [ @@ -56,6 +58,7 @@ all = [ "uvicorn[standard]>=0.24.0", "websockets>=12.0", "python-multipart>=0.0.6", + "WeasyPrint>=62.0", "manim>=0.19.0", ] diff --git a/requirements/cli.txt b/requirements/cli.txt index dd0b84489..204c0696d 100644 --- a/requirements/cli.txt +++ b/requirements/cli.txt @@ -8,6 +8,7 @@ python-dotenv>=1.0.0 PyYAML>=6.0 jinja2>=3.1.0 +Markdown>=3.6 # --- LLM --- openai>=1.30.0 diff --git a/requirements/server.txt b/requirements/server.txt index 6c7350fb1..e11cfe658 100644 --- a/requirements/server.txt +++ b/requirements/server.txt @@ -11,3 +11,4 @@ fastapi>=0.100.0 uvicorn[standard]>=0.24.0 websockets>=12.0 python-multipart>=0.0.6 +WeasyPrint>=62.0 diff --git a/tests/api/test_structure_note_router.py b/tests/api/test_structure_note_router.py new file mode 100644 index 000000000..300582367 --- /dev/null +++ b/tests/api/test_structure_note_router.py @@ -0,0 +1,325 @@ +from __future__ import annotations + +import json +from pathlib import Path + +import pytest + +try: + from fastapi import FastAPI + from fastapi.testclient import TestClient +except Exception: # pragma: no cover + FastAPI = None + TestClient = None + +pytestmark = pytest.mark.skipif( + FastAPI is None or TestClient 
is None, reason="fastapi not installed" +) + +if FastAPI is not None and TestClient is not None: + from deeptutor.api.routers import structure_note as structure_note_router_module + from deeptutor.services.structure_note import ( + DifficultyLevel, + ExplanationStyleLevel, + JobStatus, + NoteLanguage, + StructureNoteManager, + StructureNoteStorage, + ) + + router = structure_note_router_module.router +else: # pragma: no cover + structure_note_router_module = None + router = None + + +def _build_app() -> FastAPI: + if FastAPI is None or router is None: # pragma: no cover + raise RuntimeError("fastapi is not installed") + app = FastAPI() + app.include_router(router, prefix="/api/v1/structure-note") + return app + + +def _write_kb_raw_file( + tmp_path: Path, + kb_name: str, + file_name: str, + content: bytes = b"%PDF-1.4\n%%EOF", +) -> Path: + kb_base = tmp_path / "data" / "knowledge_bases" + raw_dir = kb_base / kb_name / "raw" + raw_dir.mkdir(parents=True, exist_ok=True) + (kb_base / kb_name / "llamaindex_storage").mkdir(parents=True, exist_ok=True) + config_path = kb_base / "kb_config.json" + config = ( + json.loads(config_path.read_text(encoding="utf-8")) + if config_path.exists() + else {"knowledge_bases": {}} + ) + config.setdefault("knowledge_bases", {})[kb_name] = { + "path": kb_name, + "status": "ready", + "rag_provider": "llamaindex", + } + config_path.write_text(json.dumps(config), encoding="utf-8") + source_path = raw_dir / file_name + source_path.write_bytes(content) + return source_path + + +@pytest.fixture +def manager(tmp_path: Path): + storage = StructureNoteStorage() + original_root = storage.path_service._project_root + original_user_dir = storage.path_service._user_data_dir + try: + storage.path_service._project_root = tmp_path + storage.path_service._user_data_dir = tmp_path / "data" / "user" + storage.path_service.ensure_all_directories() + yield StructureNoteManager(storage=storage) + finally: + storage.path_service._project_root = original_root 
+ storage.path_service._user_data_dir = original_user_dir + + +def test_create_job_returns_contract(monkeypatch, manager) -> None: + monkeypatch.setattr(structure_note_router_module, "_structure_note_manager", manager) + + async def _noop_run(*_args, **_kwargs): + return None + + monkeypatch.setattr(structure_note_router_module, "_run_structure_note_job", _noop_run) + + with TestClient(_build_app()) as client: + response = client.post( + "/api/v1/structure-note/jobs", + data={ + "difficulty_level": DifficultyLevel.MEDIUM.value, + "note_language": NoteLanguage.EN.value, + "style_level": ExplanationStyleLevel.HIGH.value, + "project_name": "Course A", + }, + files={ + "file": ( + "chapter.pdf", + b"%PDF-1.4\n1 0 obj\n<<>>\nendobj\ntrailer\n<<>>\n%%EOF", + "application/pdf", + ) + }, + ) + + assert response.status_code == 200 + body = response.json() + assert body["file_name"] == "chapter.pdf" + assert body["difficulty_level"] == "medium" + assert body["note_language"] == "en" + assert body["style_level"] == "high" + assert body["project_name"] == "Course A" + assert body["note_title"] == "chapter" + assert body["source_kind"] == "upload" + assert body["status"] == "queued" + assert isinstance(body["task_id"], str) and body["task_id"] + + +def test_create_and_rename_project_updates_jobs(monkeypatch, manager) -> None: + monkeypatch.setattr(structure_note_router_module, "_structure_note_manager", manager) + + async def _noop_run(*_args, **_kwargs): + return None + + monkeypatch.setattr(structure_note_router_module, "_run_structure_note_job", _noop_run) + + with TestClient(_build_app()) as client: + create_project_response = client.post( + "/api/v1/structure-note/projects", + data={"name": "Course A"}, + ) + create_job_response = client.post( + "/api/v1/structure-note/jobs", + data={ + "difficulty_level": DifficultyLevel.MEDIUM.value, + "note_language": NoteLanguage.EN.value, + "style_level": ExplanationStyleLevel.MEDIUM.value, + "project_name": "Course A", + }, + files={ 
+ "file": ( + "chapter.pdf", + b"%PDF-1.4\n1 0 obj\n<<>>\nendobj\ntrailer\n<<>>\n%%EOF", + "application/pdf", + ) + }, + ) + rename_response = client.post( + "/api/v1/structure-note/projects/Course%20A/rename", + data={"new_name": "Course B"}, + ) + list_response = client.get("/api/v1/structure-note/projects") + detail_response = client.get( + f"/api/v1/structure-note/jobs/{create_job_response.json()['job_id']}" + ) + + assert create_project_response.status_code == 200 + assert create_project_response.json()["name"] == "Course A" + assert create_job_response.status_code == 200 + assert rename_response.status_code == 200 + assert rename_response.json()["name"] == "Course B" + project_names = [project["name"] for project in list_response.json()["projects"]] + assert "Course B" in project_names + assert "Course A" not in project_names + assert detail_response.json()["project_name"] == "Course B" + + +def test_delete_project_removes_jobs(monkeypatch, manager) -> None: + monkeypatch.setattr(structure_note_router_module, "_structure_note_manager", manager) + job_dirs = manager.storage.ensure_job_dirs("job_project_delete") + source_path = job_dirs["source"] / "demo.pdf" + source_path.write_text("pdf", encoding="utf-8") + artifact = manager.create_job( + file_name="demo.pdf", + source_format="pdf", + difficulty_level=DifficultyLevel.SIMPLE, + note_language=NoteLanguage.ZH, + style_level=ExplanationStyleLevel.LOW, + source_path=source_path, + task_id="task_1", + job_id="job_project_delete", + project_name="Course A", + ) + assert manager.storage.get_job_dir(artifact.job_id).exists() + + with TestClient(_build_app()) as client: + response = client.delete("/api/v1/structure-note/projects/Course%20A") + list_response = client.get("/api/v1/structure-note/jobs") + + assert response.status_code == 200 + assert response.json()["deleted_job_ids"] == ["job_project_delete"] + assert not manager.storage.get_job_dir(artifact.job_id).exists() + assert list_response.json()["jobs"] == [] 
+ + +def test_list_and_detail_jobs(monkeypatch, manager) -> None: + monkeypatch.setattr(structure_note_router_module, "_structure_note_manager", manager) + job_dirs = manager.storage.ensure_job_dirs("job_1") + source_path = job_dirs["source"] / "demo.pdf" + source_path.write_text("pdf", encoding="utf-8") + artifact = manager.create_job( + file_name="demo.pdf", + source_format="pdf", + difficulty_level=DifficultyLevel.SIMPLE, + note_language=NoteLanguage.ZH, + style_level=ExplanationStyleLevel.LOW, + source_path=source_path, + task_id="task_1", + job_id="job_1", + ) + manager.update_status(artifact, JobStatus.FAILED, error="boom", task_id="task_1") + + with TestClient(_build_app()) as client: + list_response = client.get("/api/v1/structure-note/jobs") + detail_response = client.get("/api/v1/structure-note/jobs/job_1") + + assert list_response.status_code == 200 + jobs = list_response.json()["jobs"] + assert jobs[0]["job_id"] == "job_1" + assert detail_response.status_code == 200 + assert detail_response.json()["retry_available"] is True + assert detail_response.json()["note_language"] == "zh" + assert detail_response.json()["style_level"] == "low" + + +def test_retry_failed_job(monkeypatch, manager) -> None: + monkeypatch.setattr(structure_note_router_module, "_structure_note_manager", manager) + + async def _noop_run(*_args, **_kwargs): + return None + + monkeypatch.setattr(structure_note_router_module, "_run_structure_note_job", _noop_run) + + job_dirs = manager.storage.ensure_job_dirs("job_retry") + source_path = job_dirs["source"] / "deck.pdf" + source_path.write_text("pdf", encoding="utf-8") + artifact = manager.create_job( + file_name="deck.pdf", + source_format="pdf", + difficulty_level=DifficultyLevel.MEDIUM, + note_language=NoteLanguage.EN, + style_level=ExplanationStyleLevel.MEDIUM, + source_path=source_path, + task_id="task_old", + job_id="job_retry", + ) + manager.update_status(artifact, JobStatus.FAILED, error="old error", task_id="task_old") + + with 
TestClient(_build_app()) as client: + response = client.post("/api/v1/structure-note/jobs/job_retry/retry") + + assert response.status_code == 200 + body = response.json() + assert body["job_id"] == "job_retry" + assert body["status"] == "queued" + assert body["task_id"] != "task_old" + + +def test_list_knowledge_base_source_files(monkeypatch, tmp_path: Path, manager) -> None: + monkeypatch.setattr(structure_note_router_module, "_structure_note_manager", manager) + monkeypatch.setattr( + structure_note_router_module, + "_kb_base_dir", + tmp_path / "data" / "knowledge_bases", + ) + _write_kb_raw_file(tmp_path, "Math", "lesson.pdf") + _write_kb_raw_file(tmp_path, "Ignored", "notes.txt") + + with TestClient(_build_app()) as client: + response = client.get("/api/v1/structure-note/kb/files") + + assert response.status_code == 200 + groups = response.json()["knowledge_bases"] + math_group = next(group for group in groups if group["kb_name"] == "Math") + assert math_group["files"][0]["file_id"] == "lesson.pdf" + assert math_group["files"][0]["file_name"] == "lesson.pdf" + ignored_group = next(group for group in groups if group["kb_name"] == "Ignored") + assert ignored_group["files"] == [] + + +def test_create_job_from_knowledge_base_file(monkeypatch, tmp_path: Path, manager) -> None: + monkeypatch.setattr(structure_note_router_module, "_structure_note_manager", manager) + monkeypatch.setattr( + structure_note_router_module, + "_kb_base_dir", + tmp_path / "data" / "knowledge_bases", + ) + + async def _noop_run(*_args, **_kwargs): + return None + + monkeypatch.setattr(structure_note_router_module, "_run_structure_note_job", _noop_run) + _write_kb_raw_file(tmp_path, "Math", "lesson.pdf") + + with TestClient(_build_app()) as client: + response = client.post( + "/api/v1/structure-note/jobs/from-kb", + data={ + "kb_name": "Math", + "file_id": "lesson.pdf", + "difficulty_level": DifficultyLevel.SIMPLE.value, + "note_language": NoteLanguage.ZH.value, + "style_level": 
ExplanationStyleLevel.MEDIUM.value, + }, + ) + + assert response.status_code == 200 + body = response.json() + assert body["file_name"] == "lesson.pdf" + assert body["project_name"] == "Math" + assert body["note_title"] == "lesson" + assert body["source_kind"] == "knowledge_base" + assert body["source_ref"] == { + "kb_name": "Math", + "file_id": "lesson.pdf", + "file_name": "lesson.pdf", + } + artifact = manager.get_job(body["job_id"]) + assert Path(artifact.source_path).exists() diff --git a/tests/services/test_path_service.py b/tests/services/test_path_service.py index 50162e2a5..c7222e924 100644 --- a/tests/services/test_path_service.py +++ b/tests/services/test_path_service.py @@ -30,9 +30,10 @@ def test_public_output_filter_allows_only_whitelisted_artifacts(tmp_path: Path) denied.parent.mkdir(parents=True, exist_ok=True) denied.write_text("{}", encoding="utf-8") - assert service.is_public_output_path( - "workspace/chat/deep_solve/solve_1/artifacts/plot.png" - ) is True + assert ( + service.is_public_output_path("workspace/chat/deep_solve/solve_1/artifacts/plot.png") + is True + ) assert service.is_public_output_path("settings/env.json") is False assert service.is_public_output_path("../outside.txt") is False finally: @@ -73,12 +74,16 @@ def test_public_output_filter_allows_math_animator_artifacts(tmp_path: Path) -> denied.parent.mkdir(parents=True, exist_ok=True) denied.write_text("print('debug')", encoding="utf-8") - assert service.is_public_output_path( - "workspace/chat/math_animator/turn_1/artifacts/animation.mp4" - ) is True - assert service.is_public_output_path( - "workspace/chat/math_animator/turn_1/source/scene.py" - ) is False + assert ( + service.is_public_output_path( + "workspace/chat/math_animator/turn_1/artifacts/animation.mp4" + ) + is True + ) + assert ( + service.is_public_output_path("workspace/chat/math_animator/turn_1/source/scene.py") + is False + ) finally: service._project_root = original_root service._user_data_dir = original_user_dir 
@@ -97,13 +102,72 @@ def test_task_workspace_maps_capabilities_into_workspace_chat(tmp_path: Path) -> tmp_path / "data" / "user" / "workspace" / "chat" / "chat" / "turn_1" ) assert service.get_task_workspace("deep_question", "turn_2") == ( - tmp_path - / "data" - / "user" + tmp_path / "data" / "user" / "workspace" / "chat" / "deep_question" / "turn_2" + ) + finally: + service._project_root = original_root + service._user_data_dir = original_user_dir + + +def test_public_output_filter_allows_structure_note_markdown_pdf_and_images(tmp_path: Path) -> None: + service = PathService.get_instance() + original_root = service._project_root + original_user_dir = service._user_data_dir + + try: + service._project_root = tmp_path + service._user_data_dir = tmp_path / "data" / "user" + + allowed = ( + service._user_data_dir / "workspace" - / "chat" - / "deep_question" - / "turn_2" + / "structure_note" + / "job_1" + / "final" + / "final.pdf" + ) + allowed.parent.mkdir(parents=True, exist_ok=True) + allowed.write_text("pdf", encoding="utf-8") + allowed_md = allowed.with_name("rendered.md") + allowed_md.write_text("# Note", encoding="utf-8") + allowed_image = ( + service._user_data_dir + / "workspace" + / "structure_note" + / "job_1" + / "images" + / "figure.png" + ) + allowed_image.parent.mkdir(parents=True, exist_ok=True) + allowed_image.write_text("png", encoding="utf-8") + + denied = ( + service._user_data_dir + / "workspace" + / "structure_note" + / "job_1" + / "chunks" + / "generation_chunks.json" + ) + denied.parent.mkdir(parents=True, exist_ok=True) + denied.write_text("{}", encoding="utf-8") + + assert ( + service.is_public_output_path("workspace/structure_note/job_1/final/final.pdf") is True + ) + assert ( + service.is_public_output_path("workspace/structure_note/job_1/final/rendered.md") + is True + ) + assert ( + service.is_public_output_path("workspace/structure_note/job_1/images/figure.png") + is True + ) + assert ( + service.is_public_output_path( + 
"workspace/structure_note/job_1/chunks/generation_chunks.json" + ) + is False ) finally: service._project_root = original_root diff --git a/tests/services/test_runtime_storage_guard.py b/tests/services/test_runtime_storage_guard.py index 068505b60..a713ddd1c 100644 --- a/tests/services/test_runtime_storage_guard.py +++ b/tests/services/test_runtime_storage_guard.py @@ -2,9 +2,9 @@ from pathlib import Path +from deeptutor.agents.research.utils.citation_manager import CitationManager from deeptutor.services.config.loader import load_config_with_main from deeptutor.services.path_service import PathService -from deeptutor.agents.research.utils.citation_manager import CitationManager def test_runtime_config_paths_are_confined_to_data_user() -> None: @@ -18,6 +18,7 @@ def test_runtime_config_paths_are_confined_to_data_user() -> None: assert Path(paths["research_output_dir"]).resolve().is_relative_to(user_root) assert Path(paths["research_reports_dir"]).resolve().is_relative_to(user_root) assert Path(paths["guide_output_dir"]).resolve().is_relative_to(user_root) + assert Path(paths["structure_note_output_dir"]).resolve().is_relative_to(user_root) assert Path(paths["user_log_dir"]).resolve() == user_root / "logs" assert Path(config["tools"]["run_code"]["workspace"]).resolve().is_relative_to(user_root) @@ -34,13 +35,7 @@ def test_citation_manager_defaults_to_research_workspace(tmp_path: Path) -> None manager = CitationManager("research_123") assert manager.cache_dir == ( - tmp_path - / "data" - / "user" - / "workspace" - / "chat" - / "deep_research" - / "research_123" + tmp_path / "data" / "user" / "workspace" / "chat" / "deep_research" / "research_123" ) finally: service._project_root = original_root diff --git a/tests/services/test_structure_note_service.py b/tests/services/test_structure_note_service.py new file mode 100644 index 000000000..679b583a4 --- /dev/null +++ b/tests/services/test_structure_note_service.py @@ -0,0 +1,373 @@ +from __future__ import annotations + 
+from pathlib import Path + +import pytest + +from deeptutor.services.structure_note import generator as generator_module +from deeptutor.services.structure_note.difficulty import get_difficulty_preset +from deeptutor.services.structure_note.generator import ( + _combination_instruction, + build_generation_chunks, + generate_transition_markdown, +) +from deeptutor.services.structure_note.image_pipeline import process_images +from deeptutor.services.structure_note.manager import StructureNoteManager +from deeptutor.services.structure_note.markdown_postprocessor import ( + normalize_structure_note_markdown, + validate_renderer_compatible_markdown, +) +from deeptutor.services.structure_note.models import ( + DifficultyLevel, + ExplanationStyleLevel, + GenerationChunk, + JobStatus, + NoteLanguage, + PageIndexPage, + SectionTreeNode, + StructureNoteArtifact, +) +from deeptutor.services.structure_note.normalizer import NormalizationError, normalize_to_pdf +from deeptutor.services.structure_note.planner import build_document_plan +from deeptutor.services.structure_note.tree_builder import build_section_tree + + +def _page(page_number: int, *, text: str = "", image_candidates=None) -> PageIndexPage: + return PageIndexPage( + page_number=page_number, + width=800, + height=1200, + text=text, + text_blocks=[], + title_candidates=[], + image_candidates=image_candidates or [], + ) + + +def test_normalizer_requires_soffice_for_ppt(monkeypatch, tmp_path: Path) -> None: + ppt_path = tmp_path / "deck.pptx" + ppt_path.write_text("fake", encoding="utf-8") + monkeypatch.setattr("shutil.which", lambda _name: None) + + with pytest.raises(NormalizationError) as exc: + normalize_to_pdf(ppt_path, tmp_path / "normalized") + + assert "LibreOffice" in str(exc.value) + + +def test_generation_chunks_use_difficulty_window() -> None: + pages = [_page(index, text=f"content {index}") for index in range(1, 15)] + chunks = build_generation_chunks(pages, [], 
get_difficulty_preset(DifficultyLevel.DETAILED)) + + assert chunks + assert all(len(chunk.page_numbers) <= 6 for chunk in chunks) + assert chunks[0].page_start == 1 + + +def test_generation_chunks_use_section_plan_not_page_windows() -> None: + pages = [_page(index, text=f"content {index}") for index in range(1, 15)] + sections = [ + SectionTreeNode( + section_id="section-001", + title="Long Section", + level=2, + page_start=1, + page_end=14, + summary="A long section.", + path=["Long Section"], + ) + ] + plan = build_document_plan(pages, sections, document_title="demo.pdf", language="en") + chunks = build_generation_chunks( + pages, + sections, + get_difficulty_preset(DifficultyLevel.DETAILED), + document_plan=plan, + ) + + assert len(chunks) == 1 + assert chunks[0].section_id == "section-001" + assert chunks[0].page_start == 1 + assert chunks[0].page_end == 14 + assert chunks[0].evidence + + +def test_generation_chunks_limit_parent_section_to_overview_pages() -> None: + pages = [_page(index, text=f"content {index}") for index in range(1, 7)] + sections = [ + SectionTreeNode( + section_id="section-001", + title="Chapter", + level=2, + page_start=1, + page_end=6, + summary="Chapter overview.", + child_ids=["section-002"], + path=["Chapter"], + ), + SectionTreeNode( + section_id="section-002", + title="Main Topic", + level=3, + page_start=2, + page_end=6, + parent_id="section-001", + summary="Main details.", + path=["Chapter", "Main Topic"], + ), + ] + plan = build_document_plan(pages, sections, document_title="demo.pdf", language="en") + chunks = build_generation_chunks( + pages, + sections, + get_difficulty_preset(DifficultyLevel.MEDIUM), + document_plan=plan, + ) + + assert [chunk.section_id for chunk in chunks] == ["section-001", "section-002"] + assert chunks[0].page_numbers == [1] + assert chunks[1].page_numbers == [2, 3, 4, 5, 6] + + +@pytest.mark.parametrize( + ("depth", "style", "expected"), + [ + (DifficultyLevel.SIMPLE, ExplanationStyleLevel.LOW, 
"短篇幅、低门槛"), + (DifficultyLevel.SIMPLE, ExplanationStyleLevel.MEDIUM, "核心知识骨架"), + (DifficultyLevel.SIMPLE, ExplanationStyleLevel.HIGH, "short but dense"), + (DifficultyLevel.MEDIUM, ExplanationStyleLevel.LOW, "中等篇幅、科普风格"), + (DifficultyLevel.MEDIUM, ExplanationStyleLevel.MEDIUM, "默认模式"), + (DifficultyLevel.MEDIUM, ExplanationStyleLevel.HIGH, "学术课堂风格"), + (DifficultyLevel.DETAILED, ExplanationStyleLevel.LOW, "长篇幅、低门槛"), + (DifficultyLevel.DETAILED, ExplanationStyleLevel.MEDIUM, "完整课堂讲义"), + (DifficultyLevel.DETAILED, ExplanationStyleLevel.HIGH, "学术讲义/课程笔记"), + ], +) +def test_depth_style_combinations_have_stable_prompt_semantics( + depth: DifficultyLevel, + style: ExplanationStyleLevel, + expected: str, +) -> None: + assert expected in _combination_instruction(depth, style, NoteLanguage.ZH.value) + + +def test_markdown_postprocessor_normalizes_renderer_math_syntax() -> None: + markdown = ( + "Use $x + y$ to express the sum, call \\(softmax(x)\\), and keep currency $100.\n\n" + "$$a=b$$\n\n" + "$$\\(c=d\\)$$\n\n" + "\\[e=f\\]\n\n" + "```python\nprint('$x$')\n```\n" + ) + + normalized = normalize_structure_note_markdown(markdown) + + assert "$x + y$" in normalized + assert "`softmax(x)`" in normalized + assert "$$\na=b\n$$" in normalized + assert "$$\nc=d\n$$" in normalized + assert "$$\ne=f\n$$" in normalized + assert "\\(" not in normalized + assert "\\[" not in normalized + assert "print('$x$')" in normalized + assert validate_renderer_compatible_markdown(normalized).ok is True + + +def test_markdown_validation_detects_damaged_formula() -> None: + result = validate_renderer_compatible_markdown("The update is $x + \\frac{1}{2.\n") + + assert result.ok is False + assert any("damaged inline math delimiter" in warning for warning in result.warnings) + + +def test_compose_markdown_inserts_generated_transition_between_major_sections() -> None: + artifact = StructureNoteArtifact( + job_id="job_1", + file_name="demo.pdf", + source_format="pdf", + 
difficulty_level=DifficultyLevel.MEDIUM, + note_language=NoteLanguage.ZH, + style_level=ExplanationStyleLevel.HIGH, + status=JobStatus.RENDERING, + source_path="/tmp/demo.pdf", + created_at="2026-01-01T00:00:00", + updated_at="2026-01-01T00:00:00", + ) + chunks = [ + GenerationChunk( + chunk_id="chunk-001", + section_id="section-001", + section_title="基础概念", + section_summary="基础概念", + section_path=["基础概念"], + heading_level=2, + page_start=1, + page_end=3, + page_numbers=[1, 2, 3], + markdown="## 基础概念\n\n内容。", + ), + GenerationChunk( + chunk_id="chunk-002", + section_id="section-002", + section_title="理论展开", + section_summary="理论展开", + section_path=["理论展开"], + heading_level=2, + page_start=4, + page_end=6, + page_numbers=[4, 5, 6], + markdown="## 理论展开\n\n内容。", + ), + ] + + markdown = StructureNoteManager()._compose_markdown( + artifact, + chunks, + NoteLanguage.ZH.value, + transition_map={ + "section-002": "基础概念已经确定了问题的核心变量,但要解释这些变量如何形成稳定关系,还需要进入理论层面的约束与推理。" + }, + ) + + assert "> **过渡:**" not in markdown + assert "建立了必要的概念基础" not in markdown + assert "核心变量" in markdown + assert "基础概念" in markdown + assert "理论展开" in markdown + + +@pytest.mark.asyncio +async def test_generate_transition_markdown_uses_llm_context(monkeypatch) -> None: + captured: dict[str, str] = {} + + async def _fake_complete(prompt: str, **_kwargs): + captured["prompt"] = prompt + return ( + "> 前面的定义已经说明目标函数衡量什么,但优化过程还需要解释参数为什么沿梯度方向移动。" + ) + + monkeypatch.setattr(generator_module, "llm_complete", _fake_complete) + previous = GenerationChunk( + chunk_id="chunk-001", + section_id="section-001", + section_title="目标函数", + section_summary="定义损失与优化目标。", + section_path=["目标函数"], + heading_level=2, + page_start=1, + page_end=2, + page_numbers=[1, 2], + markdown="## 目标函数\n\n损失函数刻画预测与真实结果之间的差异。" * 20, + ) + current = GenerationChunk( + chunk_id="chunk-002", + section_id="section-002", + section_title="梯度下降", + section_summary="用梯度更新参数。", + section_path=["梯度下降"], + heading_level=2, + page_start=3, + 
page_end=4, + page_numbers=[3, 4], + markdown="## 梯度下降\n\n梯度方向给出局部变化最快的方向。", + ) + + transition = await generate_transition_markdown( + previous, + current, + language=NoteLanguage.ZH.value, + style_level=ExplanationStyleLevel.HIGH, + ) + + assert transition.startswith("前面的定义") + assert not transition.startswith(">") + assert "Title: 目标函数" in captured["prompt"] + assert "Title: 梯度下降" in captured["prompt"] + assert "损失函数刻画预测" in captured["prompt"] + assert "梯度方向给出" in captured["prompt"] + assert "Do NOT use template phrases" in captured["prompt"] + + +@pytest.mark.asyncio +async def test_generate_transition_markdown_falls_back_without_blocking(monkeypatch) -> None: + async def _raise_complete(*_args, **_kwargs): + raise RuntimeError("llm unavailable") + + monkeypatch.setattr(generator_module, "llm_complete", _raise_complete) + previous = GenerationChunk( + chunk_id="chunk-001", + section_title="A", + section_path=["A"], + heading_level=2, + page_start=1, + page_end=1, + page_numbers=[1], + markdown="## A\n\nA content.", + ) + current = GenerationChunk( + chunk_id="chunk-002", + section_title="B", + section_path=["B"], + heading_level=2, + page_start=2, + page_end=2, + page_numbers=[2], + markdown="## B\n\nB content.", + ) + + transition = await generate_transition_markdown( + previous, + current, + language=NoteLanguage.EN.value, + style_level=ExplanationStyleLevel.MEDIUM, + ) + + assert transition == "A leads naturally to B." 
+ + +@pytest.mark.asyncio +async def test_tree_builder_falls_back_without_candidates() -> None: + pages = [_page(index, text=f"content {index}") for index in range(1, 12)] + tree = await build_section_tree(pages, page_window=5, language="en") + + assert tree + assert tree[0].page_start == 1 + assert tree[0].page_end == 5 + + +def test_image_pipeline_falls_back_to_full_page(tmp_path: Path) -> None: + fitz = pytest.importorskip("fitz") + pdf_path = tmp_path / "demo.pdf" + document = fitz.open() + page = document.new_page(width=400, height=600) + page.insert_text((72, 72), "Hello Structure Note") + document.save(pdf_path) + document.close() + + pages = [_page(1, text="Hello", image_candidates=[])] + chunks = [ + GenerationChunk( + chunk_id="chunk-001", + section_title="Page 1", + section_path=["Page 1"], + page_start=1, + page_end=1, + page_numbers=[1], + markdown="## Page 1\n\n[[IMAGE_PLACEHOLDER:chunk-001-image-1:1:key_figure]]\n", + placeholder_ids=["chunk-001-image-1"], + ) + ] + + next_chunks, placeholders, citations = process_images( + chunks, + pages, + pdf_path, + tmp_path / "images", + "demo.pdf", + language="en", + ) + + assert placeholders[0].status == "fallback_page" + assert citations[0].source_kind == "image" + assert "images/chunk-001-image-1.png" in next_chunks[0].markdown + assert "It supports the explanation of Page 1" in next_chunks[0].markdown diff --git a/web/app/(workspace)/structure-note/page.tsx b/web/app/(workspace)/structure-note/page.tsx new file mode 100644 index 000000000..0f40aacb9 --- /dev/null +++ b/web/app/(workspace)/structure-note/page.tsx @@ -0,0 +1,1876 @@ +'use client' + +import { useEffect, useMemo, useRef, useState } from 'react' +import { + AlertCircle, + BookOpen, + CheckCircle2, + ChevronDown, + ChevronRight, + Clock3, + Database, + Download, + Eye, + FileText, + FolderOpen, + Layers3, + ListTree, + Loader2, + PanelLeftClose, + PanelLeftOpen, + Pencil, + Plus, + RefreshCcw, + ScrollText, + Trash2, + Upload, + X, +} from 
'lucide-react' +import { useTranslation } from 'react-i18next' +import RichMarkdownRenderer from '@/components/common/RichMarkdownRenderer' +import Button from '@/components/ui/Button' +import { apiUrl } from '@/lib/api' +import { + createStructureNoteJob, + createStructureNoteJobFromKnowledgeBase, + createStructureNoteProject, + deleteStructureNoteProject, + fetchStructureNoteMarkdown, + getStructureNoteJob, + invalidateStructureNoteCaches, + listStructureNoteJobs, + listStructureNoteKnowledgeBaseFiles, + listStructureNoteProjects, + renameStructureNoteProject, + retryStructureNoteJob, + type StructureNoteDifficulty, + type StructureNoteJob, + type StructureNoteKbFile, + type StructureNoteKbGroup, + type StructureNoteLanguage, + type StructureNoteProject, + type StructureNoteStatus, + type StructureNoteStyleLevel, +} from '@/lib/structure-note-api' + +type SourceMode = 'upload' | 'knowledge_base' + +interface MaterialNode { + key: string + fileName: string + sourceKind: 'upload' | 'knowledge_base' + updatedAt: string +} + +interface VersionNode { + label: string + job: StructureNoteJob + isLatest: boolean +} + +interface NoteNode { + key: string + title: string + sourceFileName: string + latestJob: StructureNoteJob + versions: VersionNode[] +} + +interface ProjectNode { + key: string + name: string + materials: MaterialNode[] + notes: NoteNode[] +} + +type MaterialMap = Map +type NoteJobMap = Map + +interface ProjectAccumulator { + name: string + materials: MaterialMap + notes: NoteJobMap +} + +const PROCESSING_STATUS_ORDER: StructureNoteStatus[] = [ + 'queued', + 'normalizing', + 'indexing', + 'planning', + 'generating', + 'processing_images', + 'rendering', +] + +const PROCESSING_STATUSES = new Set(PROCESSING_STATUS_ORDER) + +const DIFFICULTY_OPTIONS: Array<{ + value: StructureNoteDifficulty + labelKey: string + hintKey: string +}> = [ + { + value: 'simple', + labelKey: 'Simple', + hintKey: 'Shorter notes focused on key definitions and outcomes.', + }, + { + 
value: 'medium', + labelKey: 'Medium', + hintKey: 'Balanced classroom-style coverage with core logic.', + }, + { + value: 'detailed', + labelKey: 'Detailed', + hintKey: 'Longer notes with deeper reasoning and slower generation.', + }, +] + +const NOTE_LANGUAGE_OPTIONS: Array<{ + value: StructureNoteLanguage + labelKey: string + hintKey: string +}> = [ + { + value: 'zh', + labelKey: 'Chinese', + hintKey: 'Generate the final note content in Chinese.', + }, + { + value: 'en', + labelKey: 'English', + hintKey: 'Generate the final note content in English.', + }, +] + +const STYLE_LEVEL_OPTIONS: Array<{ + value: StructureNoteStyleLevel + labelKey: string + hintKey: string +}> = [ + { + value: 'low', + labelKey: 'Low', + hintKey: 'Popular-science style for fast entry-level understanding.', + }, + { + value: 'medium', + labelKey: 'Medium', + hintKey: 'Standard classroom note style with balanced clarity and detail.', + }, + { + value: 'high', + labelKey: 'High', + hintKey: + 'Academic style with more rigorous principles, formulas, and derivations when supported.', + }, +] + +const STATUS_LABELS: Record = { + queued: 'Queued', + normalizing: 'Normalizing source', + indexing: 'Building page index', + planning: 'Planning sections', + generating: 'Generating notes', + processing_images: 'Processing figures', + rendering: 'Rendering PDF', + ready: 'Ready', + failed: 'Failed', +} + +function formatTimestamp(value: string) { + if (!value) return '' + try { + return new Intl.DateTimeFormat(undefined, { + month: 'short', + day: 'numeric', + hour: 'numeric', + minute: '2-digit', + }).format(new Date(value)) + } catch { + return value + } +} + +function formatFileSize(sizeBytes: number) { + if (!Number.isFinite(sizeBytes) || sizeBytes <= 0) return '' + if (sizeBytes < 1024 * 1024) { + return `${Math.max(1, Math.round(sizeBytes / 1024))} KB` + } + return `${(sizeBytes / 1024 / 1024).toFixed(1)} MB` +} + +function formatPageRange(pageStart: number, pageEnd: number) { + return pageStart 
=== pageEnd ? `p. ${pageStart}` : `pp. ${pageStart}-${pageEnd}` +} + +function stripExtension(fileName: string) { + return fileName.replace(/\.[^/.]+$/, '') || fileName +} + +function getProjectInitials(name: string) { + const compact = name.trim() + if (!compact) return 'SN' + return compact.slice(0, 2).toUpperCase() +} + +function getProjectName(job: StructureNoteJob) { + return job.project_name || job.source_ref?.kb_name || 'Local Uploads' +} + +function getSourceKind(job: StructureNoteJob): 'upload' | 'knowledge_base' { + return job.source_kind === 'knowledge_base' ? 'knowledge_base' : 'upload' +} + +function getSourceFileName(job: StructureNoteJob) { + return job.source_ref?.file_name || job.file_name +} + +function getSourceFileId(job: StructureNoteJob) { + if (getSourceKind(job) === 'knowledge_base') { + return `${job.source_ref?.kb_name || getProjectName(job)}/${job.source_ref?.file_id || job.file_name}` + } + return job.source_ref?.file_name || job.file_name +} + +function getMaterialKey(job: StructureNoteJob) { + return `${getSourceKind(job)}:${getProjectName(job)}:${getSourceFileId(job)}` +} + +function getNoteTitle(job: StructureNoteJob) { + return job.note_title || stripExtension(getSourceFileName(job)) +} + +function getStatusProgress(status: StructureNoteStatus) { + if (status === 'ready' || status === 'failed') return 100 + const index = PROCESSING_STATUS_ORDER.indexOf(status) + if (index < 0) return 8 + return Math.max(10, Math.round(((index + 1) / PROCESSING_STATUS_ORDER.length) * 92)) +} + +function buildProjectTree( + jobs: StructureNoteJob[], + projectRecords: StructureNoteProject[] +): ProjectNode[] { + const projectMap = new Map() + + projectRecords.forEach(project => { + const projectName = project.name.trim() + if (!projectName) return + projectMap.set(projectName, { + name: projectName, + materials: new Map(), + notes: new Map(), + }) + }) + + jobs.forEach(job => { + const projectName = getProjectName(job) + const projectKey = projectName 
+ const project = projectMap.get(projectKey) ?? { + name: projectName, + materials: new Map(), + notes: new Map(), + } + const materialKey = getMaterialKey(job) + const existingMaterial = project.materials.get(materialKey) + if (!existingMaterial || job.updated_at > existingMaterial.updatedAt) { + project.materials.set(materialKey, { + key: materialKey, + fileName: getSourceFileName(job), + sourceKind: getSourceKind(job), + updatedAt: job.updated_at, + }) + } + project.notes.set(materialKey, [...(project.notes.get(materialKey) ?? []), job]) + projectMap.set(projectKey, project) + }) + + return Array.from(projectMap.entries()) + .map(([projectKey, project]) => { + const notes = Array.from(project.notes.entries()) + .map(([noteKey, noteJobs]) => { + const sortedVersions = [...noteJobs].sort((a, b) => + a.created_at.localeCompare(b.created_at) + ) + const latestJob = sortedVersions[sortedVersions.length - 1] + return { + key: noteKey, + title: getNoteTitle(latestJob), + sourceFileName: getSourceFileName(latestJob), + latestJob, + versions: sortedVersions.map((job, index) => ({ + label: `v${index + 1}`, + job, + isLatest: index === sortedVersions.length - 1, + })), + } + }) + .sort((a, b) => b.latestJob.updated_at.localeCompare(a.latestJob.updated_at)) + + return { + key: projectKey, + name: project.name, + materials: Array.from(project.materials.values()).sort((a, b) => + a.fileName.localeCompare(b.fileName) + ), + notes, + } + }) + .sort((a, b) => a.name.localeCompare(b.name)) +} + +function rewriteRelativeMarkdownAssets(content: string, assetBaseUrl: string | null) { + if (!assetBaseUrl) return content + const base = apiUrl(assetBaseUrl).replace(/\/$/, '') + return content.replace( + /(!\[[^\]]*\]\()((?!https?:\/\/|data:|\/|#)[^)]+)(\))/gi, + (_match, prefix, src, suffix) => { + const normalizedSrc = String(src).replace(/^\.\//, '') + return `${prefix}${base}/${normalizedSrc}${suffix}` + } + ) +} + +function scrollToSection(sectionId: string) { + const target = 
document.getElementById(sectionId) + target?.scrollIntoView({ block: 'start', behavior: 'smooth' }) +} + +function StatusIcon({ status }: { status: StructureNoteStatus }) { + if (status === 'ready') { + return