From caba92a820ea3212e98a7ed9fd1294c40668d6eb Mon Sep 17 00:00:00 2001
From: Jack Luar <jluar@precisioninno.com>
Date: Sun, 7 Jun 2026 06:15:30 +0000
Subject: [PATCH 1/3] ci: pre-build FAISS indices in Docker image to fix ~60
 min graph init

Graph initialisation during the docker-eval CI job was taking ~60 minutes
because all 6 FAISS vector indices were rebuilt from scratch at container
startup on every run (HuggingFace CPU inference over the full corpus, or
Google Gemini embedding API exhausting its quota and retrying with 60 s
minimum backoff).

Root cause:
- HybridRetrieverChain.create_hybrid_retriever() takes the slow embed_docs()
  path when faiss_db/<name> does not exist on disk.
- The faiss_data named volume is empty on every CI run (docker compose down
  --volumes is called between jobs), so the indices are never reused.

Fix:
- Add backend/scripts/build_faiss.py: runs RetrieverTools.initialize() with
  EMBEDDINGS_TYPE=HF, FAST_MODE=true, and contextual_rerank=False at Docker
  build time, saving all 6 FAISS indices into the image layer.
- Add a RUN step in the Dockerfile that calls the script after the dataset
  is downloaded. Docker layer caching means the step is skipped on re-runs
  where neither source nor data changed.
- Set ENV EMBEDDINGS_TYPE=HF / HF_EMBEDDINGS=thenlper/gte-large as container
  defaults so runtime matches the pre-built indices (override in .env or via
  docker run -e if a different model is needed).
- Add contextual_rerank: bool = True param to RetrieverTools.initialize() so
  the build script can skip loading the cross-encoder model, keeping the
  Docker build dependency-light.

On first CI run with an empty faiss_data volume Docker copies the pre-built
indices from the image into the volume automatically, so the container finds
faiss_db/<name> at startup and takes the load_db() path instead.  Graph init
drops from ~60 min to a few seconds.

Note: ensure backend/.env (or ci-secret.yaml) sets EMBEDDINGS_TYPE=HF to
match the pre-built indices; using a different model at runtime causes a
vector dimension mismatch.

Signed-off-by: Jack Luar <jluar@precisioninno.com>
---
 backend/Dockerfile                    | 17 +++++++++
 backend/scripts/build_faiss.py        | 52 +++++++++++++++++++++++++++
 backend/src/agents/retriever_tools.py | 13 +++----
 3 files changed, 76 insertions(+), 6 deletions(-)
 create mode 100644 backend/scripts/build_faiss.py
diff --git a/backend/Dockerfile b/backend/Dockerfile
index b8cbb94f..de9ddd83 100644
--- a/backend/Dockerfile
+++ b/backend/Dockerfile
@@ -27,6 +27,23 @@ RUN git clone https://huggingface.co/datasets/The-OpenROAD-Project/ORAssistant_R
     mv ORAssistant_RAG_Dataset/* data/ && \
     rm -rf ORAssistant_RAG_Dataset
 
+# Build FAISS indices into the image using HuggingFace embeddings (no API quota).
+# At container startup HybridRetrieverChain detects faiss_db/ and loads from disk,
+# reducing graph init from ~60 min to a few seconds.
+# Override these ARGs to build with a different model when needed.
+ARG BUILD_EMBEDDINGS_TYPE=HF
+ARG BUILD_HF_MODEL=thenlper/gte-large
+RUN PYTHONPATH=/ORAssistant-backend \
+    EMBEDDINGS_TYPE=${BUILD_EMBEDDINGS_TYPE} \
+    HF_EMBEDDINGS=${BUILD_HF_MODEL} \
+    FAST_MODE=true \
+    uv run python scripts/build_faiss.py
+
+# Set HF as the default embedding backend so runtime matches the pre-built indices.
+# Override at container runtime (docker run -e / docker-compose environment) if needed.
+ENV EMBEDDINGS_TYPE=HF
+ENV HF_EMBEDDINGS=thenlper/gte-large
+
 EXPOSE 8000
 
 CMD ["uv", "run", "uvicorn", "src.api.main:app", "--host", "0.0.0.0", "--port", "8000", "--reload"]
diff --git a/backend/scripts/build_faiss.py b/backend/scripts/build_faiss.py
new file mode 100644
index 00000000..8fda8a96
--- /dev/null
+++ b/backend/scripts/build_faiss.py
@@ -0,0 +1,52 @@
+"""
+Pre-build FAISS indices for all retriever chains at Docker image build time.
+
+Run from /ORAssistant-backend (the WORKDIR in the Dockerfile) so that data/ is
+reachable via relative paths.  Uses HuggingFace embeddings by default so no
+external API key or network quota is required during docker build.
+
+The saved indices land in faiss_db/ inside the image.  At container startup,
+HybridRetrieverChain.create_hybrid_retriever() detects existing directories and
+takes the load_db() path instead of re-embedding, dropping init time from ~60 min
+to a few seconds.
+
+EMBEDDINGS_TYPE and HF_EMBEDDINGS are read from the environment so the Dockerfile
+ARG values propagate through cleanly.
+"""
+
+import os
+import sys
+import logging
+
+logging.basicConfig(level="INFO", format="%(levelname)s %(message)s")
+
+if not os.path.isdir("data"):
+    sys.exit("ERROR: run from backend directory — data/ not found")
+
+embeddings_type = os.environ.get("EMBEDDINGS_TYPE", "HF")
+hf_embeddings = os.environ.get("HF_EMBEDDINGS", "thenlper/gte-large")
+fast_mode = os.environ.get("FAST_MODE", "true").lower() == "true"
+
+if embeddings_type != "HF":
+    sys.exit(
+        f"ERROR: build_faiss.py only supports EMBEDDINGS_TYPE=HF, got '{embeddings_type}'"
+    )
+
+embeddings_config = {"type": embeddings_type, "name": hf_embeddings}
+
+logging.info("Pre-building FAISS indices")
+logging.info("  model     : %s", hf_embeddings)
+logging.info("  fast_mode : %s", fast_mode)
+
+from src.agents.retriever_tools import RetrieverTools
+
+tools = RetrieverTools()
+tools.initialize(
+    embeddings_config=embeddings_config,
+    reranking_model_name="",
+    use_cuda=False,
+    fast_mode=fast_mode,
+    contextual_rerank=False,
+)
+
+logging.info("FAISS pre-build complete")
diff --git a/backend/src/agents/retriever_tools.py b/backend/src/agents/retriever_tools.py
index c2ad3823..ac299bf7 100644
--- a/backend/src/agents/retriever_tools.py
+++ b/backend/src/agents/retriever_tools.py
@@ -45,6 +45,7 @@ def initialize(
         reranking_model_name: str,
         use_cuda: bool = False,
         fast_mode: bool = False,
+        contextual_rerank: bool = True,
     ) -> None:
         markdown_docs_map = {
             "general": [
@@ -97,7 +98,7 @@ def initialize(
             else markdown_docs_map["general"],
             other_docs_path=[] if fast_mode else ["./data/pdf"],
             weights=[0.6, 0.2, 0.2],
-            contextual_rerank=True,
+            contextual_rerank=contextual_rerank,
             search_k=search_k,
             chunk_size=chunk_size,
         )
@@ -112,7 +113,7 @@ def initialize(
             if fast_mode
             else markdown_docs_map["install"],
             weights=[0.6, 0.2, 0.2],
-            contextual_rerank=True,
+            contextual_rerank=contextual_rerank,
             search_k=search_k,
             chunk_size=chunk_size,
         )
@@ -128,7 +129,7 @@ def initialize(
             else markdown_docs_map["commands"],
             other_docs_path=[] if fast_mode else ["./data/pdf"],
             weights=[0.6, 0.2, 0.2],
-            contextual_rerank=True,
+            contextual_rerank=contextual_rerank,
             search_k=search_k,
             chunk_size=chunk_size,
         )
@@ -143,7 +144,7 @@ def initialize(
             if fast_mode
             else ["./data/html/yosys_docs"],
             weights=[0.6, 0.2, 0.2],
-            contextual_rerank=True,
+            contextual_rerank=contextual_rerank,
             search_k=search_k,
             chunk_size=chunk_size,
         )
@@ -158,7 +159,7 @@ def initialize(
             if fast_mode
             else ["./data/html/klayout_docs"],
             weights=[0.6, 0.2, 0.2],
-            contextual_rerank=True,
+            contextual_rerank=contextual_rerank,
             search_k=search_k,
             chunk_size=chunk_size,
         )
@@ -173,7 +174,7 @@ def initialize(
             if fast_mode
             else markdown_docs_map["errinfo"],
             weights=[0.6, 0.2, 0.2],
-            contextual_rerank=True,
+            contextual_rerank=contextual_rerank,
             search_k=search_k,
             chunk_size=chunk_size,
         )

From 754588741b998dcf3a934e3b4b0c0b016cb6fb3f Mon Sep 17 00:00:00 2001
From: Jack Luar <jluar@precisioninno.com>
Date: Sun, 7 Jun 2026 07:47:37 +0000
Subject: [PATCH 2/3] fix: move import to top of build_faiss.py to satisfy ruff
 E402

Signed-off-by: Jack Luar <jluar@precisioninno.com>
---
 backend/scripts/build_faiss.py | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/backend/scripts/build_faiss.py b/backend/scripts/build_faiss.py
index 8fda8a96..ca59b651 100644
--- a/backend/scripts/build_faiss.py
+++ b/backend/scripts/build_faiss.py
@@ -14,9 +14,11 @@
 ARG values propagate through cleanly.
 """
 
+import logging
 import os
 import sys
-import logging
+
+from src.agents.retriever_tools import RetrieverTools
 
 logging.basicConfig(level="INFO", format="%(levelname)s %(message)s")
 
@@ -38,8 +40,6 @@
 logging.info("  model     : %s", hf_embeddings)
 logging.info("  fast_mode : %s", fast_mode)
 
-from src.agents.retriever_tools import RetrieverTools
-
 tools = RetrieverTools()
 tools.initialize(
     embeddings_config=embeddings_config,

From 72911e74b894a574b35ba34b5c08dc40072517aa Mon Sep 17 00:00:00 2001
From: Jack Luar <jluar@precisioninno.com>
Date: Sun, 7 Jun 2026 09:04:15 +0000
Subject: [PATCH 3/3] ci: make FAISS build incremental and decouple from PR
 builds

Move FAISS index construction out of the main Dockerfile into a
dedicated Dockerfile.faiss-cache built only by the new build-faiss.yml
secret CI workflow (manual trigger + on upload.yml completion).

The main Dockerfile now does COPY --from=faiss-cache-image, so PRs
never rebuild indices.

build_faiss.py gains per-index hash-based skipping: a manifest.json
tracks a SHA256 of each index source file paths+sizes. On each secret
CI run the previous faiss_db/ is extracted from the old cache image and
placed in the build context; unchanged indices are skipped entirely.

Index names migrated from fragile counter-based similarity_INST1..6 to
stable explicit names (general, install, commands, yosys_rtdocs,
klayout, errinfo) so manifest keys are stable across runs.

Signed-off-by: Jack Luar <jluar@precisioninno.com>
---
 .github/workflows/build-faiss.yml             |  59 ++++++
 backend/Dockerfile                            |  31 ++-
 backend/Dockerfile.faiss-cache                |  40 ++++
 backend/Dockerfile.faiss-cache.dockerignore   |   7 +
 backend/scripts/build_faiss.py                | 182 +++++++++++++++---
 backend/src/agents/retriever_tools.py         |   6 +
 backend/src/chains/hybrid_retriever_chain.py  |   3 +
 .../src/chains/similarity_retriever_chain.py  |   3 +-
 8 files changed, 285 insertions(+), 46 deletions(-)
 create mode 100644 .github/workflows/build-faiss.yml
 create mode 100644 backend/Dockerfile.faiss-cache
 create mode 100644 backend/Dockerfile.faiss-cache.dockerignore

diff --git a/.github/workflows/build-faiss.yml b/.github/workflows/build-faiss.yml
new file mode 100644
index 00000000..fa0f1ef9
--- /dev/null
+++ b/.github/workflows/build-faiss.yml
@@ -0,0 +1,59 @@
+name: Build FAISS cache image
+
+on:
+  workflow_dispatch:
+  workflow_run:
+    workflows: ["Upload latest documentation"]
+    types: [completed]
+
+permissions:
+  contents: read
+  packages: write
+
+env:
+  CACHE_IMAGE: ghcr.io/${{ github.repository_owner }}/orassistant-faiss-cache
+
+jobs:
+  build-faiss-cache:
+    # Skip if triggered by upload workflow that failed
+    if: >
+      github.event_name == 'workflow_dispatch' ||
+      github.event.workflow_run.conclusion == 'success'
+    runs-on: ubuntu-latest
+    steps:
+      - name: Checkout code
+        uses: actions/checkout@34e114876b0b11c390a56381ad16ebd13914f8d5  # v4.3.1
+
+      - name: Log in to GHCR
+        uses: docker/login-action@74a5d142397b4f367a81961eba4e8cd7edddf772  # v3.4.0
+        with:
+          registry: ghcr.io
+          username: ${{ github.actor }}
+          password: ${{ secrets.GITHUB_TOKEN }}
+
+      - name: Restore previous faiss_db for incremental build
+        run: |
+          mkdir -p backend/faiss_db
+          if docker pull ${{ env.CACHE_IMAGE }}:latest 2>/dev/null; then
+            docker create --name prev-faiss ${{ env.CACHE_IMAGE }}:latest
+            docker cp prev-faiss:/ORAssistant-backend/faiss_db/. backend/faiss_db/ || true
+            docker rm prev-faiss
+            echo "Restored previous faiss_db for incremental build"
+          else
+            echo "No previous cache image found — building all indices from scratch"
+          fi
+          # Ensure at least one file exists so COPY ./faiss_db in Dockerfile always succeeds
+          touch backend/faiss_db/.keep
+
+      - name: Build FAISS cache image
+        run: |
+          docker build \
+            -f backend/Dockerfile.faiss-cache \
+            -t ${{ env.CACHE_IMAGE }}:latest \
+            -t ${{ env.CACHE_IMAGE }}:${{ github.sha }} \
+            backend/
+
+      - name: Push FAISS cache image
+        run: |
+          docker push ${{ env.CACHE_IMAGE }}:latest
+          docker push ${{ env.CACHE_IMAGE }}:${{ github.sha }}
diff --git a/backend/Dockerfile b/backend/Dockerfile
index de9ddd83..01b00ef0 100644
--- a/backend/Dockerfile
+++ b/backend/Dockerfile
@@ -1,3 +1,8 @@
+# Pull pre-built FAISS indices from the cache image (built by the build-faiss CI workflow).
+# This avoids rebuilding indices on every PR — only the secret CI rebuilds them.
+ARG FAISS_CACHE_IMAGE=ghcr.io/the-openroad-project/orassistant-faiss-cache:latest
+FROM ${FAISS_CACHE_IMAGE} AS faiss-cache
+
 FROM ghcr.io/astral-sh/uv:python3.13-bookworm-slim
 
 WORKDIR /ORAssistant-backend
@@ -22,25 +27,13 @@ COPY . .
 
 RUN uv venv .venv && uv sync --dev && uv run /ORAssistant-backend/src/post_install.py
 
-RUN git clone https://huggingface.co/datasets/The-OpenROAD-Project/ORAssistant_RAG_Dataset && \
-    mkdir -p data && \
-    mv ORAssistant_RAG_Dataset/* data/ && \
-    rm -rf ORAssistant_RAG_Dataset
-
-# Build FAISS indices into the image using HuggingFace embeddings (no API quota).
-# At container startup HybridRetrieverChain detects faiss_db/ and loads from disk,
-# reducing graph init from ~60 min to a few seconds.
-# Override these ARGs to build with a different model when needed.
-ARG BUILD_EMBEDDINGS_TYPE=HF
-ARG BUILD_HF_MODEL=thenlper/gte-large
-RUN PYTHONPATH=/ORAssistant-backend \
-    EMBEDDINGS_TYPE=${BUILD_EMBEDDINGS_TYPE} \
-    HF_EMBEDDINGS=${BUILD_HF_MODEL} \
-    FAST_MODE=true \
-    uv run python scripts/build_faiss.py
-
-# Set HF as the default embedding backend so runtime matches the pre-built indices.
-# Override at container runtime (docker run -e / docker-compose environment) if needed.
+# Copy pre-built FAISS indices from the cache image.
+# HybridRetrieverChain detects faiss_db/<name> at startup and takes the fast load_db()
+# path, reducing graph init from ~60 min to a few seconds.
+COPY --from=faiss-cache /ORAssistant-backend/faiss_db ./faiss_db
+
+# Runtime embedding model must match the model used when building the indices.
+# Override via docker run -e or docker-compose environment if using a different model.
 ENV EMBEDDINGS_TYPE=HF
 ENV HF_EMBEDDINGS=thenlper/gte-large
 
diff --git a/backend/Dockerfile.faiss-cache b/backend/Dockerfile.faiss-cache
new file mode 100644
index 00000000..3929750e
--- /dev/null
+++ b/backend/Dockerfile.faiss-cache
@@ -0,0 +1,40 @@
+FROM ghcr.io/astral-sh/uv:python3.13-bookworm-slim
+
+WORKDIR /ORAssistant-backend
+
+RUN apt-get update && apt-get install -y \
+    build-essential \
+    gcc \
+    git \
+    git-lfs \
+    wget && \
+    git lfs install && \
+    rm -rf /var/lib/apt/lists/*
+
+RUN pip install uv
+
+COPY ./pyproject.toml /ORAssistant-backend/pyproject.toml
+COPY ./src ./src
+COPY ./scripts ./scripts
+
+RUN uv venv .venv && uv sync --dev && uv run /ORAssistant-backend/src/post_install.py
+
+# Restore previous faiss_db for incremental builds.
+# The build-faiss CI workflow extracts faiss_db/ from the previous cache image and places
+# it in the build context. On first run the directory contains only a .keep sentinel.
+COPY ./faiss_db ./faiss_db
+
+# Download the RAG dataset (always refreshed so the hash check in build_faiss.py
+# can detect data changes from the latest upload).
+RUN git clone https://huggingface.co/datasets/The-OpenROAD-Project/ORAssistant_RAG_Dataset && \
+    mkdir -p data && \
+    mv ORAssistant_RAG_Dataset/* data/ && \
+    rm -rf ORAssistant_RAG_Dataset
+
+ARG BUILD_EMBEDDINGS_TYPE=HF
+ARG BUILD_HF_MODEL=thenlper/gte-large
+RUN PYTHONPATH=/ORAssistant-backend \
+    EMBEDDINGS_TYPE=${BUILD_EMBEDDINGS_TYPE} \
+    HF_EMBEDDINGS=${BUILD_HF_MODEL} \
+    FAST_MODE=true \
+    uv run python scripts/build_faiss.py
diff --git a/backend/Dockerfile.faiss-cache.dockerignore b/backend/Dockerfile.faiss-cache.dockerignore
new file mode 100644
index 00000000..66542e52
--- /dev/null
+++ b/backend/Dockerfile.faiss-cache.dockerignore
@@ -0,0 +1,7 @@
+.venv
+*.egg-info
+.mypy-cache
+__pycache__
+data
+tests
+# faiss_db is intentionally NOT excluded — CI places previous indices here for incremental builds
diff --git a/backend/scripts/build_faiss.py b/backend/scripts/build_faiss.py
index ca59b651..8ea5852d 100644
--- a/backend/scripts/build_faiss.py
+++ b/backend/scripts/build_faiss.py
@@ -1,33 +1,35 @@
 """
-Pre-build FAISS indices for all retriever chains at Docker image build time.
+Pre-build FAISS indices at Docker image build time with per-index incremental skipping.
 
-Run from /ORAssistant-backend (the WORKDIR in the Dockerfile) so that data/ is
-reachable via relative paths.  Uses HuggingFace embeddings by default so no
-external API key or network quota is required during docker build.
+Each index has a hash computed from its source file paths + sizes. If the hash matches
+the stored manifest and the index directory already exists, that index is skipped.
+Only changed or missing indices are rebuilt, so the secret CI only pays for what changed.
 
-The saved indices land in faiss_db/ inside the image.  At container startup,
-HybridRetrieverChain.create_hybrid_retriever() detects existing directories and
-takes the load_db() path instead of re-embedding, dropping init time from ~60 min
-to a few seconds.
-
-EMBEDDINGS_TYPE and HF_EMBEDDINGS are read from the environment so the Dockerfile
-ARG values propagate through cleanly.
+Run from /ORAssistant-backend (the WORKDIR in the Dockerfile) so data/ is reachable.
+EMBEDDINGS_TYPE and HF_EMBEDDINGS are read from the environment.
 """
 
+import hashlib
+import json
 import logging
 import os
 import sys
+from pathlib import Path
 
-from src.agents.retriever_tools import RetrieverTools
+from src.chains.hybrid_retriever_chain import HybridRetrieverChain
 
 logging.basicConfig(level="INFO", format="%(levelname)s %(message)s")
 
-if not os.path.isdir("data"):
-    sys.exit("ERROR: run from backend directory — data/ not found")
+FAISS_DB_DIR = Path("faiss_db")
+MANIFEST_FILE = FAISS_DB_DIR / "manifest.json"
 
 embeddings_type = os.environ.get("EMBEDDINGS_TYPE", "HF")
 hf_embeddings = os.environ.get("HF_EMBEDDINGS", "thenlper/gte-large")
 fast_mode = os.environ.get("FAST_MODE", "true").lower() == "true"
+chunk_size = int(os.environ.get("CHUNK_SIZE", 4000))
+
+if not os.path.isdir("data"):
+    sys.exit("ERROR: run from backend directory — data/ not found")
 
 if embeddings_type != "HF":
     sys.exit(
@@ -36,17 +38,145 @@
 
 embeddings_config = {"type": embeddings_type, "name": hf_embeddings}
 
-logging.info("Pre-building FAISS indices")
-logging.info("  model     : %s", hf_embeddings)
-logging.info("  fast_mode : %s", fast_mode)
-
-tools = RetrieverTools()
-tools.initialize(
-    embeddings_config=embeddings_config,
-    reranking_model_name="",
-    use_cuda=False,
-    fast_mode=fast_mode,
-    contextual_rerank=False,
+_MD = "./data/markdown"
+_HTML = "./data/html"
+
+# Mirrors fastmode_docs_map / markdown_docs_map in retriever_tools.py.
+# Each entry must use the same paths and index_name as RetrieverTools.initialize().
+INDEX_DEFS: dict[bool, list[dict]] = {
+    True: [  # fast_mode=True
+        {"name": "general", "markdown_docs_path": [f"{_MD}/OR_docs"]},
+        {"name": "install", "markdown_docs_path": [f"{_MD}/ORFS_docs/installation"]},
+        {"name": "commands", "markdown_docs_path": [f"{_MD}/OR_docs/tools"]},
+        {
+            "name": "yosys_rtdocs",
+            "html_docs_path": [
+                f"{_HTML}/yosys_docs/yosyshq.readthedocs.io"
+                "/projects/yosys/en/latest/getting_started"
+            ],
+        },
+        {
+            "name": "klayout",
+            "html_docs_path": [f"{_HTML}/klayout_docs/www.klayout.de/examples"],
+        },
+        {"name": "errinfo", "markdown_docs_path": [f"{_MD}/gh_discussions/Bug"]},
+    ],
+    False: [  # fast_mode=False (full dataset)
+        {
+            "name": "general",
+            "markdown_docs_path": [
+                f"{_MD}/OR_docs",
+                f"{_MD}/ORFS_docs",
+                f"{_MD}/gh_discussions",
+                f"{_MD}/manpages/man1",
+                f"{_MD}/manpages/man2",
+                f"{_MD}/OpenSTA_docs",
+            ],
+            "html_docs_path": [f"{_HTML}/or_website/"],
+            "other_docs_path": ["./data/pdf"],
+        },
+        {
+            "name": "install",
+            "markdown_docs_path": [
+                f"{_MD}/ORFS_docs/installation",
+                f"{_MD}/OR_docs/installation",
+                f"{_MD}/gh_discussions/Build",
+                f"{_MD}/gh_discussions/Installation",
+                f"{_MD}/OpenSTA_docs",
+            ],
+        },
+        {
+            "name": "commands",
+            "markdown_docs_path": [
+                f"{_MD}/OR_docs/tools",
+                f"{_MD}/ORFS_docs/general",
+                f"{_MD}/gh_discussions/Query",
+                f"{_MD}/gh_discussions/Runtime",
+                f"{_MD}/gh_discussions/Documentation",
+                f"{_MD}/manpages/man1",
+                f"{_MD}/manpages/man2",
+                f"{_MD}/OpenSTA_docs",
+            ],
+            "other_docs_path": ["./data/pdf"],
+        },
+        {"name": "yosys_rtdocs", "html_docs_path": [f"{_HTML}/yosys_docs"]},
+        {"name": "klayout", "html_docs_path": [f"{_HTML}/klayout_docs"]},
+        {
+            "name": "errinfo",
+            "markdown_docs_path": [
+                f"{_MD}/manpages/man3",
+                f"{_MD}/gh_discussions/Bug",
+            ],
+        },
+    ],
+}
+
+
+def _source_paths(index_def: dict) -> list[str]:
+    paths: list[str] = []
+    for key in ("markdown_docs_path", "html_docs_path", "other_docs_path"):
+        paths.extend(index_def.get(key, []))
+    return paths
+
+
+def _hash_paths(paths: list[str]) -> str:
+    """Stable hash over file path + size for all files under the given directories."""
+    h = hashlib.sha256()
+    for base in sorted(p for p in paths if Path(p).exists()):
+        for f in sorted(Path(base).rglob("*")):
+            if f.is_file() and not f.name.startswith("."):
+                h.update(str(f.relative_to(Path(base))).encode())
+                h.update(str(f.stat().st_size).encode())
+    return h.hexdigest()
+
+
+def _load_manifest() -> dict:
+    if MANIFEST_FILE.exists():
+        return json.loads(MANIFEST_FILE.read_text())
+    return {}
+
+
+def _save_manifest(manifest: dict) -> None:
+    FAISS_DB_DIR.mkdir(exist_ok=True)
+    MANIFEST_FILE.write_text(json.dumps(manifest, indent=2))
+
+
+logging.info(
+    "Pre-building FAISS indices (fast_mode=%s, model=%s)", fast_mode, hf_embeddings
 )
 
-logging.info("FAISS pre-build complete")
+manifest = _load_manifest()
+updated = False
+
+for index_def in INDEX_DEFS[fast_mode]:
+    name: str = index_def["name"]
+    paths = _source_paths(index_def)
+    current_hash = _hash_paths(paths)
+    index_dir = FAISS_DB_DIR / name
+
+    if manifest.get(name) == current_hash and index_dir.is_dir():
+        logging.info("Skipping %s (source data unchanged)", name)
+        continue
+
+    logging.info("Building index: %s", name)
+    chain = HybridRetrieverChain(
+        embeddings_config=embeddings_config,
+        reranking_model_name="",
+        use_cuda=False,
+        index_name=name,
+        markdown_docs_path=index_def.get("markdown_docs_path"),
+        html_docs_path=index_def.get("html_docs_path"),
+        other_docs_path=index_def.get("other_docs_path"),
+        chunk_size=chunk_size,
+        contextual_rerank=False,
+    )
+    chain.create_hybrid_retriever()
+    manifest[name] = current_hash
+    updated = True
+    logging.info("Built index: %s", name)
+
+if updated:
+    _save_manifest(manifest)
+    logging.info("FAISS pre-build complete (manifest updated)")
+else:
+    logging.info("FAISS pre-build complete (all indices up to date, nothing rebuilt)")
diff --git a/backend/src/agents/retriever_tools.py b/backend/src/agents/retriever_tools.py
index ac299bf7..21ffa9ea 100644
--- a/backend/src/agents/retriever_tools.py
+++ b/backend/src/agents/retriever_tools.py
@@ -101,6 +101,7 @@ def initialize(
             contextual_rerank=contextual_rerank,
             search_k=search_k,
             chunk_size=chunk_size,
+            index_name="general",
         )
         general_retriever_chain.create_hybrid_retriever()
         RetrieverTools.general_retriever = general_retriever_chain.retriever
@@ -116,6 +117,7 @@ def initialize(
             contextual_rerank=contextual_rerank,
             search_k=search_k,
             chunk_size=chunk_size,
+            index_name="install",
         )
         install_retriever_chain.create_hybrid_retriever()
         RetrieverTools.install_retriever = install_retriever_chain.retriever
@@ -132,6 +134,7 @@ def initialize(
             contextual_rerank=contextual_rerank,
             search_k=search_k,
             chunk_size=chunk_size,
+            index_name="commands",
         )
         commands_retriever_chain.create_hybrid_retriever()
         RetrieverTools.commands_retriever = commands_retriever_chain.retriever
@@ -147,6 +150,7 @@ def initialize(
             contextual_rerank=contextual_rerank,
             search_k=search_k,
             chunk_size=chunk_size,
+            index_name="yosys_rtdocs",
         )
         yosys_rtdocs_retriever_chain.create_hybrid_retriever()
         RetrieverTools.yosys_rtdocs_retriever = yosys_rtdocs_retriever_chain.retriever
@@ -162,6 +166,7 @@ def initialize(
             contextual_rerank=contextual_rerank,
             search_k=search_k,
             chunk_size=chunk_size,
+            index_name="klayout",
         )
         klayout_retriever_chain.create_hybrid_retriever()
         RetrieverTools.klayout_retriever = klayout_retriever_chain.retriever
@@ -177,6 +182,7 @@ def initialize(
             contextual_rerank=contextual_rerank,
             search_k=search_k,
             chunk_size=chunk_size,
+            index_name="errinfo",
         )
         errinfo_retriever_chain.create_hybrid_retriever()
         RetrieverTools.errinfo_retriever = errinfo_retriever_chain.retriever
diff --git a/backend/src/chains/hybrid_retriever_chain.py b/backend/src/chains/hybrid_retriever_chain.py
index d96be2d8..44a24be8 100644
--- a/backend/src/chains/hybrid_retriever_chain.py
+++ b/backend/src/chains/hybrid_retriever_chain.py
@@ -36,6 +36,7 @@ def __init__(
         weights: list[float] = [0.33, 0.33, 0.33],
         chunk_size: int = 500,
         contextual_rerank: bool = False,
+        index_name: Optional[str] = None,
     ):
         super().__init__(
             llm_model=llm_model,
@@ -58,6 +59,7 @@ def __init__(
         self.chunk_size: int = chunk_size
 
         self.contextual_rerank: bool = contextual_rerank
+        self.index_name: Optional[str] = index_name
         self.retriever: Any  # RunnableParallel compatibility
 
     def create_hybrid_retriever(self) -> None:
@@ -72,6 +74,7 @@ def create_hybrid_retriever(self) -> None:
             html_docs_path=self.html_docs_path,
             chunk_size=self.chunk_size,
             use_cuda=self.use_cuda,
+            name=self.index_name,
         )
         if self.vector_db is None:
             cur_path = os.path.abspath(__file__)
diff --git a/backend/src/chains/similarity_retriever_chain.py b/backend/src/chains/similarity_retriever_chain.py
index 01547ebf..1c0285b2 100644
--- a/backend/src/chains/similarity_retriever_chain.py
+++ b/backend/src/chains/similarity_retriever_chain.py
@@ -28,6 +28,7 @@ def __init__(
         embeddings_config: Optional[dict[str, str]] = None,
         use_cuda: bool = False,
         chunk_size: int = 500,
+        name: Optional[str] = None,
     ):
         super().__init__(
             llm_model=llm_model,
@@ -36,7 +37,7 @@ def __init__(
         )
 
         SimilarityRetrieverChain.count += 1
-        self.name = f"similarity_INST{SimilarityRetrieverChain.count}"
+        self.name = name if name is not None else f"similarity_INST{SimilarityRetrieverChain.count}"
 
         self.embeddings_config: Optional[dict[str, str]] = embeddings_config
         self.use_cuda: bool = use_cuda