diff --git a/.github/PULL_REQUEST_TEMPLATE.md b/.github/PULL_REQUEST_TEMPLATE.md
new file mode 100644
index 00000000..2337d0f0
--- /dev/null
+++ b/.github/PULL_REQUEST_TEMPLATE.md
@@ -0,0 +1,21 @@
+## Summary
+
+<!-- Brief description of what this PR does -->
+
+## Changes
+
+<!-- List the key changes -->
+
+-
+
+## Checklist
+
+- [ ] Code compiles (`cargo build`)
+- [ ] Tests pass (`cargo test --lib --all-features`)
+- [ ] No new clippy warnings (`cargo clippy --all-features`)
+- [ ] Public APIs have documentation comments
+- [ ] Python bindings updated (if Rust API changed)
+
+## Notes
+
+<!-- Anything reviewers should know? Breaking changes, migration notes, etc. -->
diff --git a/Cargo.toml b/Cargo.toml
index 1a626bab..cd8fca41 100644
--- a/Cargo.toml
+++ b/Cargo.toml
@@ -3,7 +3,7 @@ members = ["rust", "python"]
 resolver = "2"
 
 [workspace.package]
-version = "0.1.28"
+version = "0.1.29"
 edition = "2024"
 authors = ["zTgx <beautifularea@gmail.com>"]
 license = "Apache-2.0"
diff --git a/README.md b/README.md
index 96d73505..556ba5f3 100644
--- a/README.md
+++ b/README.md
@@ -13,15 +13,11 @@
 
 </div>
 
-**Vectorless** is a reasoning-native document engine designed to be the foundational layer for AI applications that need structured access to documents, with the core written in Rust. It does not use vector databases, embeddings, or similarity search. Instead, it transforms documents into hierarchical semantic trees and uses the LLM itself to navigate and retrieve — purely LLM-guided, from indexing to querying.
+**Vectorless** is a reasoning-native document engine designed to be the foundational layer for AI applications that need structured access to documents, with the core written in Rust. It does not use vector databases, embeddings, or similarity search. Instead, it reasons through any of your structured documents — **PDFs, Markdown, reports, contracts** — and retrieves only what's relevant. Nothing more, nothing less.
 
 
 
-## Why Vectorless
-
-Most document retrieval solutions rely on vector similarity — splitting documents into chunks, embedding them, and searching by cosine distance. This works for rough topic matching, but breaks down when you need **precision**: specific numbers, cross-section references, or multi-step reasoning across a document.
-
-Vectorless takes a different approach. No vectors at all. It builds a **semantic tree index** of each document — preserving the original hierarchy — and uses the LLM itself to navigate that structure. The LLM generates the tree during indexing and reasons through it during retrieval. Pure LLM guidance, end to end.
+## How It Works
 
 <div align="center">
   <img src="https://vectorless.dev/img/workflow.svg" alt="Vectorless Workflow" width="900">
@@ -48,6 +44,7 @@ async fn main() -> vectorless::Result<()> {
     let engine = EngineBuilder::new()
         .with_key("sk-...")
         .with_model("gpt-4o")
+        .with_endpoint("https://api.openai.com/v1")
         .build()
         .await?;
 
@@ -77,7 +74,7 @@ import asyncio
 from vectorless import Engine, IndexContext, QueryContext
 
 async def main():
-    engine = Engine(api_key="sk-...", model="gpt-4o")
+    engine = Engine(api_key="sk-...", model="gpt-4o", endpoint="https://api.openai.com/v1")
 
     # Index a document
     result = await engine.index(IndexContext.from_path("./report.pdf"))
@@ -130,7 +127,7 @@ result = await engine.query(
 Indexed documents are stored in a workspace — there's no need to reprocess files between sessions:
 
 ```python
-engine = Engine(api_key="sk-...", model="gpt-4o")
+engine = Engine(api_key="sk-...", model="gpt-4o", endpoint="https://api.openai.com/v1")
 
 # List all indexed documents
 docs = await engine.list()
diff --git a/docs/docs/api-reference.mdx b/docs/docs/api-reference.mdx
new file mode 100644
index 00000000..5261afbf
--- /dev/null
+++ b/docs/docs/api-reference.mdx
@@ -0,0 +1,17 @@
+---
+sidebar_position: 9
+title: API Reference
+description: API reference for the Vectorless Rust crate and Python SDK.
+---
+
+# API Reference
+
+> This page is a work in progress. The full API reference will be published in a future update.
+
+In the meantime, you can refer to the following resources:
+
+- **Rust crate docs**: [docs.rs/vectorless](https://docs.rs/vectorless) — auto-generated documentation from source code
+- **Python SDK docs**: Available via `help(vectorless)` in an interactive Python session
+- **Source code**: [github.com/vectorlessflow/vectorless](https://github.com/vectorlessflow/vectorless)
+
+For usage examples, see [Quick Query](/docs/examples/quick-query), [Multi-Document](/docs/examples/multi-document), and [Batch Indexing](/docs/examples/batch-indexing).
diff --git a/docs/docusaurus.config.ts b/docs/docusaurus.config.ts
index 6b329f6e..b72d033d 100644
--- a/docs/docusaurus.config.ts
+++ b/docs/docusaurus.config.ts
@@ -111,7 +111,7 @@ const config: Config = {
             },
             {
               label: 'API Reference',
-              href: 'https://docs.rs/vectorless',
+              to: '/docs/api-reference',
             },
           ],
         },
@@ -133,7 +133,7 @@ const config: Config = {
           ],
         },
       ],
-      copyright: `Copyright © ${new Date().getFullYear()} Vectorless`,
+      copyright: `Copyright \u00A9 ${new Date().getFullYear()} Vectorless`,
     },
     prism: {
       theme: prismThemes.github,
diff --git a/docs/sidebars.ts b/docs/sidebars.ts
index e3ddf067..2f70bedb 100644
--- a/docs/sidebars.ts
+++ b/docs/sidebars.ts
@@ -42,6 +42,7 @@ const sidebars: SidebarsConfig = {
         'sdk/rust',
       ],
     },
+    'api-reference',
     {
       type: 'category',
       label: 'Examples',
diff --git a/docs/src/components/GitHubStar/index.tsx b/docs/src/components/GitHubStar/index.tsx
index b2247874..712e8b74 100644
--- a/docs/src/components/GitHubStar/index.tsx
+++ b/docs/src/components/GitHubStar/index.tsx
@@ -1,5 +1,5 @@
 import React, { useState, useEffect } from 'react';
-import { FaGithub, FaStar } from 'react-icons/fa';
+import { FaGithub } from 'react-icons/fa';
 import styles from './styles.module.css';
 
 function formatStars(count: number | null): string {
@@ -40,16 +40,16 @@ export default function GitHubStar(): React.ReactElement {
         rel="noopener noreferrer"
         className={styles.githubStarButton}
       >
-        <FaGithub size={14} />
+        <FaGithub size={16} />
         <span className={styles.githubStarText}>Star</span>
       </a>
       {loading ? (
         <div className={styles.githubStarCount}>
-          <span className={styles.spinner}>...</span>
+          <span className={styles.spinner}>&hellip;</span>
         </div>
       ) : (
         <a
-          href="https://github.com/vectorlessflow/vectorless/stargazers"
+          href="https://github.com/vectorlessflow/vectorless"
           target="_blank"
           rel="noopener noreferrer"
           className={styles.githubStarCount}
diff --git a/docs/src/components/GitHubStar/styles.module.css b/docs/src/components/GitHubStar/styles.module.css
index b46d03be..051e45c1 100644
--- a/docs/src/components/GitHubStar/styles.module.css
+++ b/docs/src/components/GitHubStar/styles.module.css
@@ -15,7 +15,7 @@
   border-radius: 3px;
   text-decoration: none;
   font-size: 12px;
-  font-weight: 700;
+  font-weight: 600;
   line-height: 24px;
   transition: background-color 0.2s;
 }
@@ -46,7 +46,7 @@
   margin-left: 5px;
   padding: 0 5px;
   font-size: 12px;
-  font-weight: 700;
+  font-weight: 600;
   line-height: 24px;
   border: 1px solid #d5d5d5;
   border-radius: 3px;
diff --git a/docs/src/css/custom.css b/docs/src/css/custom.css
index 8bbdf711..b6f2ebc6 100644
--- a/docs/src/css/custom.css
+++ b/docs/src/css/custom.css
@@ -6,18 +6,26 @@
 
 :root {
   --primary: #AF788B;
-  --primary-dark: #96637A;
+  --primary-dark: #8B5E6F;
+  --primary-deeper: #6E4556;
   --primary-light: #C9A0AE;
+  --primary-soft: rgba(175, 120, 139, 0.12);
   --text: #1e293b;
-  --text-light: #64748b;
+  --text-light: #5a4a52;
   --bg: #ffffff;
-  --bg-secondary: #fdf8f9;
-  --border: #e8dde1;
+  --bg-secondary: #F5EBEE;
+  --bg-offset: #F6F8FA;
+  --card-bg: #FAF5F7;
+  --border: #E2E8F0;
+  --code-bg: #0F172A;
+  --code-text: #E2E8F0;
+  --code-comment: #6272A4;
+  --code-keyword: #FF79C6;
 
   --ifm-color-primary: #AF788B;
-  --ifm-color-primary-dark: #96637A;
-  --ifm-color-primary-darker: #8d5a6f;
-  --ifm-color-primary-darkest: #6e4556;
+  --ifm-color-primary-dark: #8B5E6F;
+  --ifm-color-primary-darker: #7a5062;
+  --ifm-color-primary-darkest: #6E4556;
   --ifm-color-primary-light: #C9A0AE;
   --ifm-color-primary-lighter: #d3b0bb;
   --ifm-color-primary-lightest: #e8d0d8;
@@ -26,6 +34,19 @@
 }
 
 [data-theme='dark'] {
+  --text: #EEF2FF;
+  --text-light: #8B9AB0;
+  --bg: #0A0C10;
+  --bg-secondary: #11151A;
+  --bg-offset: #11151A;
+  --card-bg: #11151A;
+  --border: #1E293B;
+  --primary-soft: rgba(201, 160, 174, 0.15);
+  --code-bg: #010409;
+  --code-text: #E2E8F0;
+  --code-comment: #6272A4;
+  --code-keyword: #FF79C6;
+
   --ifm-color-primary: #C9A0AE;
   --ifm-color-primary-dark: #b88d9d;
   --ifm-color-primary-darker: #af7f91;
@@ -36,38 +57,92 @@
   --docusaurus-highlighted-code-line-bg: rgba(175, 120, 139, 0.2);
 }
 
-/* Navbar: no border, no shadow, match homepage bg */
+/* ===== Navbar ===== */
 .navbar {
-  background-color: #fdf8f9 !important;
+  background-color: var(--bg) !important;
   border-bottom: none !important;
   box-shadow: none !important;
+  height: 68px !important;
+  padding: 0 1.5rem !important;
+}
+
+.navbar__inner {
+  height: 68px !important;
+  max-width: 1200px;
+  margin: 0 auto;
+}
+
+.navbar__brand {
+  height: 68px !important;
+}
+
+.navbar__title {
+  font-size: 1.4rem !important;
+  font-weight: 700 !important;
+  color: var(--text) !important;
+  letter-spacing: -0.01em;
+}
+
+.navbar__logo {
+  height: 36px;
+  margin-right: 0.6rem;
+}
+
+.navbar__link {
+  font-size: 0.95rem !important;
+  font-weight: 500 !important;
+  color: var(--text-light) !important;
+  transition: color 0.15s !important;
+}
+
+.navbar__link:hover {
+  color: var(--primary-dark) !important;
+}
+
+.navbar__link--active {
+  color: var(--primary-dark) !important;
 }
 
 [data-theme='dark'] .navbar {
-  background-color: var(--ifm-background-color) !important;
+  background-color: var(--bg) !important;
+  border-bottom: none !important;
+}
+
+[data-theme='dark'] .navbar__title {
+  color: var(--text) !important;
+}
+
+[data-theme='dark'] .navbar__link {
+  color: var(--text-light) !important;
+}
+
+[data-theme='dark'] .navbar__link:hover {
+  color: var(--primary-light) !important;
+}
+
+[data-theme='dark'] .navbar__link--active {
+  color: var(--primary-light) !important;
 }
 
 /* ===== Footer ===== */
 .footer {
   background-color: transparent !important;
-  padding: 3rem 1.5rem 2rem;
+  padding: 5rem 1.5rem 1.5rem;
 }
 
-/* Column titles */
 .footer__title {
-  font-size: 0.8rem;
+  font-size: 0.85rem;
   font-weight: 700;
   text-transform: uppercase;
   letter-spacing: 0.08em;
   color: var(--text);
-  margin-bottom: 0.75rem;
+  margin-bottom: 1rem;
 }
 
-/* Link items */
 .footer__link-item {
-  font-size: 0.88rem;
+  font-size: 0.92rem;
   color: var(--text-light);
-  line-height: 1.8;
+  line-height: 2;
   transition: color 0.15s;
 }
 
@@ -75,18 +150,11 @@
   color: var(--primary);
 }
 
-/* Hide external-link icons */
 .footer__link-item svg {
   display: none;
 }
 
-/* Copyright */
 .footer__copyright {
-  text-align: center;
-  font-size: 0.8rem;
+  font-size: 0.88rem;
   color: var(--text-light);
-  letter-spacing: 0.03em;
-  margin-top: 2rem;
-  padding-top: 1.5rem;
-  border-top: 1px solid var(--border);
 }
diff --git a/docs/src/pages/index.module.css b/docs/src/pages/index.module.css
index 37cf66aa..f2685eb8 100644
--- a/docs/src/pages/index.module.css
+++ b/docs/src/pages/index.module.css
@@ -8,118 +8,115 @@
 
 /* ===== Hero ===== */
 .heroBanner {
-  padding: 5rem 1.5rem 4rem;
+  padding: 10rem 1.5rem 6rem;
   position: relative;
   overflow: hidden;
-  background: linear-gradient(180deg, var(--bg-secondary) 0%, var(--bg) 100%);
+  background-color: var(--bg);
 }
 
 .heroInner {
-  max-width: 1200px;
+  max-width: 1100px;
   margin: 0 auto;
-  display: flex;
-  align-items: center;
-  gap: 3rem;
+  text-align: center;
 }
 
-/* -- Left column -- */
-.heroContent {
-  flex: 1;
-  min-width: 0;
+.heroTitle {
+  font-size: 5.5rem;
+  font-weight: 800;
+  font-family: 'Inter', 'Libre Franklin', -apple-system, BlinkMacSystemFont, sans-serif;
+  color: var(--text);
+  margin: 0 0 1.75rem;
+  letter-spacing: -0.03em;
+  line-height: 1.1;
+  white-space: nowrap;
 }
 
-.heroLogo {
-  display: block;
-  max-width: 320px;
-  width: 100%;
-  height: auto;
-  margin-bottom: 1.5rem;
+.heroTitleEmphasis {
+  color: var(--text);
+}
+
+.heroTitleLight {
+  color: #9a8a92;
+  font-weight: 300;
 }
 
 .heroTagline {
   color: var(--text-light);
-  font-size: 1.15rem;
+  font-size: 1.3rem;
   line-height: 1.7;
-  margin: 0 0 1.75rem;
+  margin: 0 0 3rem;
 }
 
-.heroActions {
-  display: flex;
-  gap: 0.75rem;
-  flex-wrap: wrap;
+.heroTaglineHighlight {
+  color: var(--text);
+  font-weight: 600;
 }
 
-/* -- Right column: code preview -- */
-.codePreview {
-  flex: 1 1 520px;
-  max-width: 560px;
-  border-radius: 12px;
-  overflow: hidden;
-  border: 1px solid var(--border);
-  background: #1e1e2e;
-  box-shadow: 0 8px 32px rgba(0, 0, 0, 0.12);
+.heroTaglineLine1 {
+  /* first line is naturally longer */
 }
 
-.codeHeader {
-  display: flex;
-  align-items: center;
-  justify-content: space-between;
-  padding: 0.55rem 1rem;
-  background: #181825;
+.heroTaglineLine2 {
+  /* second line shorter */
 }
 
-.codeDots {
-  display: flex;
-  gap: 6px;
+.heroTagline strong {
+  color: var(--text);
+  font-weight: 600;
 }
 
-.codeDots span {
-  width: 10px;
-  height: 10px;
-  border-radius: 50%;
+.heroTagline em {
+  color: var(--primary-dark);
+  font-style: italic;
 }
 
-.codeDots span:nth-child(1) { background: #f38ba8; }
-.codeDots span:nth-child(2) { background: #f9e2af; }
-.codeDots span:nth-child(3) { background: #a6e3a1; }
+.heroActions {
+  display: flex;
+  gap: 1rem;
+  justify-content: center;
+  align-items: center;
+  flex-wrap: wrap;
+}
 
-.codeLang {
-  font-size: 0.7rem;
-  color: #6c7086;
-  font-weight: 500;
+/* GitHub Star button */
+.githubStarButton {
+  display: inline-flex;
+  align-items: center;
+  gap: 0.5rem;
+  padding: 0.8rem 1.8rem;
+  font-size: 1rem;
+  font-weight: 600;
+  border-radius: 999px;
+  background-color: var(--text);
+  color: #fff;
+  text-decoration: none;
 }
 
-.codeBlock {
-  margin: 0;
-  padding: 1rem 1.25rem;
-  font-size: 0.78rem;
-  line-height: 1.7;
-  color: #cdd6f4;
-  overflow-x: auto;
-  background: transparent;
+[data-theme='dark'] .githubStarButton {
+  background-color: #f3f3f3;
+  color: #333;
 }
 
-.codeBlock code {
-  font-family: 'SF Mono', 'Fira Code', 'JetBrains Mono', monospace;
-  font-size: 0.76rem;
+.starIcon {
+  margin-left: 0.4rem;
 }
 
 /* ===== Buttons ===== */
 .buttonPrimary {
   display: inline-flex;
   align-items: center;
-  padding: 0.65rem 1.6rem;
-  font-size: 0.92rem;
+  padding: 0.75rem 2rem;
+  font-size: 0.95rem;
   font-weight: 600;
   border-radius: 8px;
-  background-color: var(--primary);
+  background-color: var(--primary-dark);
   color: #fff;
   text-decoration: none;
   transition: background-color 0.2s, transform 0.1s;
 }
 
 .buttonPrimary:hover {
-  background-color: var(--primary-dark);
+  background-color: var(--primary-deeper);
   color: #fff;
   text-decoration: none;
   transform: translateY(-1px);
@@ -128,8 +125,8 @@
 .buttonSecondary {
   display: inline-flex;
   align-items: center;
-  padding: 0.65rem 1.6rem;
-  font-size: 0.92rem;
+  padding: 0.75rem 2rem;
+  font-size: 0.95rem;
   font-weight: 600;
   border-radius: 8px;
   background-color: transparent;
@@ -141,7 +138,7 @@
 
 .buttonSecondary:hover {
   border-color: var(--primary);
-  color: var(--primary);
+  color: var(--primary-dark);
   text-decoration: none;
   transform: translateY(-1px);
 }
@@ -152,7 +149,7 @@
 }
 
 .sectionAlt {
-  background-color: var(--bg-secondary);
+  background-color: var(--bg-offset);
 }
 
 .sectionInner {
@@ -175,192 +172,512 @@
   margin: 0 0 3rem;
 }
 
-/* ===== Feature Grid ===== */
-.grid {
-  display: grid;
-  grid-template-columns: repeat(3, 1fr);
+/* ===== Get Started — Linear Dark Demo Card ===== */
+.demoCard {
+  max-width: 1200px;
+  margin: 0 auto;
+  background: #121417;
+  border-radius: 16px;
+  border: 1px solid #23262B;
+  overflow: hidden;
+  box-shadow: 0 12px 40px rgba(0, 0, 0, 0.4);
+}
+
+.demoTabs {
+  display: flex;
+  align-items: center;
   gap: 1.5rem;
+  padding: 0 1.25rem;
+  border-bottom: 1px solid #23262B;
+  background: #121417;
 }
 
-.card {
-  padding: 1.75rem;
-  border-radius: 12px;
-  border: 1px solid var(--border);
-  background: var(--bg);
-  transition: border-color 0.2s, box-shadow 0.2s;
+.demoTab {
+  padding: 0.875rem 0 0.75rem;
+  font-size: 0.8rem;
+  font-weight: 500;
+  color: #8E95A3;
+  border: none;
+  border-bottom: 2px solid transparent;
+  background: transparent;
+  cursor: pointer;
+  transition: all 0.15s ease;
+  letter-spacing: -0.2px;
+  font-family: 'Inter', -apple-system, BlinkMacSystemFont, sans-serif;
 }
 
-.card:hover {
-  border-color: var(--primary-light);
-  box-shadow: 0 4px 20px rgba(175, 120, 139, 0.08);
+.demoTabActive {
+  color: #AF788B;
+  border-bottom-color: #AF788B;
 }
 
-.cardIcon {
-  display: inline-flex;
+.demoTab:not(.demoTabActive):hover {
+  color: #EBEDF0;
+}
+
+.demoPanel {
+  background: #0B0D0E;
+}
+
+.demoCodeHeader {
+  padding: 0.75rem 1.25rem;
+  background: #0B0D0E;
+  border-bottom: 1px solid #2A2E34;
+  display: flex;
   align-items: center;
-  justify-content: center;
-  width: 44px;
-  height: 44px;
-  font-size: 1.35rem;
-  border-radius: 10px;
-  background: var(--bg-secondary);
-  margin-bottom: 1rem;
+  gap: 0.75rem;
 }
 
-.cardTitle {
-  font-size: 1.05rem;
-  font-weight: 600;
-  margin: 0 0 0.5rem;
-  color: var(--text);
+.windowDots {
+  display: flex;
+  gap: 0.5rem;
 }
 
-.cardDesc {
-  font-size: 0.88rem;
-  line-height: 1.65;
-  color: var(--text-light);
+.windowDot {
+  width: 11px;
+  height: 11px;
+  border-radius: 50%;
+  display: inline-block;
+}
+
+.dotRed {
+  background: #ED6A5E;
+}
+
+.dotYellow {
+  background: #F5BD4F;
+}
+
+.dotGreen {
+  background: #61C454;
+}
+
+.copyBtn {
+  margin-left: auto;
+  background: transparent;
+  border: none;
+  color: #8E95A3;
+  font-size: 0.7rem;
+  font-family: 'JetBrains Mono', 'Fira Code', monospace;
+  cursor: pointer;
+  padding: 0.25rem 0.75rem;
+  border-radius: 6px;
+  transition: all 0.15s;
+  letter-spacing: -0.2px;
+}
+
+.copyBtn:hover {
+  background: rgba(175, 120, 139, 0.1);
+  color: #AF788B;
+}
+
+.demoPre {
   margin: 0;
+  padding: 1.75rem 2rem;
+  overflow-x: auto;
+  font-family: 'JetBrains Mono', 'Fira Code', 'SF Mono', Menlo, monospace;
+  font-size: 0.85rem;
+  line-height: 1.75;
+  color: #EBEDF0;
+  background: #0B0D0E;
 }
 
-/* ===== How It Works ===== */
-.steps {
+.demoPre code {
+  font-family: inherit;
+  background: transparent;
+  border: none;
+  padding: 0;
+  color: inherit;
+}
+
+/* Syntax highlight tokens */
+.hlKeyword {
+  color: #AF788B;
+  font-weight: 500;
+}
+
+.hlFunction {
+  color: #6DCDFF;
+}
+
+.hlString {
+  color: #B0E57C;
+}
+
+.hlComment {
+  color: #5E6673;
+  font-style: italic;
+}
+
+.hlType {
+  color: #6DCDFF;
+}
+
+.hlAttribute {
+  color: #D9A7E8;
+}
+
+.terminalOutput {
+  background: #0B0D0E;
+  border-top: 1px solid #2A2E34;
+  padding: 1rem 2rem;
+  font-family: 'JetBrains Mono', 'Fira Code', monospace;
+  font-size: 0.78rem;
+  color: #8E95A3;
+  line-height: 1.7;
+}
+
+.terminalPrompt {
+  color: #B0E57C;
+}
+
+.terminalAnswer {
+  color: #EBEDF0;
+}
+
+.terminalCursor {
+  display: inline-block;
+  width: 7px;
+  height: 13px;
+  background-color: #AF788B;
+  vertical-align: middle;
+  margin-left: 4px;
+  animation: cursorBlink 1s step-end infinite;
+}
+
+@keyframes cursorBlink {
+  0%, 100% { opacity: 1; }
+  50% { opacity: 0; }
+}
+
+.installBar {
+  padding: 1rem 2rem;
+  background: #121417;
+  border-top: 1px solid #23262B;
   display: flex;
-  gap: 2rem;
-  max-width: 960px;
-  margin: 0 auto;
+  align-items: center;
+  justify-content: space-between;
+  flex-wrap: wrap;
+  gap: 0.75rem;
+}
+
+.installCommand {
+  font-family: 'JetBrains Mono', 'Fira Code', monospace;
+  font-size: 0.75rem;
+  color: #8E95A3;
+  background: #0B0D0E;
+  padding: 0.4rem 1rem;
+  border-radius: 8px;
+  border: 1px solid #23262B;
+}
+
+.installCommand span {
+  color: #AF788B;
 }
 
-.step {
-  flex: 1;
+.installBtn {
+  background: #AF788B;
+  border: none;
+  color: white;
+  font-size: 0.75rem;
+  font-weight: 500;
+  padding: 0.4rem 1.2rem;
+  border-radius: 20px;
+  cursor: pointer;
+  transition: background 0.15s;
+  font-family: 'Inter', -apple-system, BlinkMacSystemFont, sans-serif;
+}
+
+.installBtn:hover {
+  background: #9A6A7C;
+}
+
+/* ===== How It Works ===== */
+.workflowWrapper {
+  max-width: 100%;
+  padding: 0;
+  margin: 0 auto;
   text-align: center;
 }
 
-.stepNum {
-  display: inline-flex;
-  align-items: center;
+.workflowImg {
+  width: 100%;
+  height: auto;
+  display: block;
+  min-height: 520px;
+  object-fit: contain;
+}
+
+/* ===== Use Cases Slider ===== */
+.sliderOuter {
+  overflow: hidden;
+  width: 100%;
+  padding: 1rem 0;
+}
+
+.sliderTrack {
+  display: flex;
+  gap: 1.5rem;
+  transition: transform 0.45s cubic-bezier(0.2, 0.9, 0.4, 1.1);
+  will-change: transform;
+}
+
+.caseCard {
+  flex: 0 0 calc(65% - 0.75rem);
+  background: #121417;
+  border: 1px solid #23262B;
+  border-radius: 16px;
+  padding: 3rem 3rem 2.5rem;
+  opacity: 0.4;
+  transform: scale(0.94);
+  transition: all 0.35s ease;
+  filter: brightness(0.75);
+  min-height: 460px;
+  display: flex;
+  flex-direction: column;
   justify-content: center;
-  width: 48px;
-  height: 48px;
-  border-radius: 50%;
-  background: var(--primary);
-  color: #fff;
-  font-size: 1rem;
-  font-weight: 700;
-  margin-bottom: 1.25rem;
+  gap: 0.5rem;
 }
 
-.stepTitle {
-  font-size: 1.1rem;
+.caseCardActive {
+  opacity: 1;
+  transform: scale(1);
+  filter: brightness(1);
+  border-color: #AF788B;
+  box-shadow: 0 12px 40px rgba(175, 120, 139, 0.18);
+}
+
+.caseTitle {
+  font-size: 1.55rem;
   font-weight: 600;
-  margin: 0 0 0.5rem;
-  color: var(--text);
+  margin: 0 0 0.75rem;
+  color: #EBEDF0;
 }
 
-.stepDesc {
+.caseDesc {
+  color: #8E95A3;
+  font-size: 1.05rem;
+  line-height: 1.7;
+  margin: 0 0 1.75rem;
+}
+
+.caseQuery {
+  background: #0B0D0E;
+  border-radius: 12px;
+  padding: 1.5rem 1.75rem;
+  font-family: 'JetBrains Mono', 'Fira Code', monospace;
   font-size: 0.88rem;
-  line-height: 1.65;
+  color: #EBEDF0;
+  border: 1px solid #23262B;
+  line-height: 1.7;
+}
+
+.caseQueryLabel {
+  color: #AF788B;
+  font-weight: 600;
+  margin-bottom: 0.5rem;
+}
+
+.caseQueryText {
+  color: #EBEDF0;
+}
+
+.caseAnswer {
+  color: #8E95A3;
+  margin-top: 0.75rem;
+  padding-top: 0.75rem;
+  border-top: 1px solid #23262B;
+  font-size: 0.75rem;
+}
+
+.sliderNav {
+  display: flex;
+  justify-content: center;
+  align-items: center;
+  gap: 1rem;
+  margin-top: 2.5rem;
+}
+
+.sliderBtn {
+  background: var(--card-bg);
+  border: 1px solid var(--border);
   color: var(--text-light);
-  margin: 0;
+  font-size: 1.2rem;
+  width: 44px;
+  height: 44px;
+  border-radius: 44px;
+  display: inline-flex;
+  align-items: center;
+  justify-content: center;
+  cursor: pointer;
+  transition: all 0.2s;
+}
+
+.sliderBtn:hover {
+  border-color: var(--primary);
+  color: var(--primary-dark);
+  background: var(--primary-soft);
+}
+
+.sliderDots {
+  display: flex;
+  gap: 0.5rem;
+}
+
+.sliderDot {
+  width: 8px;
+  height: 8px;
+  border-radius: 8px;
+  background: var(--text-light);
+  border: none;
+  padding: 0;
+  cursor: pointer;
+  transition: all 0.25s;
+  opacity: 0.4;
+}
+
+.sliderDotActive {
+  width: 28px;
+  background: var(--primary);
+  opacity: 1;
 }
 
 /* ===== CTA ===== */
+.sectionCtaDark {
+  background: #0B0D0E;
+  padding: 3rem 1.5rem;
+}
+
 .ctaBox {
+  max-width: 880px;
+  margin: 0 auto;
   text-align: center;
   padding: 4rem 2rem;
-  border-radius: 16px;
-  background: var(--bg-secondary);
-  border: 1px solid var(--border);
 }
 
 .ctaTitle {
-  font-size: 2rem;
+  font-size: 2.5rem;
   font-weight: 700;
-  margin: 0 0 0.75rem;
+  letter-spacing: -0.02em;
+  margin: 0 0 1rem;
   color: var(--text);
 }
 
 .ctaDesc {
-  font-size: 1.1rem;
-  color: var(--text-light);
-  margin: 0 0 2rem;
+  font-size: 1.05rem;
+  color: #8E95A3;
+  max-width: 520px;
+  margin: 0 auto 2rem;
+  line-height: 1.6;
 }
 
-.ctaDesc code {
-  padding: 0.2em 0.5em;
-  border-radius: 4px;
-  background: var(--bg);
-  border: 1px solid var(--border);
-  font-size: 0.95rem;
-  color: var(--primary-dark);
+.ctaButtons {
+  display: flex;
+  justify-content: center;
+  gap: 1rem;
+  margin-bottom: 1.5rem;
+  flex-wrap: wrap;
+}
+
+.ctaBtnSecondary {
+  padding: 0.7rem 1.8rem;
+  border-radius: 40px;
+  font-weight: 600;
+  font-size: 0.88rem;
+  background: transparent;
+  border: 1px solid #23262B;
+  color: #EBEDF0;
+  text-decoration: none;
+  cursor: pointer;
+  transition: all 0.2s;
+  font-family: 'Inter', -apple-system, BlinkMacSystemFont, sans-serif;
+}
+
+.ctaBtnSecondary:hover {
+  border-color: #AF788B;
+  background: rgba(175, 120, 139, 0.12);
+  color: #AF788B;
+  text-decoration: none;
 }
 
-.ctaActions {
+.ctaInstallCards {
   display: flex;
-  gap: 0.75rem;
   justify-content: center;
+  gap: 1rem;
   flex-wrap: wrap;
+  margin-bottom: 2rem;
 }
 
-/* ===== Dark theme overrides ===== */
-[data-theme='dark'] .codePreview {
-  border-color: #313244;
-  box-shadow: 0 8px 32px rgba(0, 0, 0, 0.3);
+.ctaInstallItem {
+  background: #121417;
+  border: 1px solid #23262B;
+  border-radius: 12px;
+  padding: 0.65rem 1.25rem;
+  display: flex;
+  align-items: center;
+  gap: 1rem;
 }
 
-[data-theme='dark'] .card {
-  background: #181825;
-  border-color: #313244;
+.ctaInstallCommand {
+  font-family: 'JetBrains Mono', 'Fira Code', monospace;
+  font-size: 0.82rem;
+  color: #EBEDF0;
 }
 
-[data-theme='dark'] .card:hover {
-  border-color: var(--primary);
+.ctaInstallCommand span {
+  color: #AF788B;
+}
+
+.ctaCopyIcon {
+  background: transparent;
+  border: none;
+  color: #8E95A3;
+  cursor: pointer;
+  padding: 0.25rem 0.65rem;
+  border-radius: 6px;
+  font-size: 0.7rem;
+  font-family: 'Inter', sans-serif;
+  transition: all 0.15s;
+}
+
+.ctaCopyIcon:hover {
+  background: rgba(175, 120, 139, 0.12);
+  color: #AF788B;
+}
+
+/* ===== Dark theme overrides ===== */
+[data-theme='dark'] .heroTitleEmphasis {
+  color: var(--primary-light);
 }
 
-[data-theme='dark'] .cardIcon {
-  background: #1e1e2e;
+[data-theme='dark'] .heroTitleLight {
+  color: #6B7A8A;
 }
 
-[data-theme='dark'] .ctaBox {
-  background: #181825;
-  border-color: #313244;
+[data-theme='dark'] .heroTaglineHighlight {
+  color: var(--text);
 }
 
-[data-theme='dark'] .ctaDesc code {
-  background: #1e1e2e;
-  border-color: #313244;
+[data-theme='dark'] .card:hover {
+  border-color: var(--primary);
 }
 
 /* ===== Responsive ===== */
 @media screen and (max-width: 996px) {
   .heroBanner {
-    padding: 3rem 1.5rem 2.5rem;
+    padding: 6rem 1.5rem 4rem;
   }
 
-  .heroInner {
-    flex-direction: column;
-    gap: 2.5rem;
-  }
-
-  .heroLogo {
-    max-width: 240px;
+  .heroTitle {
+    font-size: 3.2rem;
   }
 
   .heroTagline {
-    font-size: 1rem;
+    font-size: 1.15rem;
   }
 
-  .codePreview {
-    flex: none;
-    max-width: 100%;
-    width: 100%;
-  }
-
-  .grid {
-    grid-template-columns: repeat(2, 1fr);
-  }
-
-  .steps {
-    flex-direction: column;
-    gap: 2.5rem;
+  .caseCard {
+    flex: 0 0 calc(70% - 0.75rem);
   }
 
   .section {
@@ -370,30 +687,36 @@
 
 @media screen and (max-width: 600px) {
   .heroBanner {
-    padding: 2rem 1rem 1.5rem;
+    padding: 4.5rem 1rem 3rem;
   }
 
-  .heroLogo {
-    max-width: 200px;
+  .heroTitle {
+    font-size: 2rem;
   }
 
   .heroActions {
     flex-direction: column;
+    align-items: center;
   }
 
   .buttonPrimary,
   .buttonSecondary {
     width: 100%;
     justify-content: center;
+    max-width: 280px;
+  }
+
+  .caseCard {
+    flex: 0 0 calc(90% - 0.75rem);
   }
 
-  .grid {
-    grid-template-columns: 1fr;
+  .demoPre {
+    font-size: 0.65rem;
   }
 
-  .ctaActions {
+  .installBar {
     flex-direction: column;
-    align-items: center;
+    align-items: flex-start;
   }
 
   .sectionTitle {
diff --git a/docs/src/pages/index.tsx b/docs/src/pages/index.tsx
index 83e3d697..c75abfd7 100644
--- a/docs/src/pages/index.tsx
+++ b/docs/src/pages/index.tsx
@@ -1,142 +1,238 @@
 import type {ReactNode} from 'react';
+import {useState, useMemo, useRef, useEffect, useCallback} from 'react';
 import useDocusaurusContext from '@docusaurus/useDocusaurusContext';
 import Layout from '@theme/Layout';
 import Heading from '@theme/Heading';
 import Link from '@docusaurus/Link';
-import useBaseUrl from '@docusaurus/useBaseUrl';
-import {Highlight, themes} from 'prism-react-renderer';
 
 import styles from './index.module.css';
 
 function HomepageHeader() {
-  const {siteConfig} = useDocusaurusContext();
   return (
     <header className={styles.heroBanner}>
       <div className={styles.heroInner}>
-        <div className={styles.heroContent}>
-          <img
-            className={styles.heroLogo}
-            src={useBaseUrl('img/with-title.png')}
-            alt={siteConfig.title}
-          />
-          <p className={styles.heroTagline}>
-            No vector database. No embeddings. No similarity search.<br />
-            Retrieve by reasoning, not by math.
-          </p>
-          <div className={styles.heroActions}>
-            <Link className={styles.buttonPrimary} to="/docs/intro">
-              Get Started
-            </Link>
-            <Link
-              className={styles.buttonSecondary}
-              href="https://github.com/vectorlessflow/vectorless"
-              target="_blank"
-              rel="noopener noreferrer">
-              GitHub
-            </Link>
-          </div>
+        <h1 className={styles.heroTitle}>
+          <span className={styles.heroTitleEmphasis}>Reason, </span>
+          <span className={styles.heroTitleLight}>don't vector</span>
+        </h1>
+        <p className={styles.heroTagline}>
+          <span className={styles.heroTaglineLine1}>
+            <span className={styles.heroTaglineHighlight}>Vectorless</span> will reason through any of your structured documents — <span className={styles.heroTaglineHighlight}>PDFs, Markdown, reports, contracts</span>,
+          </span>
+          <br />
+          <span className={styles.heroTaglineLine2}>and retrieve only what's relevant. <span className={styles.heroTaglineHighlight}>Nothing more, nothing less.</span></span>
+        </p>
+        <div className={styles.heroActions}>
+          <Link
+            className={styles.githubStarButton}
+            href="https://github.com/vectorlessflow/vectorless"
+            target="_blank"
+            rel="noopener noreferrer">
+            <svg stroke="currentColor" fill="currentColor" strokeWidth="0" viewBox="0 0 496 512" height="22" width="22" xmlns="http://www.w3.org/2000/svg"><path d="M165.9 397.4c0 2-2.3 3.6-5.2 3.6-3.3.3-5.6-1.3-5.6-3.6 0-2 2.3-3.6 5.2-3.6 3-.3 5.6 1.3 5.6 3.6zm-31.1-4.5c-.7 2 1.3 4.3 4.3 4.9 2.6 1 5.6 0 6.2-2s-1.3-4.3-4.3-5.2c-2.6-.7-5.5.3-6.2 2.3zm44.2-1.7c-2.9.7-4.9 2.6-4.6 4.9.3 2 2.9 3.3 5.9 2.6 2.9-.7 4.9-2.6 4.6-4.6-.3-1.9-3-3.2-5.9-2.9zM244.8 8C106.1 8 0 113.3 0 252c0 110.9 69.8 205.8 169.5 239.2 12.8 2.3 17.3-5.6 17.3-12.1 0-6.2-.3-40.4-.3-61.4 0 0-70 15-84.7-29.8 0 0-11.4-29.1-27.8-36.6 0 0-22.9-15.7 1.6-15.4 0 0 24.9 2 38.6 25.8 21.9 38.6 58.6 27.5 72.9 20.9 2.3-16 8.8-27.1 16-33.7-55.9-6.2-112.3-14.3-112.3-110.5 0-27.5 7.6-41.3 23.6-58.9-2.6-6.5-11.1-33.3 2.6-67.9 20.9-6.5 69 27 69 27 20-5.6 41.5-8.5 62.8-8.5s42.8 2.9 62.8 8.5c0 0 48.1-33.6 69-27 13.7 34.7 5.2 61.4 2.6 67.9 16 17.7 25.8 31.5 25.8 58.9 0 96.5-58.9 104.2-114.8 110.5 9.2 7.9 17 22.9 17 46.4 0 33.7-.3 75.4-.3 83.6 0 6.5 4.6 14.4 17.3 12.1C428.2 457.8 496 362.9 496 252 496 113.3 383.5 8 244.8 8zM97.2 352.9c-1.3 1-1 3.3.7 5.2 1.6 1.6 3.9 2.3 5.2 1 1.3-1 1-3.3-.7-5.2-1.6-1.6-3.9-2.3-5.2-1zm-10.8-8.1c-.7 1.3.3 2.9 2.3 3.9 1.6 1 3.6.7 4.3-.7.7-1.3-.3-2.9-2.3-3.9-2-.6-3.6-.3-4.3.7zm32.4 35.6c-1.6 1.3-1 4.3 1.3 6.2 2.3 2.3 5.2 2.6 6.5 1 1.3-1.3.7-4.3-1.3-6.2-2.2-2.3-5.2-2.6-6.5-1zm-11.4-14.7c-1.6 1-1.6 3.6 0 5.9 1.6 2.3 4.3 3.3 5.6 2.3 1.6-1.3 1.6-3.9 0-6.2-1.4-2.3-4-3.3-5.6-2z"></path></svg>
+            Star on GitHub
+            <svg className={styles.starIcon} stroke="currentColor" fill="currentColor" strokeWidth="0" viewBox="0 0 24 24" height="22" width="22" xmlns="http://www.w3.org/2000/svg"><path d="M16.6,20.463a1.5,1.5,0,0,1-.7-.174l-3.666-1.927a.5.5,0,0,0-.464,0L8.1,20.289a1.5,1.5,0,0,1-2.177-1.581l.7-4.082a.5.5,0,0,0-.143-.442L3.516,11.293a1.5,1.5,0,0,1,.832-2.559l4.1-.6a.5.5,0,0,0,.376-.273l1.833-3.714a1.5,1.5,0,0,1,2.69,0l1.833,3.714a.5.5,0,0,0,.376.274l4.1.6a1.5,1.5,0,0,1,.832,2.559l-2.965,2.891a.5.5,0,0,0-.144.442l.7,4.082A1.5,1.5,0,0,1,16.6,20.463Zm-3.9-2.986L16.364,19.4a.5.5,0,0,0,.725-.527l-.7-4.082a1.5,1.5,0,0,1,.432-1.328l2.965-2.89a.5.5,0,0,0-.277-.853l-4.1-.6a1.5,1.5,0,0,1-1.13-.821L12.449,4.594a.516.516,0,0,0-.9,0L9.719,8.308a1.5,1.5,0,0,1-1.13.82l-4.1.6a.5.5,0,0,0-.277.853L7.18,13.468A1.5,1.5,0,0,1,7.611,14.8l-.7,4.082a.5.5,0,0,0,.726.527L11.3,17.477a1.5,1.5,0,0,1,1.4,0Z"></path></svg>
+          </Link>
         </div>
+      </div>
+    </header>
+  );
+}
 
-        <div className={styles.codePreview}>
-          <div className={styles.codeHeader}>
-            <span className={styles.codeDots}>
-              <span /><span /><span />
-            </span>
-            <span className={styles.codeLang}>Python</span>
-          </div>
-          <Highlight theme={themes.dracula} code={`import asyncio
-from vectorless import Engine, IndexContext
+/* ---- Regex-based syntax highlighter ---- */
+function highlight(code: string, lang: 'python' | 'rust'): ReactNode[] {
+  // Each rule's regex must contain exactly ONE capture group, so that group i + 1 of the combined regex maps to rules[i]
+  const rules: {re: RegExp; cls: string}[] = lang === 'python'
+    ? [
+        {re: /(#.*)/g, cls: styles.hlComment},
+        {re: /("(?:[^"\\]|\\.)*")/g, cls: styles.hlString},
+        {re: /\b(import|from|async|def|await|return|as|with|for|in|if|else|None|True|False)\b/g, cls: styles.hlKeyword},
+        {re: /\b([A-Z][A-Za-z0-9_]*)\b/g, cls: styles.hlType},
+        {re: /\b([a-z_]\w*)\s*(?=\()/g, cls: styles.hlFunction},
+      ]
+    : [
+        {re: /(\/\/.*)/g, cls: styles.hlComment},
+        {re: /("(?:[^"\\]|\\.)*")/g, cls: styles.hlString},
+        {re: /\b(use|let|mut|fn|async|await|return|if|else|match|struct|impl|pub|mod|crate|self|super|where|for|in|loop|while|break|continue|move|ref|type|enum|trait|const|static|unsafe|extern)\b/g, cls: styles.hlKeyword},
+        {re: /\b([A-Z][A-Za-z0-9_]*)\b/g, cls: styles.hlType},
+        {re: /\b(\w+!)/g, cls: styles.hlFunction},
+        {re: /\b([a-z_]\w*)\s*(?=\()/g, cls: styles.hlFunction},
+        {re: /(#\[.*?\])/g, cls: styles.hlAttribute},
+      ];
+
+  // Build combined regex — join the single capture-group sources directly
+  const combined = rules.map(r => r.re.source).join('|');
+  const re = new RegExp(combined, 'gm');
+
+  const nodes: ReactNode[] = [];
+  let lastIdx = 0;
+  let m: RegExpExecArray | null;
+  re.lastIndex = 0;
+
+  while ((m = re.exec(code)) !== null) {
+    if (m.index > lastIdx) {
+      nodes.push(code.slice(lastIdx, m.index));
+    }
+    // m[1..rules.length] holds one capture group per rule; only the alternative that matched is defined
+    for (let i = 0; i < rules.length; i++) {
+      const captured = m[i + 1];
+      if (captured !== undefined) {
+        nodes.push(<span key={`${m.index}-${i}`} className={rules[i].cls}>{captured}</span>);
+        break;
+      }
+    }
+    lastIdx = re.lastIndex;
+  }
+  if (lastIdx < code.length) {
+    nodes.push(code.slice(lastIdx));
+  }
+  return nodes;
+}
+
+// Exact code from README
+const PYTHON_CODE = `import asyncio
+from vectorless import Engine, IndexContext, QueryContext
 
 async def main():
-    engine = Engine(
-        api_key="sk-...",
-        model="gpt-4o",
-    )
+    engine = Engine(api_key="sk-...", model="gpt-4o", endpoint="https://api.openai.com/v1")
 
     # Index a document
-    result = await engine.index(
-        IndexContext.from_path("./report.pdf")
-    )
+    result = await engine.index(IndexContext.from_path("./report.pdf"))
     doc_id = result.doc_id
 
-    # Query — LLM navigates the tree
+    # Query
     result = await engine.query(
-        doc_id, "What is the total revenue?"
+        QueryContext("What is the total revenue?").with_doc_ids([doc_id])
     )
     print(result.single().content)
 
-asyncio.run(main())`} language="python">
-            {({tokens, getLineProps, getTokenProps}) => (
-              <pre className={styles.codeBlock}>
-                <code>
-                  {tokens.map((line, i) => (
-                    <div key={i} {...getLineProps({line})}>
-                      {line.map((token, key) => (
-                        <span key={key} {...getTokenProps({token})} />
-                      ))}
-                    </div>
-                  ))}
-                </code>
-              </pre>
-            )}
-          </Highlight>
-        </div>
-      </div>
-    </header>
-  );
+asyncio.run(main())`;
+
+const RUST_CODE = `use vectorless::client::{EngineBuilder, IndexContext, QueryContext};
+
+#[tokio::main]
+async fn main() -> vectorless::Result<()> {
+    let engine = EngineBuilder::new()
+        .with_key("sk-...")
+        .with_model("gpt-4o")
+        .with_endpoint("https://api.openai.com/v1")
+        .build()
+        .await?;
+
+    // Index a document
+    let result = engine.index(IndexContext::from_path("./report.pdf")).await?;
+    let doc_id = result.doc_id().unwrap();
+
+    // Query
+    let result = engine.query(
+        QueryContext::new("What is the total revenue?")
+            .with_doc_ids(vec![doc_id.to_string()])
+    ).await?;
+    println!("{}", result.content);
+
+    Ok(())
+}`;
+
+function PythonCode() {
+  const nodes = useMemo(() => highlight(PYTHON_CODE, 'python'), []);
+  return <pre className={styles.demoPre}><code>{nodes}</code></pre>;
+}
+
+function RustCode() {
+  const nodes = useMemo(() => highlight(RUST_CODE, 'rust'), []);
+  return <pre className={styles.demoPre}><code>{nodes}</code></pre>;
 }
 
-function SectionWhy() {
-  const items = [
-    {
-      icon: '\u{1F9E0}',
-      title: 'Reasoning-Native',
-      desc: 'LLMs navigate hierarchical document trees with semantic understanding \u2014 not vector proximity.',
-    },
-    {
-      icon: '\u{1F5C2}\u{FE0F}',
-      title: 'No Vector Database',
-      desc: 'Eliminate embedding pipelines, vector stores, and similarity search entirely. Trees are the index.',
-    },
-    {
-      icon: '\u26A1',
-      title: 'Rust-Powered',
-      desc: 'Core engine in Rust with Python bindings. Arena-based trees, async I/O, and zero-copy traversal.',
-    },
-    {
-      icon: '\u{1F50D}',
-      title: 'Multi-Algorithm Search',
-      desc: 'Beam search, MCTS, and greedy algorithms with LLM-guided Pilot at key decision points.',
-    },
-    {
-      icon: '\u{1F4CA}',
-      title: 'Explainable Results',
-      desc: 'Full reasoning chain traces every navigation decision. Audit how and why content was retrieved.',
-    },
-    {
-      icon: '\u{1F4C4}',
-      title: 'PDF & Markdown',
-      desc: 'Index PDFs and Markdown out of the box. Hierarchical structure extracted automatically.',
-    },
-  ];
+function SectionGetStarted() {
+  const [activeTab, setActiveTab] = useState<'python' | 'rust'>('python');
+  const [copyLabel, setCopyLabel] = useState('Copy');
+  const [installLabel, setInstallLabel] = useState('Copy & install');
+
+  const installCmd = activeTab === 'python' ? 'pip install vectorless' : 'cargo add vectorless';
+
+  const handleCopy = () => {
+    const code = activeTab === 'python' ? PYTHON_CODE : RUST_CODE;
+    navigator.clipboard.writeText(code);
+    setCopyLabel('\u2713 Copied!');
+    setTimeout(() => setCopyLabel('Copy'), 1500);
+  };
+
+  const handleInstallCopy = () => {
+    navigator.clipboard.writeText(installCmd);
+    setInstallLabel('\u2713 Copied!');
+    setTimeout(() => setInstallLabel('Copy & install'), 1500);
+  };
 
   return (
     <section className={styles.section}>
       <div className={styles.sectionInner}>
         <Heading as="h2" className={styles.sectionTitle}>
-          Why Vectorless?
+          Get Started
         </Heading>
         <p className={styles.sectionSubtitle}>
-          RAG without the baggage.
+          Just a few lines of code to get up and running.
         </p>
-        <div className={styles.grid}>
-          {items.map((item, i) => (
-            <div key={i} className={styles.card}>
-              <span className={styles.cardIcon}>{item.icon}</span>
-              <Heading as="h3" className={styles.cardTitle}>{item.title}</Heading>
-              <p className={styles.cardDesc}>{item.desc}</p>
+        <div className={styles.demoCard}>
+          {/* Tabs */}
+          <div className={styles.demoTabs}>
+            <button
+              className={`${styles.demoTab} ${activeTab === 'python' ? styles.demoTabActive : ''}`}
+              onClick={() => { setActiveTab('python'); setCopyLabel('Copy'); }}>
+              Python
+            </button>
+            <button
+              className={`${styles.demoTab} ${activeTab === 'rust' ? styles.demoTabActive : ''}`}
+              onClick={() => { setActiveTab('rust'); setCopyLabel('Copy'); }}>
+              Rust
+            </button>
+          </div>
+
+          {/* Python panel */}
+          {activeTab === 'python' && (
+            <div className={styles.demoPanel}>
+              <div className={styles.demoCodeHeader}>
+                <div className={styles.windowDots}>
+                  <span className={`${styles.windowDot} ${styles.dotRed}`} />
+                  <span className={`${styles.windowDot} ${styles.dotYellow}`} />
+                  <span className={`${styles.windowDot} ${styles.dotGreen}`} />
+                </div>
+                <button className={styles.copyBtn} onClick={handleCopy}>{copyLabel}</button>
+              </div>
+              <PythonCode />
+              <div className={styles.terminalOutput}>
+                <span className={styles.terminalPrompt}>$</span> python demo.py<br />
+                <span className={styles.terminalAnswer}>&rarr; The total revenue for fiscal year 2024 was $2.3 billion, a 15% increase YoY.</span>
+                <span className={styles.terminalCursor} />
+              </div>
             </div>
-          ))}
+          )}
+
+          {/* Rust panel */}
+          {activeTab === 'rust' && (
+            <div className={styles.demoPanel}>
+              <div className={styles.demoCodeHeader}>
+                <div className={styles.windowDots}>
+                  <span className={`${styles.windowDot} ${styles.dotRed}`} />
+                  <span className={`${styles.windowDot} ${styles.dotYellow}`} />
+                  <span className={`${styles.windowDot} ${styles.dotGreen}`} />
+                </div>
+                <button className={styles.copyBtn} onClick={handleCopy}>{copyLabel}</button>
+              </div>
+              <RustCode />
+              <div className={styles.terminalOutput}>
+                <span className={styles.terminalPrompt}>$</span> cargo run<br />
+                <span className={styles.terminalAnswer}>&rarr; The total revenue for fiscal year 2024 was $2.3 billion, a 15% increase YoY.</span>
+                <span className={styles.terminalCursor} />
+              </div>
+            </div>
+          )}
+
+          {/* Install bar */}
+          <div className={styles.installBar}>
+            <div className={styles.installCommand}>
+              <span>$</span> {installCmd}
+            </div>
+            <button className={styles.installBtn} onClick={handleInstallCopy}>{installLabel}</button>
+          </div>
         </div>
       </div>
     </section>
@@ -144,28 +240,133 @@ function SectionWhy() {
 }
 
 function SectionHowItWorks() {
-  const steps = [
-    { num: '01', title: 'Index', desc: 'Parse documents into hierarchical semantic trees with LLM-generated summaries.' },
-    { num: '02', title: 'Navigate', desc: 'Pilot uses LLM to navigate the tree at key forks \u2014 beam search explores multiple paths in parallel.' },
-    { num: '03', title: 'Retrieve', desc: 'Evaluate sufficiency and backtrack if needed. Aggregate only the most relevant content within budget.' },
-  ];
+  return (
+    <section className={styles.section}>
+      <div className={styles.sectionInner}>
+        <Heading as="h2" className={styles.sectionTitle}>
+          How does Vectorless work?
+        </Heading>
+        <p className={styles.sectionSubtitle}>
+          You declare a few lines of code. We do everything else.
+        </p>
+        <div className={styles.workflowWrapper}>
+          <img src="/img/workflow.svg" alt="How Vectorless works" className={styles.workflowImg} />
+        </div>
+      </div>
+    </section>
+  );
+}
+
+const USE_CASES = [
+  {
+    title: 'Financial reports',
+    desc: 'Extract specific KPIs from 10\u2011K, annual reports, or earnings transcripts \u2014 even across fiscal years.',
+    query: '\u201cWhat was the net profit margin for Q3 2024?\u201d',
+    answer: '18.4%, up from 16.2% in Q3 2023. Source: Section 6.2, page 34.',
+  },
+  {
+    title: 'Legal & contracts',
+    desc: 'Locate clauses, definitions, or obligations across complex agreements without missing cross\u2011references.',
+    query: '\u201cWhich sections define \u2018force majeure\u2019 and what are the notice requirements?\u201d',
+    answer: 'Section 12.3(a) + 12.3(b) \u2014 30\u2011day written notice required.',
+  },
+  {
+    title: 'Technical docs',
+    desc: 'Navigate large API references, internal wikis, or on\u2011prem manuals with step\u2011by\u2011step reasoning.',
+    query: '\u201cHow to configure authentication for the WebSocket gateway?\u201d',
+    answer: 'See \u201cWebSocket Auth\u201d \u2192 section 4.2.1: use Authorization: Bearer <token>.',
+  },
+  {
+    title: 'Research papers',
+    desc: 'Cross\u2011reference findings, tables, or citations across arXiv preprints or internal literature.',
+    query: '\u201cWhat datasets were used for evaluation in Section 4?\u201d',
+    answer: 'Table 2: SQuAD, Natural Questions, and TriviaQA.',
+  },
+  {
+    title: 'Cross\u2011document analysis',
+    desc: 'Compare metrics, definitions, or timelines across multiple reports in one query.',
+    query: '\u201cCompare R&D spending from 2023 vs 2024 annual reports.\u201d',
+    answer: '2023: $12.4M (page 9) \u00b7 2024: $15.1M (page 11) \u2192 +21.8% YoY.',
+  },
+  {
+    title: 'Compliance & audit',
+    desc: 'Trace every retrieved statement back to its source \u2014 full explainability for regulated industries.',
+    query: '\u201cShow me all references to data retention policy.\u201d',
+    answer: 'Section 3.2 (page 8), Section 5.1 (page 14), and Appendix B.',
+  },
+];
+
+function SectionUseCases() {
+  const [current, setCurrent] = useState(0);
+  const outerRef = useRef<HTMLDivElement>(null);
+  const trackRef = useRef<HTMLDivElement>(null);
+  const [offset, setOffset] = useState(0);
+
+  const total = USE_CASES.length;
+
+  const measure = useCallback(() => {
+    if (!outerRef.current || !trackRef.current) return;
+    const outerW = outerRef.current.offsetWidth;
+    const firstCard = trackRef.current.children[0] as HTMLElement;
+    if (!firstCard) return;
+    const cardW = firstCard.offsetWidth;
+    const gap = 24; // 1.5rem
+    const step = cardW + gap;
+    const newOffset = outerW / 2 - current * step - cardW / 2;
+    setOffset(newOffset);
+  }, [current]);
+
+  useEffect(() => {
+    measure();
+    window.addEventListener('resize', measure);
+    return () => window.removeEventListener('resize', measure);
+  }, [measure]);
+
+  const prev = () => setCurrent(i => Math.max(0, i - 1));
+  const next = () => setCurrent(i => Math.min(total - 1, i + 1));
 
   return (
-    <section className={`${styles.section} ${styles.sectionAlt}`}>
+    <section className={styles.section}>
       <div className={styles.sectionInner}>
         <Heading as="h2" className={styles.sectionTitle}>
-          How It Works
+          Use cases &middot; precision reasoning
         </Heading>
-        <div className={styles.steps}>
-          {steps.map((step, i) => (
-            <div key={i} className={styles.step}>
-              <div className={styles.stepNum}>{step.num}</div>
-              <div className={styles.stepBody}>
-                <Heading as="h3" className={styles.stepTitle}>{step.title}</Heading>
-                <p className={styles.stepDesc}>{step.desc}</p>
+        <p className={styles.sectionSubtitle}>
+          Vectorless navigates through the structure of any document to retrieve exact context.
+        </p>
+        <div className={styles.sliderOuter} ref={outerRef}>
+          <div
+            className={styles.sliderTrack}
+            ref={trackRef}
+            style={{transform: `translateX(${offset}px)`}}>
+            {USE_CASES.map((c, i) => (
+              <div
+                key={i}
+                className={`${styles.caseCard} ${i === current ? styles.caseCardActive : ''}`}>
+                <Heading as="h3" className={styles.caseTitle}>{c.title}</Heading>
+                <p className={styles.caseDesc}>{c.desc}</p>
+                <div className={styles.caseQuery}>
+                  <div className={styles.caseQueryLabel}>Query:</div>
+                  <div className={styles.caseQueryText}>{c.query}</div>
+                  <div className={styles.caseAnswer}>{c.answer}</div>
+                </div>
               </div>
-            </div>
-          ))}
+            ))}
+          </div>
+        </div>
+        <div className={styles.sliderNav}>
+          <button className={styles.sliderBtn} onClick={prev} aria-label="Previous">&larr;</button>
+          <div className={styles.sliderDots}>
+            {USE_CASES.map((_, i) => (
+              <button
+                key={i}
+                className={`${styles.sliderDot} ${i === current ? styles.sliderDotActive : ''}`}
+                onClick={() => setCurrent(i)}
+                aria-label={`Go to slide ${i + 1}`}
+              />
+            ))}
+          </div>
+          <button className={styles.sliderBtn} onClick={next} aria-label="Next">&rarr;</button>
         </div>
       </div>
     </section>
@@ -173,28 +374,49 @@ function SectionHowItWorks() {
 }
 
 function SectionCTA() {
+  const [pipLabel, setPipLabel] = useState('Copy');
+  const [cargoLabel, setCargoLabel] = useState('Copy');
+
+  const handlePipCopy = () => {
+    navigator.clipboard.writeText('pip install vectorless');
+    setPipLabel('\u2713');
+    setTimeout(() => setPipLabel('Copy'), 1500);
+  };
+
+  const handleCargoCopy = () => {
+    navigator.clipboard.writeText('cargo add vectorless');
+    setCargoLabel('\u2713');
+    setTimeout(() => setCargoLabel('Copy'), 1500);
+  };
+
   return (
     <section className={styles.section}>
       <div className={styles.sectionInner}>
         <div className={styles.ctaBox}>
           <Heading as="h2" className={styles.ctaTitle}>
-            Start building in minutes
+            Start reasoning, not vectoring
           </Heading>
-          <p className={styles.ctaDesc}>
-            <code>pip install vectorless</code>
-          </p>
-          <div className={styles.ctaActions}>
-            <Link className={styles.buttonPrimary} to="/docs/intro">
-              Read the Docs
-            </Link>
+          <div className={styles.ctaButtons}>
             <Link
-              className={styles.buttonSecondary}
+              className={styles.githubStarButton}
               href="https://github.com/vectorlessflow/vectorless"
               target="_blank"
               rel="noopener noreferrer">
-              View on GitHub
+              <svg stroke="currentColor" fill="currentColor" strokeWidth="0" viewBox="0 0 496 512" height="22" width="22" xmlns="http://www.w3.org/2000/svg"><path d="M165.9 397.4c0 2-2.3 3.6-5.2 3.6-3.3.3-5.6-1.3-5.6-3.6 0-2 2.3-3.6 5.2-3.6 3-.3 5.6 1.3 5.6 3.6zm-31.1-4.5c-.7 2 1.3 4.3 4.3 4.9 2.6 1 5.6 0 6.2-2s-1.3-4.3-4.3-5.2c-2.6-.7-5.5.3-6.2 2.3zm44.2-1.7c-2.9.7-4.9 2.6-4.6 4.9.3 2 2.9 3.3 5.9 2.6 2.9-.7 4.9-2.6 4.6-4.6-.3-1.9-3-3.2-5.9-2.9zM244.8 8C106.1 8 0 113.3 0 252c0 110.9 69.8 205.8 169.5 239.2 12.8 2.3 17.3-5.6 17.3-12.1 0-6.2-.3-40.4-.3-61.4 0 0-70 15-84.7-29.8 0 0-11.4-29.1-27.8-36.6 0 0-22.9-15.7 1.6-15.4 0 0 24.9 2 38.6 25.8 21.9 38.6 58.6 27.5 72.9 20.9 2.3-16 8.8-27.1 16-33.7-55.9-6.2-112.3-14.3-112.3-110.5 0-27.5 7.6-41.3 23.6-58.9-2.6-6.5-11.1-33.3 2.6-67.9 20.9-6.5 69 27 69 27 20-5.6 41.5-8.5 62.8-8.5s42.8 2.9 62.8 8.5c0 0 48.1-33.6 69-27 13.7 34.7 5.2 61.4 2.6 67.9 16 17.7 25.8 31.5 25.8 58.9 0 96.5-58.9 104.2-114.8 110.5 9.2 7.9 17 22.9 17 46.4 0 33.7-.3 75.4-.3 83.6 0 6.5 4.6 14.4 17.3 12.1C428.2 457.8 496 362.9 496 252 496 113.3 383.5 8 244.8 8zM97.2 352.9c-1.3 1-1 3.3.7 5.2 1.6 1.6 3.9 2.3 5.2 1 1.3-1 1-3.3-.7-5.2-1.6-1.6-3.9-2.3-5.2-1zm-10.8-8.1c-.7 1.3.3 2.9 2.3 3.9 1.6 1 3.6.7 4.3-.7.7-1.3-.3-2.9-2.3-3.9-2-.6-3.6-.3-4.3.7zm32.4 35.6c-1.6 1.3-1 4.3 1.3 6.2 2.3 2.3 5.2 2.6 6.5 1 1.3-1.3.7-4.3-1.3-6.2-2.2-2.3-5.2-2.6-6.5-1zm-11.4-14.7c-1.6 1-1.6 3.6 0 5.9 1.6 2.3 4.3 3.3 5.6 2.3 1.6-1.3 1.6-3.9 0-6.2-1.4-2.3-4-3.3-5.6-2z"></path></svg>
+              Star on GitHub
+              <svg className={styles.starIcon} stroke="currentColor" fill="currentColor" strokeWidth="0" viewBox="0 0 24 24" height="22" width="22" xmlns="http://www.w3.org/2000/svg"><path d="M16.6,20.463a1.5,1.5,0,0,1-.7-.174l-3.666-1.927a.5.5,0,0,0-.464,0L8.1,20.289a1.5,1.5,0,0,1-2.177-1.581l.7-4.082a.5.5,0,0,0-.143-.442L3.516,11.293a1.5,1.5,0,0,1,.832-2.559l4.1-.6a.5.5,0,0,0,.376-.273l1.833-3.714a1.5,1.5,0,0,1,2.69,0l1.833,3.714a.5.5,0,0,0,.376.274l4.1.6a1.5,1.5,0,0,1,.832,2.559l-2.965,2.891a.5.5,0,0,0-.144.442l.7,4.082A1.5,1.5,0,0,1,16.6,20.463Zm-3.9-2.986L16.364,19.4a.5.5,0,0,0,.725-.527l-.7-4.082a1.5,1.5,0,0,1,.432-1.328l2.965-2.89a.5.5,0,0,0-.277-.853l-4.1-.6a1.5,1.5,0,0,1-1.13-.821L12.449,4.594a.516.516,0,0,0-.9,0L9.719,8.308a1.5,1.5,0,0,1-1.13.82l-4.1.6a.5.5,0,0,0-.277.853L7.18,13.468A1.5,1.5,0,0,1,7.611,14.8l-.7,4.082a.5.5,0,0,0,.726.527L11.3,17.477a1.5,1.5,0,0,1,1.4,0Z"></path></svg>
             </Link>
           </div>
+          <div className={styles.ctaInstallCards}>
+            <div className={styles.ctaInstallItem}>
+              <div className={styles.ctaInstallCommand}><span>$</span> pip install vectorless</div>
+              <button className={styles.ctaCopyIcon} onClick={handlePipCopy}>{pipLabel}</button>
+            </div>
+            <div className={styles.ctaInstallItem}>
+              <div className={styles.ctaInstallCommand}><span>$</span> cargo add vectorless</div>
+              <button className={styles.ctaCopyIcon} onClick={handleCargoCopy}>{cargoLabel}</button>
+            </div>
+          </div>
         </div>
       </div>
     </section>
@@ -209,8 +431,9 @@ export default function Home(): ReactNode {
       description="Reasoning-native document intelligence engine. No vector database, no embeddings. Retrieve by reasoning.">
       <HomepageHeader />
       <main>
-        <SectionWhy />
+        <SectionGetStarted />
         <SectionHowItWorks />
+        <SectionUseCases />
         <SectionCTA />
       </main>
     </Layout>
diff --git a/docs/src/theme/Navbar/index.tsx b/docs/src/theme/Navbar/index.tsx
index 35abb2a6..2437b65e 100644
--- a/docs/src/theme/Navbar/index.tsx
+++ b/docs/src/theme/Navbar/index.tsx
@@ -26,6 +26,7 @@ export default function Navbar(): React.ReactElement {
               alt={logo?.alt || title}
             />
           </Link>
+        <div className={styles.logo}>Vectorless</div>
         </div>
         <div className={styles.navbarCenter}>
           {leftItems.map((item, i) => <NavbarItem {...(item as NavbarItemConfig)} key={i} />)}
diff --git a/docs/src/theme/Navbar/styles.module.css b/docs/src/theme/Navbar/styles.module.css
index c8d5283d..9e3c803e 100644
--- a/docs/src/theme/Navbar/styles.module.css
+++ b/docs/src/theme/Navbar/styles.module.css
@@ -27,10 +27,17 @@
 }
 
 .navbarLogo {
-  height: 32px;
+  height: 40px;
   width: auto;
 }
 
+.logo {
+  font-size: 1.6rem;
+  font-weight: 800;
+  letter-spacing: -0.02em;
+  color: var(--primary);
+}
+
 /* Center: navigation links */
 .navbarCenter {
   flex: 1;
diff --git a/pyproject.toml b/pyproject.toml
index f752a6ea..9d83bdd6 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -4,7 +4,7 @@ build-backend = "maturin"
 
 [project]
 name = "vectorless"
-version = "0.1.7"
+version = "0.1.8"
 description = "Reasoning-native document intelligence engine for AI"
 readme = "README.md"
 requires-python = ">=3.9"
diff --git a/python/src/config.rs b/python/src/config.rs
new file mode 100644
index 00000000..93a0552e
--- /dev/null
+++ b/python/src/config.rs
@@ -0,0 +1,86 @@
+// Copyright (c) 2026 vectorless developers
+// SPDX-License-Identifier: Apache-2.0
+
+//! Config Python wrapper.
+
+use pyo3::prelude::*;
+
+/// Advanced configuration for Engine internals.
+///
+/// Create a Config to customize storage, retrieval, concurrency,
+/// and other engine parameters beyond the basic builder API.
+///
+/// Example:
+///
+/// ```python
+/// from vectorless import Config, Engine
+///
+/// config = Config()
+/// config.set_workspace_dir("/data/vectorless")
+/// config.set_top_k(10)
+/// config.set_max_concurrent_requests(20)
+///
+/// engine = Engine(api_key="sk-...", model="gpt-4o", config=config)
+/// ```
+#[pyclass(name = "Config")]
+pub struct PyConfig {
+    pub(crate) inner: vectorless::Config,
+}
+
+#[pymethods]
+impl PyConfig {
+    /// Create a new Config with defaults.
+    #[new]
+    fn new() -> Self {
+        Self {
+            inner: vectorless::Config::default(),
+        }
+    }
+
+    /// Set the workspace directory for persisted documents.
+    ///
+    /// Default: ~/.vectorless
+    fn set_workspace_dir(&mut self, dir: &str) {
+        self.inner.storage.workspace_dir = std::path::PathBuf::from(dir);
+    }
+
+    /// Set how many results (top-k) to return from queries.
+    ///
+    /// Default: 3
+    fn set_top_k(&mut self, k: usize) {
+        self.inner.retrieval.top_k = k;
+    }
+
+    /// Set the maximum concurrent LLM API calls.
+    ///
+    /// Default: 10
+    fn set_max_concurrent_requests(&mut self, max: usize) {
+        self.inner.concurrency.max_concurrent_requests = max;
+    }
+
+    /// Set the rate limit (requests per minute).
+    ///
+    /// Default: 500
+    fn set_requests_per_minute(&mut self, rpm: usize) {
+        self.inner.concurrency.requests_per_minute = rpm;
+    }
+
+    /// Set the maximum number of iterations for retrieval search.
+    fn set_max_iterations(&mut self, max: usize) {
+        self.inner.retrieval.search.max_iterations = max;
+    }
+
+    /// Set the retrieval temperature.
+    ///
+    /// Default: 0.0
+    fn set_temperature(&mut self, temp: f32) {
+        self.inner.retrieval.temperature = temp;
+    }
+
+    /// Enable or disable metrics collection.
+    ///
+    /// Default: True
+    fn set_metrics_enabled(&mut self, enabled: bool) {
+        self.inner.metrics.enabled = enabled;
+    }
+}
diff --git a/python/src/context.rs b/python/src/context.rs
new file mode 100644
index 00000000..3eedc6f9
--- /dev/null
+++ b/python/src/context.rs
@@ -0,0 +1,288 @@
+// Copyright (c) 2026 vectorless developers
+// SPDX-License-Identifier: Apache-2.0
+
+//! IndexContext, QueryContext, and IndexOptions Python wrappers.
+
+use pyo3::prelude::*;
+
+use ::vectorless::client::{DocumentFormat, IndexContext, IndexMode, IndexOptions, QueryContext};
+
+use super::error::VectorlessError;
+
+/// Translate a user-supplied format name into a `DocumentFormat`.
+///
+/// The name is lowercased before matching, so the comparison is
+/// case-insensitive. Accepted names are `markdown`, `md` and `pdf`; anything
+/// else yields a `VectorlessError` of kind `"config"` that echoes the
+/// original (un-lowercased) input.
+fn parse_format(format: &str) -> PyResult<DocumentFormat> {
+    let normalized = format.to_lowercase();
+    if normalized == "pdf" {
+        return Ok(DocumentFormat::Pdf);
+    }
+    if matches!(normalized.as_str(), "markdown" | "md") {
+        return Ok(DocumentFormat::Markdown);
+    }
+
+    let message = format!("Unknown format: {}. Supported: markdown, pdf", format);
+    Err(VectorlessError::new(message, "config").into())
+}
+
+// ============================================================
+// IndexOptions
+// ============================================================
+
+/// Knobs that control how a document is indexed.
+///
+/// Args:
+///     mode: Indexing mode, one of "default", "force" or "incremental".
+///         Default: "default".
+///     generate_summaries: Whether to generate summaries. Default: True.
+///     generate_description: Whether to generate a document description.
+///         Default: False.
+///     include_text: Whether to include node text in the tree. Default: True.
+///     generate_ids: Whether to generate node IDs. Default: True.
+///     enable_synonym_expansion: Whether to expand keywords with LLM-generated
+///         synonyms during indexing. Default: False.
+///
+/// Raises:
+///     VectorlessError: If `mode` is not one of the supported names
+///         (the match is case-sensitive).
+#[pyclass(name = "IndexOptions", skip_from_py_object)]
+#[derive(Clone)]
+pub struct PyIndexOptions {
+    pub(crate) inner: IndexOptions,
+}
+
+#[pymethods]
+impl PyIndexOptions {
+    /// Build the options from keyword arguments; see the class docs for the
+    /// meaning and default of each argument.
+    #[new]
+    #[pyo3(signature = (mode="default", generate_summaries=true, generate_description=false, include_text=true, generate_ids=true, enable_synonym_expansion=false))]
+    fn new(
+        mode: &str,
+        generate_summaries: bool,
+        generate_description: bool,
+        include_text: bool,
+        generate_ids: bool,
+        enable_synonym_expansion: bool,
+    ) -> PyResult<Self> {
+        let base = IndexOptions::new();
+        // "default" keeps whatever mode `IndexOptions::new()` starts with.
+        let mut opts = match mode {
+            "default" => base,
+            "force" => base.with_mode(IndexMode::Force),
+            "incremental" => base.with_mode(IndexMode::Incremental),
+            unknown => {
+                let message = format!(
+                    "Unknown mode: {}. Supported: default, force, incremental",
+                    unknown
+                );
+                return Err(VectorlessError::new(message, "config").into());
+            }
+        };
+
+        opts.generate_summaries = generate_summaries;
+        opts.generate_description = generate_description;
+        opts.include_text = include_text;
+        opts.generate_ids = generate_ids;
+        opts.enable_synonym_expansion = enable_synonym_expansion;
+
+        Ok(Self { inner: opts })
+    }
+
+    /// Render every option in constructor-like form.
+    fn __repr__(&self) -> String {
+        let opts = &self.inner;
+        let mode_label = match opts.mode {
+            IndexMode::Default => "default",
+            IndexMode::Force => "force",
+            IndexMode::Incremental => "incremental",
+        };
+        format!(
+            "IndexOptions(mode='{}', generate_summaries={}, generate_description={}, include_text={}, generate_ids={}, enable_synonym_expansion={})",
+            mode_label,
+            opts.generate_summaries,
+            opts.generate_description,
+            opts.include_text,
+            opts.generate_ids,
+            opts.enable_synonym_expansion,
+        )
+    }
+}
+
+// ============================================================
+// IndexContext
+// ============================================================
+
+/// Describes what should be indexed.
+///
+/// Instances are created through the static constructors; the `with_*`
+/// methods return a new, modified context and leave the receiver untouched:
+///
+/// ```python
+/// from vectorless import IndexContext
+///
+/// # Single file
+/// ctx = IndexContext.from_path("./document.pdf")
+///
+/// # Multiple files
+/// ctx = IndexContext.from_paths(["./a.pdf", "./b.md"])
+///
+/// # Directory
+/// ctx = IndexContext.from_dir("./docs/")
+///
+/// # From text
+/// ctx = IndexContext.from_content("# Title\\nContent...", "markdown").with_name("doc")
+///
+/// # From bytes
+/// ctx = IndexContext.from_bytes(data, "pdf").with_name("doc")
+/// ```
+#[pyclass(name = "IndexContext")]
+pub struct PyIndexContext {
+    pub(crate) inner: IndexContext,
+}
+
+#[pymethods]
+impl PyIndexContext {
+    /// Build a context that refers to one file path.
+    #[staticmethod]
+    fn from_path(path: String) -> Self {
+        let inner = IndexContext::from_path(&path);
+        Self { inner }
+    }
+
+    /// Build a context that refers to several file paths.
+    #[staticmethod]
+    fn from_paths(paths: Vec<String>) -> Self {
+        let inner = IndexContext::from_paths(&paths);
+        Self { inner }
+    }
+
+    /// Build a context from the supported files found in a directory.
+    ///
+    /// Args:
+    ///     path: Directory path to scan.
+    ///     recursive: If True, scan subdirectories recursively. Default: False.
+    #[staticmethod]
+    #[pyo3(signature = (path, recursive=false))]
+    fn from_dir(path: String, recursive: bool) -> Self {
+        Self {
+            inner: IndexContext::from_dir(&path, recursive),
+        }
+    }
+
+    /// Build a context from in-memory text.
+    ///
+    /// Args:
+    ///     content: The document text.
+    ///     format: "markdown" / "md" or "pdf" (case-insensitive).
+    ///         Default: "markdown".
+    ///
+    /// Raises:
+    ///     VectorlessError: If `format` is not recognised.
+    #[staticmethod]
+    #[pyo3(signature = (content, format="markdown"))]
+    fn from_content(content: String, format: &str) -> PyResult<Self> {
+        parse_format(format).map(|doc_format| Self {
+            inner: IndexContext::from_content(&content, doc_format),
+        })
+    }
+
+    /// Build a context from in-memory binary data.
+    ///
+    /// Args:
+    ///     data: Raw document bytes.
+    ///     format: "markdown" / "md" or "pdf" (case-insensitive).
+    ///
+    /// Raises:
+    ///     VectorlessError: If `format` is not recognised.
+    #[staticmethod]
+    fn from_bytes(data: Vec<u8>, format: &str) -> PyResult<Self> {
+        parse_format(format).map(|doc_format| Self {
+            inner: IndexContext::from_bytes(data, doc_format),
+        })
+    }
+
+    /// Return a copy of this context with the document name set
+    /// (single-source only).
+    fn with_name(&self, name: String) -> Self {
+        Self {
+            inner: self.inner.clone().with_name(&name),
+        }
+    }
+
+    /// Return a copy of this context with the given indexing options applied.
+    fn with_options(&self, options: &PyIndexOptions) -> Self {
+        let opts = options.inner.clone();
+        Self {
+            inner: self.inner.clone().with_options(opts),
+        }
+    }
+
+    /// Return a copy of this context with the indexing mode set.
+    ///
+    /// Args:
+    ///     mode: "default", "force" or "incremental" (case-sensitive).
+    ///
+    /// Raises:
+    ///     VectorlessError: If `mode` is not one of the supported names.
+    fn with_mode(&self, mode: &str) -> PyResult<Self> {
+        let parsed = match mode {
+            "default" => IndexMode::Default,
+            "force" => IndexMode::Force,
+            "incremental" => IndexMode::Incremental,
+            unknown => {
+                let message = format!(
+                    "Unknown mode: {}. Supported: default, force, incremental",
+                    unknown
+                );
+                return Err(VectorlessError::new(message, "config").into());
+            }
+        };
+        Ok(Self {
+            inner: self.inner.clone().with_mode(parsed),
+        })
+    }
+
+    /// Number of document sources held by this context.
+    fn __len__(&self) -> usize {
+        let ctx = &self.inner;
+        ctx.len()
+    }
+
+    /// True when the context holds no sources.
+    fn is_empty(&self) -> bool {
+        let ctx = &self.inner;
+        ctx.is_empty()
+    }
+
+    /// Short representation showing only the number of sources.
+    fn __repr__(&self) -> String {
+        let source_count = self.inner.len();
+        format!("IndexContext(sources={})", source_count)
+    }
+}
+
+// ============================================================
+// QueryContext
+// ============================================================
+
+/// Describes a query: its text, scope and result options.
+///
+/// Every `with_*` method returns a new context built from a clone of the
+/// receiver, so calls can be chained.
+///
+/// ```python
+/// from vectorless import QueryContext
+///
+/// # Query specific documents
+/// ctx = QueryContext("What is the total revenue?").with_doc_ids([doc_id])
+///
+/// # Query multiple documents
+/// ctx = QueryContext("What is the architecture?").with_doc_ids(["doc-1", "doc-2"])
+///
+/// # Query entire workspace
+/// ctx = QueryContext("Explain the algorithm")
+/// ```
+#[pyclass(name = "QueryContext")]
+pub struct PyQueryContext {
+    pub(crate) inner: QueryContext,
+}
+
+#[pymethods]
+impl PyQueryContext {
+    /// Start a query context for `query` (defaults to workspace scope).
+    #[new]
+    fn new(query: String) -> Self {
+        let inner = QueryContext::new(&query);
+        Self { inner }
+    }
+
+    /// Return a copy scoped to the given document IDs.
+    fn with_doc_ids(&self, doc_ids: Vec<String>) -> Self {
+        Self {
+            inner: self.inner.clone().with_doc_ids(doc_ids),
+        }
+    }
+
+    /// Return a copy scoped to the entire workspace.
+    fn with_workspace(&self) -> Self {
+        Self {
+            inner: self.inner.clone().with_workspace(),
+        }
+    }
+
+    /// Return a copy with the maximum token count for the result content set.
+    fn with_max_tokens(&self, tokens: usize) -> Self {
+        Self {
+            inner: self.inner.clone().with_max_tokens(tokens),
+        }
+    }
+
+    /// Return a copy that does or does not include the reasoning chain.
+    fn with_include_reasoning(&self, include: bool) -> Self {
+        Self {
+            inner: self.inner.clone().with_include_reasoning(include),
+        }
+    }
+
+    /// Return a copy with the maximum tree traversal depth set.
+    fn with_depth_limit(&self, depth: usize) -> Self {
+        Self {
+            inner: self.inner.clone().with_depth_limit(depth),
+        }
+    }
+
+    /// Fixed placeholder representation; no field is rendered.
+    fn __repr__(&self) -> String {
+        String::from("QueryContext(...)")
+    }
+}
diff --git a/python/src/document.rs b/python/src/document.rs
new file mode 100644
index 00000000..eee70c0e
--- /dev/null
+++ b/python/src/document.rs
@@ -0,0 +1,59 @@
+// Copyright (c) 2026 vectorless developers
+// SPDX-License-Identifier: Apache-2.0
+
+//! DocumentInfo Python wrapper.
+
+use pyo3::prelude::*;
+
+use ::vectorless::client::DocumentInfo;
+
+/// Read-only view of the metadata recorded for an indexed document.
+#[pyclass(name = "DocumentInfo")]
+pub struct PyDocumentInfo {
+    pub(crate) inner: DocumentInfo,
+}
+
+#[pymethods]
+impl PyDocumentInfo {
+    /// Document ID.
+    #[getter]
+    fn id(&self) -> &str {
+        let info = &self.inner;
+        &info.id
+    }
+
+    /// Document name.
+    #[getter]
+    fn name(&self) -> &str {
+        let info = &self.inner;
+        &info.name
+    }
+
+    /// Document format, as a string.
+    #[getter]
+    fn format(&self) -> &str {
+        let info = &self.inner;
+        &info.format
+    }
+
+    /// Document description, or None when absent.
+    #[getter]
+    fn description(&self) -> Option<&str> {
+        let info = &self.inner;
+        info.description.as_deref()
+    }
+
+    /// Source path, or None when absent.
+    #[getter]
+    fn source_path(&self) -> Option<&str> {
+        let info = &self.inner;
+        info.source_path.as_deref()
+    }
+
+    /// Page count, or None when absent.
+    #[getter]
+    fn page_count(&self) -> Option<usize> {
+        let info = &self.inner;
+        info.page_count
+    }
+
+    /// Line count, or None when absent.
+    #[getter]
+    fn line_count(&self) -> Option<usize> {
+        let info = &self.inner;
+        info.line_count
+    }
+
+    /// Representation showing id, name and format.
+    fn __repr__(&self) -> String {
+        let DocumentInfo {
+            id, name, format, ..
+        } = &self.inner;
+        format!(
+            "DocumentInfo(id='{}', name='{}', format='{}')",
+            id, name, format
+        )
+    }
+}
diff --git a/python/src/engine.rs b/python/src/engine.rs
new file mode 100644
index 00000000..8f7dc015
--- /dev/null
+++ b/python/src/engine.rs
@@ -0,0 +1,242 @@
+// Copyright (c) 2026 vectorless developers
+// SPDX-License-Identifier: Apache-2.0
+
+//! Engine Python wrapper and async helpers.
+
+use pyo3::prelude::*;
+use pyo3_async_runtimes::tokio::future_into_py;
+use std::sync::Arc;
+use tokio::runtime::Runtime;
+
+use ::vectorless::client::{Engine, EngineBuilder, IndexContext, QueryContext};
+
+use super::config::PyConfig;
+use super::context::{PyIndexContext, PyQueryContext};
+use super::document::PyDocumentInfo;
+use super::error::VectorlessError;
+use super::error::to_py_err;
+use super::graph::PyDocumentGraph;
+use super::metrics::PyMetricsReport;
+use super::results::{PyIndexResult, PyQueryResult};
+
+// ============================================================
+// Engine async helpers (named functions to avoid FnOnce HRTB issue)
+// ============================================================
+
+/// Await `Engine::index` for `ctx`, wrapping the result for Python and
+/// converting any engine error with `to_py_err`.
+async fn run_index(engine: Arc<Engine>, ctx: IndexContext) -> PyResult<PyIndexResult> {
+    engine
+        .index(ctx)
+        .await
+        .map(|inner| PyIndexResult { inner })
+        .map_err(to_py_err)
+}
+
+/// Await `Engine::query` for `ctx`, wrapping the result for Python and
+/// converting any engine error with `to_py_err`.
+async fn run_query(engine: Arc<Engine>, ctx: QueryContext) -> PyResult<PyQueryResult> {
+    engine
+        .query(ctx)
+        .await
+        .map(|inner| PyQueryResult { inner })
+        .map_err(to_py_err)
+}
+
+/// Await `Engine::list` and wrap every returned document in a
+/// `PyDocumentInfo`; engine errors are converted with `to_py_err`.
+async fn run_list(engine: Arc<Engine>) -> PyResult<Vec<PyDocumentInfo>> {
+    match engine.list().await {
+        Ok(docs) => Ok(docs
+            .into_iter()
+            .map(|inner| PyDocumentInfo { inner })
+            .collect()),
+        Err(e) => Err(to_py_err(e)),
+    }
+}
+
+/// Await `Engine::remove` for `doc_id`, forwarding its boolean result and
+/// converting any engine error with `to_py_err`.
+async fn run_remove(engine: Arc<Engine>, doc_id: String) -> PyResult<bool> {
+    let outcome = engine.remove(&doc_id).await;
+    outcome.map_err(to_py_err)
+}
+
+/// Await `Engine::clear`, forwarding the count it returns and converting any
+/// engine error with `to_py_err`.
+async fn run_clear(engine: Arc<Engine>) -> PyResult<usize> {
+    let outcome = engine.clear().await;
+    outcome.map_err(to_py_err)
+}
+
+/// Await `Engine::exists` for `doc_id`, forwarding its boolean result and
+/// converting any engine error with `to_py_err`.
+async fn run_exists(engine: Arc<Engine>, doc_id: String) -> PyResult<bool> {
+    let outcome = engine.exists(&doc_id).await;
+    outcome.map_err(to_py_err)
+}
+
+/// Await `Engine::get_graph`; a present graph is wrapped in
+/// `PyDocumentGraph`, an absent one stays `None`. Engine errors are converted
+/// with `to_py_err`.
+async fn run_get_graph(engine: Arc<Engine>) -> PyResult<Option<PyDocumentGraph>> {
+    engine
+        .get_graph()
+        .await
+        .map(|maybe_graph| maybe_graph.map(|inner| PyDocumentGraph { inner }))
+        .map_err(to_py_err)
+}
+
+/// Synchronously fetch `Engine::metrics_report` and wrap it for Python.
+fn run_metrics_report(engine: Arc<Engine>) -> PyMetricsReport {
+    let inner = engine.metrics_report();
+    PyMetricsReport { inner }
+}
+
+// ============================================================
+// Engine
+// ============================================================
+
+/// The main vectorless engine.
+///
+/// `api_key` and `model` are documented as **required**, although the
+/// constructor signature accepts `None` for every argument.
+///
+/// ```python
+/// from vectorless import Engine, IndexContext, QueryContext
+///
+/// engine = Engine(
+///     api_key="sk-...",
+///     model="gpt-4o",
+/// )
+///
+/// # Index
+/// result = await engine.index(IndexContext.from_path("./report.pdf"))
+/// doc_id = result.doc_id
+///
+/// # Query
+/// answer = await engine.query(QueryContext("What is the revenue?").with_doc_ids([doc_id]))
+/// print(answer.single().content)
+/// ```
+#[pyclass(name = "Engine")]
+pub struct PyEngine {
+    // Shared handle; each async method clones it into the future it returns.
+    inner: Arc<Engine>,
+}
+
+#[pymethods]
+impl PyEngine {
+    /// Create a new Engine.
+    ///
+    /// Args:
+    ///     api_key: **Required**. LLM API key.
+    ///     model: **Required**. LLM model name.
+    ///     endpoint: Optional API endpoint.
+    ///     config: Optional Config for advanced tuning.
+    ///
+    /// Raises:
+    ///     VectorlessError: If the tokio runtime cannot be created or the
+    ///         engine fails to build (kind "config" in both cases).
+    #[new]
+    #[pyo3(signature = (api_key=None, model=None, endpoint=None, config=None))]
+    fn new(
+        api_key: Option<String>,
+        model: Option<String>,
+        endpoint: Option<String>,
+        config: Option<PyRef<PyConfig>>,
+    ) -> PyResult<Self> {
+        // This runtime only drives `EngineBuilder::build()` below and is
+        // dropped when the constructor returns.
+        // NOTE(review): if `build()` ever spawns background tasks they would
+        // presumably not outlive this runtime; confirm against EngineBuilder.
+        let runtime = match Runtime::new() {
+            Ok(runtime) => runtime,
+            Err(e) => {
+                let message = format!("Failed to create tokio runtime: {}", e);
+                return Err(VectorlessError::new(message, "config").into());
+            }
+        };
+
+        // Clone the Rust config out of the Python object before building.
+        let rust_config = config.map(|py_config| py_config.inner.clone());
+
+        // Only the values the caller supplied are forwarded to the builder,
+        // in the order: config, model, endpoint, key.
+        // NOTE(review): a missing api_key/model is presumably rejected by
+        // `build()`; nothing in this constructor enforces it.
+        let built = runtime.block_on(async {
+            let builder = EngineBuilder::new();
+            let builder = match rust_config {
+                Some(cfg) => builder.with_config(cfg),
+                None => builder,
+            };
+            let builder = match &model {
+                Some(name) => builder.with_model(name),
+                None => builder,
+            };
+            let builder = match &endpoint {
+                Some(url) => builder.with_endpoint(url),
+                None => builder,
+            };
+            let builder = match api_key {
+                Some(key) => builder.with_key(key),
+                None => builder,
+            };
+
+            builder.build().await
+        });
+
+        match built {
+            Ok(engine) => Ok(Self {
+                inner: Arc::new(engine),
+            }),
+            Err(e) => {
+                let message = format!("Failed to create engine: {}", e);
+                Err(VectorlessError::new(message, "config").into())
+            }
+        }
+    }
+
+    /// Index a document.
+    ///
+    /// Args:
+    ///     ctx: IndexContext created from from_path, from_paths, from_dir, etc.
+    ///
+    /// Returns:
+    ///     Awaitable resolving to an IndexResult with doc_id and items.
+    ///
+    /// Raises:
+    ///     VectorlessError: If indexing fails.
+    fn index<'py>(&self, py: Python<'py>, ctx: &PyIndexContext) -> PyResult<Bound<'py, PyAny>> {
+        // The context is cloned so the future owns everything it needs.
+        let task = run_index(Arc::clone(&self.inner), ctx.inner.clone());
+        future_into_py(py, task)
+    }
+
+    /// Query indexed documents.
+    ///
+    /// Args:
+    ///     ctx: QueryContext with query text and scope.
+    ///
+    /// Returns:
+    ///     Awaitable resolving to a QueryResult with answer and score.
+    ///
+    /// Raises:
+    ///     VectorlessError: If query fails.
+    fn query<'py>(&self, py: Python<'py>, ctx: &PyQueryContext) -> PyResult<Bound<'py, PyAny>> {
+        // The context is cloned so the future owns everything it needs.
+        let task = run_query(Arc::clone(&self.inner), ctx.inner.clone());
+        future_into_py(py, task)
+    }
+
+    /// List all indexed documents.
+    ///
+    /// Returns:
+    ///     Awaitable resolving to a list of DocumentInfo objects.
+    fn list<'py>(&self, py: Python<'py>) -> PyResult<Bound<'py, PyAny>> {
+        let task = run_list(Arc::clone(&self.inner));
+        future_into_py(py, task)
+    }
+
+    /// Remove a document by ID.
+    ///
+    /// Returns:
+    ///     Awaitable resolving to True if removed, False if not found.
+    fn remove<'py>(&self, py: Python<'py>, doc_id: String) -> PyResult<Bound<'py, PyAny>> {
+        let task = run_remove(Arc::clone(&self.inner), doc_id);
+        future_into_py(py, task)
+    }
+
+    /// Remove all indexed documents.
+    ///
+    /// Returns:
+    ///     Awaitable resolving to the number of documents removed.
+    fn clear<'py>(&self, py: Python<'py>) -> PyResult<Bound<'py, PyAny>> {
+        let task = run_clear(Arc::clone(&self.inner));
+        future_into_py(py, task)
+    }
+
+    /// Check if a document exists.
+    ///
+    /// Returns:
+    ///     Awaitable resolving to a bool.
+    fn exists<'py>(&self, py: Python<'py>, doc_id: String) -> PyResult<Bound<'py, PyAny>> {
+        let task = run_exists(Arc::clone(&self.inner), doc_id);
+        future_into_py(py, task)
+    }
+
+    /// Get the cross-document relationship graph.
+    ///
+    /// Returns:
+    ///     Awaitable resolving to a DocumentGraph if any documents exist,
+    ///     else None.
+    fn get_graph<'py>(&self, py: Python<'py>) -> PyResult<Bound<'py, PyAny>> {
+        let task = run_get_graph(Arc::clone(&self.inner));
+        future_into_py(py, task)
+    }
+
+    /// Generate a complete metrics report (synchronous, not awaitable).
+    ///
+    /// Returns:
+    ///     MetricsReport with LLM, Pilot, and Retrieval metrics.
+    fn metrics_report(&self) -> PyMetricsReport {
+        let engine = Arc::clone(&self.inner);
+        run_metrics_report(engine)
+    }
+
+    /// Fixed placeholder representation; no field is rendered.
+    fn __repr__(&self) -> String {
+        String::from("Engine(...)")
+    }
+}
diff --git a/python/src/error.rs b/python/src/error.rs
new file mode 100644
index 00000000..d128ce5a
--- /dev/null
+++ b/python/src/error.rs
@@ -0,0 +1,71 @@
+// Copyright (c) 2026 vectorless developers
+// SPDX-License-Identifier: Apache-2.0
+
+//! Python exception types and error conversion.
+
+use pyo3::exceptions::PyException;
+use pyo3::prelude::*;
+
+use ::vectorless::error::Error as RustError;
+
+/// Exception type raised to Python for vectorless failures.
+///
+/// Carries a human-readable `message` and a short `kind` tag
+/// (for example "config", "parse" or "unknown").
+#[pyclass(extends = PyException, subclass)]
+pub struct VectorlessError {
+    message: String,
+    kind: String,
+}
+
+#[pymethods]
+impl VectorlessError {
+    /// Python-side constructor: `VectorlessError(message, kind)`.
+    #[new]
+    fn new_py(message: String, kind: String) -> Self {
+        VectorlessError { message, kind }
+    }
+
+    /// The error message.
+    #[getter]
+    fn message(&self) -> &str {
+        self.message.as_str()
+    }
+
+    /// The error kind tag.
+    #[getter]
+    fn kind(&self) -> &str {
+        self.kind.as_str()
+    }
+
+    /// `str(err)` yields just the message.
+    fn __str__(&self) -> &str {
+        self.message.as_str()
+    }
+
+    /// `repr(err)` shows both the message and the kind.
+    fn __repr__(&self) -> String {
+        let Self { message, kind } = self;
+        format!("VectorlessError('{}', kind='{}')", message, kind)
+    }
+}
+
+impl VectorlessError {
+    /// Rust-side constructor taking the kind as a borrowed string.
+    pub fn new(message: String, kind: &str) -> Self {
+        let kind = kind.to_owned();
+        Self { message, kind }
+    }
+}
+
+impl From<VectorlessError> for PyErr {
+    /// Build a `PyErr` of this exception type from `(message, kind)`.
+    fn from(err: VectorlessError) -> PyErr {
+        let VectorlessError { message, kind } = err;
+        PyErr::new::<VectorlessError, _>((message, kind))
+    }
+}
+
+/// Convert vectorless errors to Python exceptions.
+pub fn to_py_err(e: RustError) -> PyErr {
+    let message = e.to_string();
+    let kind = match &e {
+        RustError::DocumentNotFound(_) => "not_found",
+        RustError::Parse(_) => "parse",
+        RustError::Config(_) => "config",
+        RustError::Workspace(_) => "workspace",
+        RustError::Llm(_) => "llm",
+        _ => "unknown",
+    };
+    VectorlessError::new(message, kind).into()
+}
diff --git a/python/src/graph.rs b/python/src/graph.rs
new file mode 100644
index 00000000..1aacd47f
--- /dev/null
+++ b/python/src/graph.rs
@@ -0,0 +1,212 @@
+// Copyright (c) 2026 vectorless developers
+// SPDX-License-Identifier: Apache-2.0
+
+//! DocumentGraph Python wrappers.
+
+use pyo3::prelude::*;
+
+use ::vectorless::graph::{
+    DocumentGraph, DocumentGraphNode, EdgeEvidence, GraphEdge, WeightedKeyword,
+};
+
+/// A keyword paired with its weight from document analysis.
+#[pyclass(name = "WeightedKeyword")]
+pub struct PyWeightedKeyword {
+    pub(crate) inner: WeightedKeyword,
+}
+
+#[pymethods]
+impl PyWeightedKeyword {
+    /// The keyword text.
+    #[getter]
+    fn keyword(&self) -> &str {
+        let entry = &self.inner;
+        &entry.keyword
+    }
+
+    /// The keyword's weight.
+    #[getter]
+    fn weight(&self) -> f32 {
+        let entry = &self.inner;
+        entry.weight
+    }
+
+    /// Representation with the weight rounded to two decimals.
+    fn __repr__(&self) -> String {
+        let entry = &self.inner;
+        format!(
+            "WeightedKeyword('{}', weight={:.2})",
+            entry.keyword, entry.weight
+        )
+    }
+}
+
+/// Evidence backing a cross-document connection.
+#[pyclass(name = "EdgeEvidence")]
+pub struct PyEdgeEvidence {
+    pub(crate) inner: EdgeEvidence,
+}
+
+#[pymethods]
+impl PyEdgeEvidence {
+    /// Number of shared keywords.
+    #[getter]
+    fn shared_keyword_count(&self) -> usize {
+        let evidence = &self.inner;
+        evidence.shared_keyword_count
+    }
+
+    /// Jaccard similarity of keyword sets.
+    #[getter]
+    fn keyword_jaccard(&self) -> f32 {
+        let evidence = &self.inner;
+        evidence.keyword_jaccard
+    }
+
+    /// Shared keywords as `(keyword, source_weight, target_weight)` tuples.
+    #[getter]
+    fn shared_keywords(&self) -> Vec<(String, f32, f32)> {
+        let shared = self.inner.shared_keywords.iter();
+        shared
+            .map(|entry| {
+                let keyword = entry.keyword.clone();
+                (keyword, entry.source_weight, entry.target_weight)
+            })
+            .collect()
+    }
+
+    /// Representation with the Jaccard value rounded to two decimals.
+    fn __repr__(&self) -> String {
+        let evidence = &self.inner;
+        format!(
+            "EdgeEvidence(shared={}, jaccard={:.2})",
+            evidence.shared_keyword_count, evidence.keyword_jaccard
+        )
+    }
+}
+
+/// A relationship edge pointing from one document to another.
+#[pyclass(name = "GraphEdge")]
+pub struct PyGraphEdge {
+    pub(crate) inner: GraphEdge,
+}
+
+#[pymethods]
+impl PyGraphEdge {
+    /// Target document ID.
+    #[getter]
+    fn target_doc_id(&self) -> &str {
+        let edge = &self.inner;
+        &edge.target_doc_id
+    }
+
+    /// Edge weight (connection strength).
+    #[getter]
+    fn weight(&self) -> f32 {
+        let edge = &self.inner;
+        edge.weight
+    }
+
+    /// Evidence for this connection, returned as an independent copy.
+    #[getter]
+    fn evidence(&self) -> PyEdgeEvidence {
+        let inner = self.inner.evidence.clone();
+        PyEdgeEvidence { inner }
+    }
+
+    /// Representation with the weight rounded to two decimals.
+    fn __repr__(&self) -> String {
+        let edge = &self.inner;
+        format!(
+            "GraphEdge(target='{}', weight={:.2})",
+            edge.target_doc_id, edge.weight
+        )
+    }
+}
+
+/// A document graph node, representing one indexed document.
+#[pyclass(name = "DocumentGraphNode")]
+pub struct PyDocumentGraphNode {
+    pub(crate) inner: DocumentGraphNode,
+}
+
+#[pymethods]
+impl PyDocumentGraphNode {
+    /// Document ID of this node.
+    #[getter]
+    fn doc_id(&self) -> &str {
+        let node = &self.inner;
+        &node.doc_id
+    }
+
+    /// Document title.
+    #[getter]
+    fn title(&self) -> &str {
+        let node = &self.inner;
+        &node.title
+    }
+
+    /// Document format, as a string.
+    #[getter]
+    fn format(&self) -> &str {
+        let node = &self.inner;
+        &node.format
+    }
+
+    /// The node's `node_count` value.
+    #[getter]
+    fn node_count(&self) -> usize {
+        let node = &self.inner;
+        node.node_count
+    }
+
+    /// Top keywords extracted from the document, each returned as a copy.
+    #[getter]
+    fn top_keywords(&self) -> Vec<PyWeightedKeyword> {
+        let keywords = self.inner.top_keywords.iter();
+        keywords
+            .map(|entry| PyWeightedKeyword {
+                inner: entry.clone(),
+            })
+            .collect()
+    }
+
+    /// Representation showing the document ID and title.
+    fn __repr__(&self) -> String {
+        let node = &self.inner;
+        format!(
+            "DocumentGraphNode(doc_id='{}', title='{}')",
+            node.doc_id, node.title
+        )
+    }
+}
+
+/// Cross-document relationship graph.
+///
+/// Automatically rebuilt after indexing. Connects documents
+/// that share keywords via Jaccard similarity.
+///
+/// Nodes and edges handed to Python are copies of the graph's data.
+#[pyclass(name = "DocumentGraph")]
+pub struct PyDocumentGraph {
+    pub(crate) inner: DocumentGraph,
+}
+
+#[pymethods]
+impl PyDocumentGraph {
+    /// Number of document nodes.
+    fn node_count(&self) -> usize {
+        let graph = &self.inner;
+        graph.node_count()
+    }
+
+    /// Number of relationship edges.
+    fn edge_count(&self) -> usize {
+        let graph = &self.inner;
+        graph.edge_count()
+    }
+
+    /// Look up a document node by ID; None when the graph has no such node.
+    fn get_node(&self, doc_id: String) -> Option<PyDocumentGraphNode> {
+        let node = self.inner.get_node(&doc_id)?;
+        Some(PyDocumentGraphNode {
+            inner: node.clone(),
+        })
+    }
+
+    /// All document IDs in the graph, as owned strings.
+    fn doc_ids(&self) -> Vec<String> {
+        let ids = self.inner.doc_ids();
+        ids.map(|id| id.to_string()).collect()
+    }
+
+    /// Edges (neighbors) recorded for a document.
+    fn get_neighbors(&self, doc_id: String) -> Vec<PyGraphEdge> {
+        let neighbors = self.inner.get_neighbors(&doc_id);
+        neighbors
+            .iter()
+            .map(|edge| PyGraphEdge {
+                inner: edge.clone(),
+            })
+            .collect()
+    }
+
+    /// Whether the graph is empty.
+    fn is_empty(&self) -> bool {
+        let graph = &self.inner;
+        graph.is_empty()
+    }
+
+    /// Representation showing the node and edge counts.
+    fn __repr__(&self) -> String {
+        let nodes = self.inner.node_count();
+        let edges = self.inner.edge_count();
+        format!("DocumentGraph(nodes={}, edges={})", nodes, edges)
+    }
+}
diff --git a/python/src/lib.rs b/python/src/lib.rs
index f6ff36ee..ebee59cf 100644
--- a/python/src/lib.rs
+++ b/python/src/lib.rs
@@ -3,1566 +3,30 @@
 
 //! Python bindings for vectorless.
 
-use pyo3::exceptions::PyException;
 use pyo3::prelude::*;
-use pyo3_async_runtimes::tokio::future_into_py;
-use std::sync::Arc;
-use tokio::runtime::Runtime;
 
-use ::vectorless::client::{
-    DocumentFormat, DocumentInfo, Engine, EngineBuilder, FailedItem, IndexContext, IndexItem,
-    IndexMode, IndexOptions, IndexResult, QueryContext, QueryResult, QueryResultItem,
+mod config;
+mod context;
+mod document;
+mod engine;
+mod error;
+mod graph;
+mod metrics;
+mod results;
+
+use config::PyConfig;
+use context::{PyIndexContext, PyIndexOptions, PyQueryContext};
+use document::PyDocumentInfo;
+use engine::PyEngine;
+use error::VectorlessError;
+use graph::{PyDocumentGraph, PyDocumentGraphNode, PyEdgeEvidence, PyGraphEdge, PyWeightedKeyword};
+use metrics::{
+    PyLlmMetricsReport, PyMetricsReport, PyPilotMetricsReport, PyRetrievalMetricsReport,
 };
-use ::vectorless::error::Error as RustError;
-use ::vectorless::metrics::IndexMetrics;
-use ::vectorless::metrics::{
-    LlmMetricsReport, MetricsReport, PilotMetricsReport, RetrievalMetricsReport,
+use results::{
+    PyFailedItem, PyIndexItem, PyIndexMetrics, PyIndexResult, PyQueryResult, PyQueryResultItem,
 };
 
-// ============================================================
-// Error Types
-// ============================================================
-
-/// Python exception for vectorless errors.
-#[pyclass(extends = PyException, subclass)]
-pub struct VectorlessError {
-    message: String,
-    kind: String,
-}
-
-#[pymethods]
-impl VectorlessError {
-    #[new]
-    fn new_py(message: String, kind: String) -> Self {
-        Self { message, kind }
-    }
-
-    #[getter]
-    fn message(&self) -> &str {
-        &self.message
-    }
-
-    #[getter]
-    fn kind(&self) -> &str {
-        &self.kind
-    }
-
-    fn __str__(&self) -> &str {
-        &self.message
-    }
-
-    fn __repr__(&self) -> String {
-        format!("VectorlessError('{}', kind='{}')", self.message, self.kind)
-    }
-}
-
-impl VectorlessError {
-    fn new(message: String, kind: &str) -> Self {
-        Self {
-            message,
-            kind: kind.to_string(),
-        }
-    }
-}
-
-impl From<VectorlessError> for PyErr {
-    fn from(err: VectorlessError) -> PyErr {
-        PyErr::new::<VectorlessError, _>((err.message, err.kind))
-    }
-}
-
-/// Convert vectorless errors to Python exceptions.
-fn to_py_err(e: RustError) -> PyErr {
-    let message = e.to_string();
-    let kind = match &e {
-        RustError::DocumentNotFound(_) => "not_found",
-        RustError::Parse(_) => "parse",
-        RustError::Config(_) => "config",
-        RustError::Workspace(_) => "workspace",
-        RustError::Llm(_) => "llm",
-        _ => "unknown",
-    };
-    VectorlessError::new(message, kind).into()
-}
-
-/// Parse format string to DocumentFormat.
-fn parse_format(format: &str) -> PyResult<DocumentFormat> {
-    match format.to_lowercase().as_str() {
-        "markdown" | "md" => Ok(DocumentFormat::Markdown),
-        "pdf" => Ok(DocumentFormat::Pdf),
-        _ => Err(PyErr::from(VectorlessError::new(
-            format!("Unknown format: {}. Supported: markdown, pdf", format),
-            "config",
-        ))),
-    }
-}
-
-// ============================================================
-// IndexOptions
-// ============================================================
-
-/// Options for controlling indexing behavior.
-///
-/// Args:
-///     mode: Indexing mode - "default", "force", or "incremental".
-///     generate_summaries: Whether to generate summaries. Default: True.
-///     generate_description: Whether to generate document description. Default: False.
-///     include_text: Whether to include node text in the tree. Default: True.
-///     generate_ids: Whether to generate node IDs. Default: True.
-///     enable_synonym_expansion: Whether to expand keywords with LLM-generated
-///         synonyms during indexing. Improves recall for differently-worded queries.
-///         Default: False.
-#[pyclass(name = "IndexOptions", skip_from_py_object)]
-#[derive(Clone)]
-pub struct PyIndexOptions {
-    inner: IndexOptions,
-}
-
-#[pymethods]
-impl PyIndexOptions {
-    #[new]
-    #[pyo3(signature = (mode="default", generate_summaries=true, generate_description=false, include_text=true, generate_ids=true, enable_synonym_expansion=false))]
-    fn new(
-        mode: &str,
-        generate_summaries: bool,
-        generate_description: bool,
-        include_text: bool,
-        generate_ids: bool,
-        enable_synonym_expansion: bool,
-    ) -> PyResult<Self> {
-        let mut opts = IndexOptions::new();
-        match mode {
-            "default" => {}
-            "force" => opts = opts.with_mode(IndexMode::Force),
-            "incremental" => opts = opts.with_mode(IndexMode::Incremental),
-            _ => {
-                return Err(PyErr::from(VectorlessError::new(
-                    format!(
-                        "Unknown mode: {}. Supported: default, force, incremental",
-                        mode
-                    ),
-                    "config",
-                )));
-            }
-        }
-        opts.generate_summaries = generate_summaries;
-        opts.generate_description = generate_description;
-        opts.include_text = include_text;
-        opts.generate_ids = generate_ids;
-        opts.enable_synonym_expansion = enable_synonym_expansion;
-        Ok(Self { inner: opts })
-    }
-
-    fn __repr__(&self) -> String {
-        format!(
-            "IndexOptions(mode='{}', generate_summaries={}, generate_description={}, include_text={}, generate_ids={}, enable_synonym_expansion={})",
-            match self.inner.mode {
-                IndexMode::Default => "default",
-                IndexMode::Force => "force",
-                IndexMode::Incremental => "incremental",
-            },
-            self.inner.generate_summaries,
-            self.inner.generate_description,
-            self.inner.include_text,
-            self.inner.generate_ids,
-            self.inner.enable_synonym_expansion,
-        )
-    }
-}
-
-// ============================================================
-// IndexContext
-// ============================================================
-
-/// Context for indexing a document.
-///
-/// Create using the static methods:
-///
-/// ```python
-/// from vectorless import IndexContext
-///
-/// # Single file
-/// ctx = IndexContext.from_path("./document.pdf")
-///
-/// # Multiple files
-/// ctx = IndexContext.from_paths(["./a.pdf", "./b.md"])
-///
-/// # Directory
-/// ctx = IndexContext.from_dir("./docs/")
-///
-/// # From text
-/// ctx = IndexContext.from_content("# Title\\nContent...", "markdown").with_name("doc")
-///
-/// # From bytes
-/// ctx = IndexContext.from_bytes(data, "pdf").with_name("doc")
-/// ```
-#[pyclass(name = "IndexContext")]
-pub struct PyIndexContext {
-    inner: IndexContext,
-}
-
-#[pymethods]
-impl PyIndexContext {
-    /// Create an IndexContext from a single file path.
-    #[staticmethod]
-    fn from_path(path: String) -> Self {
-        Self {
-            inner: IndexContext::from_path(&path),
-        }
-    }
-
-    /// Create an IndexContext from multiple file paths.
-    #[staticmethod]
-    fn from_paths(paths: Vec<String>) -> Self {
-        Self {
-            inner: IndexContext::from_paths(&paths),
-        }
-    }
-
-    /// Create an IndexContext from all supported files in a directory.
-    ///
-    /// Args:
-    ///     path: Directory path to scan.
-    ///     recursive: If True, scan subdirectories recursively. Default: False.
-    #[staticmethod]
-    #[pyo3(signature = (path, recursive=false))]
-    fn from_dir(path: String, recursive: bool) -> Self {
-        let inner = IndexContext::from_dir(&path, recursive);
-        Self { inner }
-    }
-
-    /// Create an IndexContext from text content.
-    #[staticmethod]
-    #[pyo3(signature = (content, format="markdown"))]
-    fn from_content(content: String, format: &str) -> PyResult<Self> {
-        let doc_format = parse_format(format)?;
-        let ctx = IndexContext::from_content(&content, doc_format);
-        Ok(Self { inner: ctx })
-    }
-
-    /// Create an IndexContext from binary data.
-    #[staticmethod]
-    fn from_bytes(data: Vec<u8>, format: &str) -> PyResult<Self> {
-        let doc_format = parse_format(format)?;
-        let ctx = IndexContext::from_bytes(data, doc_format);
-        Ok(Self { inner: ctx })
-    }
-
-    /// Set the document name (single-source only).
-    fn with_name(&self, name: String) -> Self {
-        let ctx = self.inner.clone().with_name(&name);
-        Self { inner: ctx }
-    }
-
-    /// Apply indexing options.
-    fn with_options(&self, options: &PyIndexOptions) -> Self {
-        let ctx = self.inner.clone().with_options(options.inner.clone());
-        Self { inner: ctx }
-    }
-
-    /// Set indexing mode.
-    fn with_mode(&self, mode: &str) -> PyResult<Self> {
-        let m = match mode {
-            "default" => IndexMode::Default,
-            "force" => IndexMode::Force,
-            "incremental" => IndexMode::Incremental,
-            _ => {
-                return Err(PyErr::from(VectorlessError::new(
-                    format!(
-                        "Unknown mode: {}. Supported: default, force, incremental",
-                        mode
-                    ),
-                    "config",
-                )));
-            }
-        };
-        let ctx = self.inner.clone().with_mode(m);
-        Ok(Self { inner: ctx })
-    }
-
-    /// Number of document sources.
-    fn __len__(&self) -> usize {
-        self.inner.len()
-    }
-
-    /// Whether no sources are present.
-    fn is_empty(&self) -> bool {
-        self.inner.is_empty()
-    }
-
-    fn __repr__(&self) -> String {
-        format!("IndexContext(sources={})", self.inner.len())
-    }
-}
-
-// ============================================================
-// QueryContext
-// ============================================================
-
-/// Context for a query operation.
-///
-/// ```python
-/// from vectorless import QueryContext
-///
-/// # Query specific documents
-/// ctx = QueryContext("What is the total revenue?").with_doc_ids([doc_id])
-///
-/// # Query multiple documents
-/// ctx = QueryContext("What is the architecture?").with_doc_ids(["doc-1", "doc-2"])
-///
-/// # Query entire workspace
-/// ctx = QueryContext("Explain the algorithm")
-/// ```
-#[pyclass(name = "QueryContext")]
-pub struct PyQueryContext {
-    inner: QueryContext,
-}
-
-#[pymethods]
-impl PyQueryContext {
-    /// Create a new query context (defaults to workspace scope).
-    #[new]
-    fn new(query: String) -> Self {
-        Self {
-            inner: QueryContext::new(&query),
-        }
-    }
-
-    /// Set scope to specific documents.
-    fn with_doc_ids(&self, doc_ids: Vec<String>) -> Self {
-        let ctx = self.inner.clone().with_doc_ids(doc_ids);
-        Self { inner: ctx }
-    }
-
-    /// Set scope to entire workspace.
-    fn with_workspace(&self) -> Self {
-        let ctx = self.inner.clone().with_workspace();
-        Self { inner: ctx }
-    }
-
-    /// Set the maximum tokens for the result content.
-    fn with_max_tokens(&self, tokens: usize) -> Self {
-        let ctx = self.inner.clone().with_max_tokens(tokens);
-        Self { inner: ctx }
-    }
-
-    /// Set whether to include the reasoning chain.
-    fn with_include_reasoning(&self, include: bool) -> Self {
-        let ctx = self.inner.clone().with_include_reasoning(include);
-        Self { inner: ctx }
-    }
-
-    /// Set the maximum tree traversal depth.
-    fn with_depth_limit(&self, depth: usize) -> Self {
-        let ctx = self.inner.clone().with_depth_limit(depth);
-        Self { inner: ctx }
-    }
-
-    fn __repr__(&self) -> String {
-        "QueryContext(...)".to_string()
-    }
-}
-
-// ============================================================
-// QueryResultItem
-// ============================================================
-
-/// A single document's query result.
-#[pyclass(name = "QueryResultItem")]
-pub struct PyQueryResultItem {
-    inner: QueryResultItem,
-}
-
-#[pymethods]
-impl PyQueryResultItem {
-    /// The document ID.
-    #[getter]
-    fn doc_id(&self) -> &str {
-        &self.inner.doc_id
-    }
-
-    /// The retrieved content.
-    #[getter]
-    fn content(&self) -> &str {
-        &self.inner.content
-    }
-
-    /// Relevance score (0.0 to 1.0).
-    #[getter]
-    fn score(&self) -> f32 {
-        self.inner.score
-    }
-
-    /// Node IDs that matched.
-    #[getter]
-    fn node_ids(&self) -> Vec<String> {
-        self.inner.node_ids.clone()
-    }
-
-    fn __repr__(&self) -> String {
-        format!(
-            "QueryResultItem(doc_id='{}', score={:.2}, content_len={})",
-            self.inner.doc_id,
-            self.inner.score,
-            self.inner.content.len()
-        )
-    }
-}
-
-// ============================================================
-// FailedItem
-// ============================================================
-
-/// A failed item in a batch operation.
-#[pyclass(name = "FailedItem")]
-pub struct PyFailedItem {
-    inner: FailedItem,
-}
-
-#[pymethods]
-impl PyFailedItem {
-    /// Source description.
-    #[getter]
-    fn source(&self) -> &str {
-        &self.inner.source
-    }
-
-    /// Error message.
-    #[getter]
-    fn error(&self) -> &str {
-        &self.inner.error
-    }
-
-    fn __repr__(&self) -> String {
-        format!(
-            "FailedItem(source='{}', error='{}')",
-            self.inner.source, self.inner.error
-        )
-    }
-}
-
-// ============================================================
-// QueryResult
-// ============================================================
-
-/// Result of a document query.
-#[pyclass(name = "QueryResult")]
-pub struct PyQueryResult {
-    inner: QueryResult,
-}
-
-#[pymethods]
-impl PyQueryResult {
-    /// Result items (one per document).
-    #[getter]
-    fn items(&self) -> Vec<PyQueryResultItem> {
-        self.inner
-            .items
-            .iter()
-            .map(|i| PyQueryResultItem { inner: i.clone() })
-            .collect()
-    }
-
-    /// Get the first (single-doc) result item.
-    fn single(&self) -> Option<PyQueryResultItem> {
-        self.inner
-            .single()
-            .map(|i| PyQueryResultItem { inner: i.clone() })
-    }
-
-    /// Number of result items.
-    fn __len__(&self) -> usize {
-        self.inner.len()
-    }
-
-    /// Whether any documents failed.
-    fn has_failures(&self) -> bool {
-        self.inner.has_failures()
-    }
-
-    /// Failed items.
-    #[getter]
-    fn failed(&self) -> Vec<PyFailedItem> {
-        self.inner
-            .failed
-            .iter()
-            .map(|f| PyFailedItem { inner: f.clone() })
-            .collect()
-    }
-
-    fn __repr__(&self) -> String {
-        format!(
-            "QueryResult(items={}, failed={})",
-            self.inner.len(),
-            self.inner.failed.len()
-        )
-    }
-}
-
-// ============================================================
-// IndexMetrics
-// ============================================================
-
-/// Indexing pipeline metrics.
-#[pyclass(name = "IndexMetrics")]
-pub struct PyIndexMetrics {
-    inner: IndexMetrics,
-}
-
-#[pymethods]
-impl PyIndexMetrics {
-    /// Total indexing time (ms).
-    #[getter]
-    fn total_time_ms(&self) -> u64 {
-        self.inner.total_time_ms()
-    }
-
-    /// Parse stage duration (ms).
-    #[getter]
-    fn parse_time_ms(&self) -> u64 {
-        self.inner.parse_time_ms
-    }
-
-    /// Build stage duration (ms).
-    #[getter]
-    fn build_time_ms(&self) -> u64 {
-        self.inner.build_time_ms
-    }
-
-    /// Enhance (summary) stage duration (ms).
-    #[getter]
-    fn enhance_time_ms(&self) -> u64 {
-        self.inner.enhance_time_ms
-    }
-
-    /// Number of nodes processed.
-    #[getter]
-    fn nodes_processed(&self) -> usize {
-        self.inner.nodes_processed
-    }
-
-    /// Number of summaries successfully generated.
-    #[getter]
-    fn summaries_generated(&self) -> usize {
-        self.inner.summaries_generated
-    }
-
-    /// Number of summaries that failed to generate.
-    #[getter]
-    fn summaries_failed(&self) -> usize {
-        self.inner.summaries_failed
-    }
-
-    /// Number of LLM calls made.
-    #[getter]
-    fn llm_calls(&self) -> usize {
-        self.inner.llm_calls
-    }
-
-    /// Total tokens generated by LLM.
-    #[getter]
-    fn total_tokens_generated(&self) -> usize {
-        self.inner.total_tokens_generated
-    }
-
-    /// Number of topics in reasoning index.
-    #[getter]
-    fn topics_indexed(&self) -> usize {
-        self.inner.topics_indexed
-    }
-
-    /// Number of keywords in reasoning index.
-    #[getter]
-    fn keywords_indexed(&self) -> usize {
-        self.inner.keywords_indexed
-    }
-
-    fn __repr__(&self) -> String {
-        format!(
-            "IndexMetrics(total={}ms, summaries={}, failed={}, llm_calls={})",
-            self.inner.total_time_ms(),
-            self.inner.summaries_generated,
-            self.inner.summaries_failed,
-            self.inner.llm_calls,
-        )
-    }
-}
-
-// ============================================================
-// Runtime Metrics Reports
-// ============================================================
-
-/// LLM usage metrics report.
-#[pyclass(name = "LlmMetricsReport")]
-pub struct PyLlmMetricsReport {
-    inner: LlmMetricsReport,
-}
-
-#[pymethods]
-impl PyLlmMetricsReport {
-    /// Total number of LLM calls.
-    #[getter]
-    fn total_calls(&self) -> u64 {
-        self.inner.total_calls
-    }
-
-    /// Number of successful calls.
-    #[getter]
-    fn successful_calls(&self) -> u64 {
-        self.inner.successful_calls
-    }
-
-    /// Number of failed calls.
-    #[getter]
-    fn failed_calls(&self) -> u64 {
-        self.inner.failed_calls
-    }
-
-    /// Success rate (0.0 - 1.0).
-    #[getter]
-    fn success_rate(&self) -> f64 {
-        self.inner.success_rate
-    }
-
-    /// Total input tokens.
-    #[getter]
-    fn total_input_tokens(&self) -> u64 {
-        self.inner.total_input_tokens
-    }
-
-    /// Total output tokens.
-    #[getter]
-    fn total_output_tokens(&self) -> u64 {
-        self.inner.total_output_tokens
-    }
-
-    /// Total tokens (input + output).
-    #[getter]
-    fn total_tokens(&self) -> u64 {
-        self.inner.total_tokens
-    }
-
-    /// Average latency per call in milliseconds.
-    #[getter]
-    fn avg_latency_ms(&self) -> f64 {
-        self.inner.avg_latency_ms
-    }
-
-    /// Total latency in milliseconds.
-    #[getter]
-    fn total_latency_ms(&self) -> u64 {
-        self.inner.total_latency_ms
-    }
-
-    /// Estimated cost in USD.
-    #[getter]
-    fn estimated_cost_usd(&self) -> f64 {
-        self.inner.estimated_cost_usd
-    }
-
-    /// Number of rate limit errors.
-    #[getter]
-    fn rate_limit_errors(&self) -> u64 {
-        self.inner.rate_limit_errors
-    }
-
-    /// Number of timeout errors.
-    #[getter]
-    fn timeout_errors(&self) -> u64 {
-        self.inner.timeout_errors
-    }
-
-    /// Number of fallback triggers.
-    #[getter]
-    fn fallback_triggers(&self) -> u64 {
-        self.inner.fallback_triggers
-    }
-
-    fn __repr__(&self) -> String {
-        format!(
-            "LlmMetricsReport(calls={}, tokens={}, cost=${:.4})",
-            self.inner.total_calls, self.inner.total_tokens, self.inner.estimated_cost_usd,
-        )
-    }
-}
-
-/// Pilot decision metrics report.
-#[pyclass(name = "PilotMetricsReport")]
-pub struct PyPilotMetricsReport {
-    inner: PilotMetricsReport,
-}
-
-#[pymethods]
-impl PyPilotMetricsReport {
-    /// Total number of Pilot decisions.
-    #[getter]
-    fn total_decisions(&self) -> u64 {
-        self.inner.total_decisions
-    }
-
-    /// Number of start guidance calls.
-    #[getter]
-    fn start_guidance_calls(&self) -> u64 {
-        self.inner.start_guidance_calls
-    }
-
-    /// Number of fork decisions.
-    #[getter]
-    fn fork_decisions(&self) -> u64 {
-        self.inner.fork_decisions
-    }
-
-    /// Number of backtrack calls.
-    #[getter]
-    fn backtrack_calls(&self) -> u64 {
-        self.inner.backtrack_calls
-    }
-
-    /// Number of evaluate calls.
-    #[getter]
-    fn evaluate_calls(&self) -> u64 {
-        self.inner.evaluate_calls
-    }
-
-    /// Decision accuracy based on feedback (0.0 - 1.0).
-    #[getter]
-    fn accuracy(&self) -> f64 {
-        self.inner.accuracy
-    }
-
-    /// Number of correct decisions.
-    #[getter]
-    fn correct_decisions(&self) -> u64 {
-        self.inner.correct_decisions
-    }
-
-    /// Number of incorrect decisions.
-    #[getter]
-    fn incorrect_decisions(&self) -> u64 {
-        self.inner.incorrect_decisions
-    }
-
-    /// Average confidence across all decisions.
-    #[getter]
-    fn avg_confidence(&self) -> f64 {
-        self.inner.avg_confidence
-    }
-
-    /// Number of LLM calls made by Pilot.
-    #[getter]
-    fn llm_calls(&self) -> u64 {
-        self.inner.llm_calls
-    }
-
-    /// Number of interventions.
-    #[getter]
-    fn interventions(&self) -> u64 {
-        self.inner.interventions
-    }
-
-    /// Number of skipped interventions.
-    #[getter]
-    fn skipped_interventions(&self) -> u64 {
-        self.inner.skipped_interventions
-    }
-
-    /// Number of budget exhausted events.
-    #[getter]
-    fn budget_exhausted(&self) -> u64 {
-        self.inner.budget_exhausted
-    }
-
-    /// Number of algorithm fallbacks.
-    #[getter]
-    fn algorithm_fallbacks(&self) -> u64 {
-        self.inner.algorithm_fallbacks
-    }
-
-    fn __repr__(&self) -> String {
-        format!(
-            "PilotMetricsReport(decisions={}, accuracy={:.2}, avg_confidence={:.2})",
-            self.inner.total_decisions, self.inner.accuracy, self.inner.avg_confidence,
-        )
-    }
-}
-
-/// Retrieval operation metrics report.
-#[pyclass(name = "RetrievalMetricsReport")]
-pub struct PyRetrievalMetricsReport {
-    inner: RetrievalMetricsReport,
-}
-
-#[pymethods]
-impl PyRetrievalMetricsReport {
-    /// Total number of queries.
-    #[getter]
-    fn total_queries(&self) -> u64 {
-        self.inner.total_queries
-    }
-
-    /// Total number of search iterations.
-    #[getter]
-    fn total_iterations(&self) -> u64 {
-        self.inner.total_iterations
-    }
-
-    /// Average iterations per query.
-    #[getter]
-    fn avg_iterations(&self) -> f64 {
-        self.inner.avg_iterations
-    }
-
-    /// Total nodes visited.
-    #[getter]
-    fn nodes_visited(&self) -> u64 {
-        self.inner.nodes_visited
-    }
-
-    /// Total paths found.
-    #[getter]
-    fn paths_found(&self) -> u64 {
-        self.inner.paths_found
-    }
-
-    /// Average path length.
-    #[getter]
-    fn avg_path_length(&self) -> f64 {
-        self.inner.avg_path_length
-    }
-
-    /// Average path score (0.0 - 1.0).
-    #[getter]
-    fn avg_path_score(&self) -> f64 {
-        self.inner.avg_path_score
-    }
-
-    /// Number of high-score paths (>= 0.5).
-    #[getter]
-    fn high_score_paths(&self) -> u64 {
-        self.inner.high_score_paths
-    }
-
-    /// Number of low-score paths (< 0.3).
-    #[getter]
-    fn low_score_paths(&self) -> u64 {
-        self.inner.low_score_paths
-    }
-
-    /// Number of cache hits.
-    #[getter]
-    fn cache_hits(&self) -> u64 {
-        self.inner.cache_hits
-    }
-
-    /// Number of cache misses.
-    #[getter]
-    fn cache_misses(&self) -> u64 {
-        self.inner.cache_misses
-    }
-
-    /// Cache hit rate (0.0 - 1.0).
-    #[getter]
-    fn cache_hit_rate(&self) -> f64 {
-        self.inner.cache_hit_rate
-    }
-
-    /// Total latency in milliseconds.
-    #[getter]
-    fn total_latency_ms(&self) -> u64 {
-        self.inner.total_latency_ms
-    }
-
-    /// Average latency per query in milliseconds.
-    #[getter]
-    fn avg_latency_ms(&self) -> f64 {
-        self.inner.avg_latency_ms
-    }
-
-    /// Number of backtracks.
-    #[getter]
-    fn backtracks(&self) -> u64 {
-        self.inner.backtracks
-    }
-
-    /// Number of sufficiency checks.
-    #[getter]
-    fn sufficiency_checks(&self) -> u64 {
-        self.inner.sufficiency_checks
-    }
-
-    /// Sufficiency rate (0.0 - 1.0).
-    #[getter]
-    fn sufficiency_rate(&self) -> f64 {
-        self.inner.sufficiency_rate
-    }
-
-    fn __repr__(&self) -> String {
-        format!(
-            "RetrievalMetricsReport(queries={}, avg_score={:.2}, cache_hit={:.1}%)",
-            self.inner.total_queries,
-            self.inner.avg_path_score,
-            self.inner.cache_hit_rate * 100.0,
-        )
-    }
-}
-
-/// Complete metrics report combining all subsystem metrics.
-#[pyclass(name = "MetricsReport")]
-pub struct PyMetricsReport {
-    inner: MetricsReport,
-}
-
-#[pymethods]
-impl PyMetricsReport {
-    /// LLM metrics.
-    #[getter]
-    fn llm(&self) -> PyLlmMetricsReport {
-        PyLlmMetricsReport {
-            inner: self.inner.llm.clone(),
-        }
-    }
-
-    /// Pilot metrics.
-    #[getter]
-    fn pilot(&self) -> PyPilotMetricsReport {
-        PyPilotMetricsReport {
-            inner: self.inner.pilot.clone(),
-        }
-    }
-
-    /// Retrieval metrics.
-    #[getter]
-    fn retrieval(&self) -> PyRetrievalMetricsReport {
-        PyRetrievalMetricsReport {
-            inner: self.inner.retrieval.clone(),
-        }
-    }
-
-    /// Total estimated cost in USD.
-    fn total_cost_usd(&self) -> f64 {
-        self.inner.total_cost_usd()
-    }
-
-    /// Overall success rate (0.0 - 1.0).
-    fn overall_success_rate(&self) -> f64 {
-        self.inner.overall_success_rate()
-    }
-
-    fn __repr__(&self) -> String {
-        format!(
-            "MetricsReport(llm_calls={}, cost=${:.4}, queries={})",
-            self.inner.llm.total_calls,
-            self.inner.total_cost_usd(),
-            self.inner.retrieval.total_queries,
-        )
-    }
-}
-
-// ============================================================
-// IndexItem / IndexResult
-// ============================================================
-
-/// A single indexed document item.
-#[pyclass(name = "IndexItem")]
-pub struct PyIndexItem {
-    inner: IndexItem,
-}
-
-#[pymethods]
-impl PyIndexItem {
-    #[getter]
-    fn doc_id(&self) -> &str {
-        &self.inner.doc_id
-    }
-
-    #[getter]
-    fn name(&self) -> &str {
-        &self.inner.name
-    }
-
-    #[getter]
-    fn format(&self) -> String {
-        format!("{:?}", self.inner.format).to_lowercase()
-    }
-
-    #[getter]
-    fn description(&self) -> Option<&str> {
-        self.inner.description.as_deref()
-    }
-
-    #[getter]
-    fn source_path(&self) -> Option<&str> {
-        self.inner.source_path.as_deref()
-    }
-
-    #[getter]
-    fn page_count(&self) -> Option<usize> {
-        self.inner.page_count
-    }
-
-    /// Indexing pipeline metrics (timing, LLM usage, etc.).
-    #[getter]
-    fn metrics(&self) -> Option<PyIndexMetrics> {
-        self.inner
-            .metrics
-            .as_ref()
-            .map(|m| PyIndexMetrics { inner: m.clone() })
-    }
-
-    fn __repr__(&self) -> String {
-        format!(
-            "IndexItem(doc_id='{}', name='{}')",
-            self.inner.doc_id, self.inner.name
-        )
-    }
-}
-
-/// Result of a document indexing operation.
-#[pyclass(name = "IndexResult")]
-pub struct PyIndexResult {
-    inner: IndexResult,
-}
-
-#[pymethods]
-impl PyIndexResult {
-    /// The document ID (convenience for single-document indexing).
-    #[getter]
-    fn doc_id(&self) -> Option<String> {
-        self.inner.doc_id().map(|s| s.to_string())
-    }
-
-    /// All indexed items.
-    #[getter]
-    fn items(&self) -> Vec<PyIndexItem> {
-        self.inner
-            .items
-            .iter()
-            .map(|i| PyIndexItem { inner: i.clone() })
-            .collect()
-    }
-
-    /// Failed items.
-    #[getter]
-    fn failed(&self) -> Vec<PyFailedItem> {
-        self.inner
-            .failed
-            .iter()
-            .map(|f| PyFailedItem { inner: f.clone() })
-            .collect()
-    }
-
-    /// Whether any items failed.
-    fn has_failures(&self) -> bool {
-        self.inner.has_failures()
-    }
-
-    /// Total number of items (successful + failed).
-    fn total(&self) -> usize {
-        self.inner.total()
-    }
-
-    fn __len__(&self) -> usize {
-        self.inner.len()
-    }
-
-    fn __repr__(&self) -> String {
-        format!(
-            "IndexResult(doc_id={:?}, count={}, failed={})",
-            self.inner.doc_id(),
-            self.inner.items.len(),
-            self.inner.failed.len()
-        )
-    }
-}
-
-// ============================================================
-// DocumentInfo
-// ============================================================
-
-/// Information about an indexed document.
-#[pyclass(name = "DocumentInfo")]
-pub struct PyDocumentInfo {
-    inner: DocumentInfo,
-}
-
-#[pymethods]
-impl PyDocumentInfo {
-    #[getter]
-    fn id(&self) -> &str {
-        &self.inner.id
-    }
-
-    #[getter]
-    fn name(&self) -> &str {
-        &self.inner.name
-    }
-
-    #[getter]
-    fn format(&self) -> &str {
-        &self.inner.format
-    }
-
-    #[getter]
-    fn description(&self) -> Option<&str> {
-        self.inner.description.as_deref()
-    }
-
-    #[getter]
-    fn source_path(&self) -> Option<&str> {
-        self.inner.source_path.as_deref()
-    }
-
-    #[getter]
-    fn page_count(&self) -> Option<usize> {
-        self.inner.page_count
-    }
-
-    #[getter]
-    fn line_count(&self) -> Option<usize> {
-        self.inner.line_count
-    }
-
-    fn __repr__(&self) -> String {
-        format!(
-            "DocumentInfo(id='{}', name='{}', format='{}')",
-            self.inner.id, self.inner.name, self.inner.format
-        )
-    }
-}
-
-// ============================================================
-// DocumentGraph types
-// ============================================================
-
-use ::vectorless::graph::{
-    DocumentGraph, DocumentGraphNode, EdgeEvidence, GraphEdge, WeightedKeyword,
-};
-
-/// A keyword with weight from document analysis.
-#[pyclass(name = "WeightedKeyword")]
-pub struct PyWeightedKeyword {
-    inner: WeightedKeyword,
-}
-
-#[pymethods]
-impl PyWeightedKeyword {
-    #[getter]
-    fn keyword(&self) -> &str {
-        &self.inner.keyword
-    }
-
-    #[getter]
-    fn weight(&self) -> f32 {
-        self.inner.weight
-    }
-
-    fn __repr__(&self) -> String {
-        format!(
-            "WeightedKeyword('{}', weight={:.2})",
-            self.inner.keyword, self.inner.weight
-        )
-    }
-}
-
-/// Evidence for a cross-document connection.
-#[pyclass(name = "EdgeEvidence")]
-pub struct PyEdgeEvidence {
-    inner: EdgeEvidence,
-}
-
-#[pymethods]
-impl PyEdgeEvidence {
-    /// Number of shared keywords.
-    #[getter]
-    fn shared_keyword_count(&self) -> usize {
-        self.inner.shared_keyword_count
-    }
-
-    /// Jaccard similarity of keyword sets.
-    #[getter]
-    fn keyword_jaccard(&self) -> f32 {
-        self.inner.keyword_jaccard
-    }
-
-    /// Shared keywords with weights.
-    #[getter]
-    fn shared_keywords(&self) -> Vec<(String, f32, f32)> {
-        self.inner
-            .shared_keywords
-            .iter()
-            .map(|sk| (sk.keyword.clone(), sk.source_weight, sk.target_weight))
-            .collect()
-    }
-
-    fn __repr__(&self) -> String {
-        format!(
-            "EdgeEvidence(shared={}, jaccard={:.2})",
-            self.inner.shared_keyword_count, self.inner.keyword_jaccard
-        )
-    }
-}
-
-/// An edge representing a relationship between two documents.
-#[pyclass(name = "GraphEdge")]
-pub struct PyGraphEdge {
-    inner: GraphEdge,
-}
-
-#[pymethods]
-impl PyGraphEdge {
-    /// Target document ID.
-    #[getter]
-    fn target_doc_id(&self) -> &str {
-        &self.inner.target_doc_id
-    }
-
-    /// Edge weight (connection strength).
-    #[getter]
-    fn weight(&self) -> f32 {
-        self.inner.weight
-    }
-
-    /// Evidence for this connection.
-    #[getter]
-    fn evidence(&self) -> PyEdgeEvidence {
-        PyEdgeEvidence {
-            inner: self.inner.evidence.clone(),
-        }
-    }
-
-    fn __repr__(&self) -> String {
-        format!(
-            "GraphEdge(target='{}', weight={:.2})",
-            self.inner.target_doc_id, self.inner.weight
-        )
-    }
-}
-
-/// A node in the document graph representing an indexed document.
-#[pyclass(name = "DocumentGraphNode")]
-pub struct PyDocumentGraphNode {
-    inner: DocumentGraphNode,
-}
-
-#[pymethods]
-impl PyDocumentGraphNode {
-    #[getter]
-    fn doc_id(&self) -> &str {
-        &self.inner.doc_id
-    }
-
-    #[getter]
-    fn title(&self) -> &str {
-        &self.inner.title
-    }
-
-    #[getter]
-    fn format(&self) -> &str {
-        &self.inner.format
-    }
-
-    #[getter]
-    fn node_count(&self) -> usize {
-        self.inner.node_count
-    }
-
-    /// Top keywords extracted from the document.
-    #[getter]
-    fn top_keywords(&self) -> Vec<PyWeightedKeyword> {
-        self.inner
-            .top_keywords
-            .iter()
-            .map(|kw| PyWeightedKeyword { inner: kw.clone() })
-            .collect()
-    }
-
-    fn __repr__(&self) -> String {
-        format!(
-            "DocumentGraphNode(doc_id='{}', title='{}')",
-            self.inner.doc_id, self.inner.title
-        )
-    }
-}
-
-/// Cross-document relationship graph.
-///
-/// Automatically rebuilt after indexing. Connects documents
-/// that share keywords via Jaccard similarity.
-#[pyclass(name = "DocumentGraph")]
-pub struct PyDocumentGraph {
-    inner: DocumentGraph,
-}
-
-#[pymethods]
-impl PyDocumentGraph {
-    /// Number of document nodes.
-    fn node_count(&self) -> usize {
-        self.inner.node_count()
-    }
-
-    /// Number of relationship edges.
-    fn edge_count(&self) -> usize {
-        self.inner.edge_count()
-    }
-
-    /// Get a document node by ID.
-    fn get_node(&self, doc_id: String) -> Option<PyDocumentGraphNode> {
-        self.inner
-            .get_node(&doc_id)
-            .map(|n| PyDocumentGraphNode { inner: n.clone() })
-    }
-
-    /// Get all document IDs in the graph.
-    fn doc_ids(&self) -> Vec<String> {
-        self.inner.doc_ids().map(|s| s.to_string()).collect()
-    }
-
-    /// Get edges (neighbors) for a document.
-    fn get_neighbors(&self, doc_id: String) -> Vec<PyGraphEdge> {
-        self.inner
-            .get_neighbors(&doc_id)
-            .iter()
-            .map(|e| PyGraphEdge { inner: e.clone() })
-            .collect()
-    }
-
-    /// Whether the graph is empty.
-    fn is_empty(&self) -> bool {
-        self.inner.is_empty()
-    }
-
-    fn __repr__(&self) -> String {
-        format!(
-            "DocumentGraph(nodes={}, edges={})",
-            self.inner.node_count(),
-            self.inner.edge_count()
-        )
-    }
-}
-
-// ============================================================
-// Engine async helpers (named functions to avoid FnOnce HRTB issue)
-// ============================================================
-
-async fn run_index(engine: Arc<Engine>, ctx: IndexContext) -> PyResult<PyIndexResult> {
-    let result = engine.index(ctx).await.map_err(to_py_err)?;
-    Ok(PyIndexResult { inner: result })
-}
-
-async fn run_query(engine: Arc<Engine>, ctx: QueryContext) -> PyResult<PyQueryResult> {
-    let result = engine.query(ctx).await.map_err(to_py_err)?;
-    Ok(PyQueryResult { inner: result })
-}
-
-async fn run_list(engine: Arc<Engine>) -> PyResult<Vec<PyDocumentInfo>> {
-    let docs = engine.list().await.map_err(to_py_err)?;
-    Ok(docs
-        .into_iter()
-        .map(|d| PyDocumentInfo { inner: d })
-        .collect())
-}
-
-async fn run_remove(engine: Arc<Engine>, doc_id: String) -> PyResult<bool> {
-    engine.remove(&doc_id).await.map_err(to_py_err)
-}
-
-async fn run_clear(engine: Arc<Engine>) -> PyResult<usize> {
-    engine.clear().await.map_err(to_py_err)
-}
-
-async fn run_exists(engine: Arc<Engine>, doc_id: String) -> PyResult<bool> {
-    engine.exists(&doc_id).await.map_err(to_py_err)
-}
-
-async fn run_get_graph(engine: Arc<Engine>) -> PyResult<Option<PyDocumentGraph>> {
-    let graph = engine.get_graph().await.map_err(to_py_err)?;
-    Ok(graph.map(|g| PyDocumentGraph { inner: g }))
-}
-
-fn run_metrics_report(engine: Arc<Engine>) -> PyMetricsReport {
-    PyMetricsReport {
-        inner: engine.metrics_report(),
-    }
-}
-
-// ============================================================
-// Engine
-// ============================================================
-
-/// The main vectorless engine.
-///
-/// `api_key` and `model` are **required**.
-///
-/// ```python
-/// from vectorless import Engine, IndexContext, QueryContext
-///
-/// engine = Engine(
-///     api_key="sk-...",
-///     model="gpt-4o",
-/// )
-///
-/// # Index
-/// result = await engine.index(IndexContext.from_path("./report.pdf"))
-/// doc_id = result.doc_id
-///
-/// # Query
-/// answer = await engine.query(QueryContext("What is the revenue?").with_doc_ids([doc_id]))
-/// print(answer.single().content)
-/// ```
-#[pyclass(name = "Engine")]
-pub struct PyEngine {
-    inner: Arc<Engine>,
-}
-
-#[pymethods]
-impl PyEngine {
-    /// Create a new Engine.
-    ///
-    /// Args:
-    ///     config_path: Path to configuration file (optional).
-    ///     api_key: **Required**. LLM API key.
-    ///     model: **Required**. LLM model name.
-    ///     endpoint: Optional API endpoint.
-    ///
-    /// Raises:
-    ///     VectorlessError: If engine creation fails.
-    #[new]
-    #[pyo3(signature = (config_path=None, api_key=None, model=None, endpoint=None))]
-    fn new(
-        config_path: Option<String>,
-        api_key: Option<String>,
-        model: Option<String>,
-        endpoint: Option<String>,
-    ) -> PyResult<Self> {
-        let rt = Runtime::new().map_err(|e| {
-            PyErr::from(VectorlessError::new(
-                format!("Failed to create tokio runtime: {}", e),
-                "config",
-            ))
-        })?;
-
-        let engine = rt.block_on(async {
-            let mut builder = EngineBuilder::new();
-
-            if let Some(path) = &config_path {
-                builder = builder.with_config_path(path);
-            }
-            if let Some(m) = &model {
-                builder = builder.with_model(m);
-            }
-            if let Some(e) = &endpoint {
-                builder = builder.with_endpoint(e);
-            }
-            if let Some(key) = api_key {
-                builder = builder.with_key(key);
-            }
-
-            builder.build().await
-        });
-
-        let engine = engine.map_err(|e| {
-            PyErr::from(VectorlessError::new(
-                format!("Failed to create engine: {}", e),
-                "config",
-            ))
-        })?;
-
-        Ok(Self {
-            inner: Arc::new(engine),
-        })
-    }
-
-    /// Index a document.
-    ///
-    /// Args:
-    ///     ctx: IndexContext created from from_path, from_paths, from_dir, etc.
-    ///
-    /// Returns:
-    ///     IndexResult with doc_id and items.
-    ///
-    /// Raises:
-    ///     VectorlessError: If indexing fails.
-    fn index<'py>(&self, py: Python<'py>, ctx: &PyIndexContext) -> PyResult<Bound<'py, PyAny>> {
-        let engine = Arc::clone(&self.inner);
-        let index_ctx = ctx.inner.clone();
-        future_into_py(py, run_index(engine, index_ctx))
-    }
-
-    /// Query indexed documents.
-    ///
-    /// Args:
-    ///     ctx: QueryContext with query text and scope.
-    ///
-    /// Returns:
-    ///     QueryResult with answer and score.
-    ///
-    /// Raises:
-    ///     VectorlessError: If query fails.
-    fn query<'py>(&self, py: Python<'py>, ctx: &PyQueryContext) -> PyResult<Bound<'py, PyAny>> {
-        let engine = Arc::clone(&self.inner);
-        let query_ctx = ctx.inner.clone();
-        future_into_py(py, run_query(engine, query_ctx))
-    }
-
-    /// List all indexed documents.
-    ///
-    /// Returns:
-    ///     List of DocumentInfo objects.
-    fn list<'py>(&self, py: Python<'py>) -> PyResult<Bound<'py, PyAny>> {
-        let engine = Arc::clone(&self.inner);
-        future_into_py(py, run_list(engine))
-    }
-
-    /// Remove a document by ID.
-    ///
-    /// Returns:
-    ///     True if removed, False if not found.
-    fn remove<'py>(&self, py: Python<'py>, doc_id: String) -> PyResult<Bound<'py, PyAny>> {
-        let engine = Arc::clone(&self.inner);
-        future_into_py(py, run_remove(engine, doc_id))
-    }
-
-    /// Remove all indexed documents.
-    ///
-    /// Returns:
-    ///     Number of documents removed.
-    fn clear<'py>(&self, py: Python<'py>) -> PyResult<Bound<'py, PyAny>> {
-        let engine = Arc::clone(&self.inner);
-        future_into_py(py, run_clear(engine))
-    }
-
-    /// Check if a document exists.
-    fn exists<'py>(&self, py: Python<'py>, doc_id: String) -> PyResult<Bound<'py, PyAny>> {
-        let engine = Arc::clone(&self.inner);
-        future_into_py(py, run_exists(engine, doc_id))
-    }
-
-    /// Get the cross-document relationship graph.
-    ///
-    /// Returns:
-    ///     DocumentGraph if any documents exist, else None.
-    fn get_graph<'py>(&self, py: Python<'py>) -> PyResult<Bound<'py, PyAny>> {
-        let engine = Arc::clone(&self.inner);
-        future_into_py(py, run_get_graph(engine))
-    }
-
-    /// Generate a complete metrics report.
-    ///
-    /// Returns:
-    ///     MetricsReport with LLM, Pilot, and Retrieval metrics.
-    fn metrics_report(&self) -> PyMetricsReport {
-        run_metrics_report(Arc::clone(&self.inner))
-    }
-
-    fn __repr__(&self) -> String {
-        "Engine(...)".to_string()
-    }
-}
-
-// ============================================================
-// Module Definition
-// ============================================================
-
 /// Vectorless - Reasoning-native document intelligence engine.
 ///
 /// ```python
@@ -1595,6 +59,7 @@ fn _vectorless(m: &Bound<'_, PyModule>) -> PyResult<()> {
     m.add_class::<PyPilotMetricsReport>()?;
     m.add_class::<PyRetrievalMetricsReport>()?;
     m.add_class::<PyMetricsReport>()?;
+    m.add_class::<PyConfig>()?;
     m.add_class::<PyEngine>()?;
 
     m.add("__version__", env!("CARGO_PKG_VERSION"))?;
diff --git a/python/src/metrics.rs b/python/src/metrics.rs
new file mode 100644
index 00000000..669511cb
--- /dev/null
+++ b/python/src/metrics.rs
@@ -0,0 +1,376 @@
+// Copyright (c) 2026 vectorless developers
+// SPDX-License-Identifier: Apache-2.0
+
+//! Metrics report Python wrappers.
+
+use pyo3::prelude::*;
+
+use ::vectorless::metrics::{
+    LlmMetricsReport, MetricsReport, PilotMetricsReport, RetrievalMetricsReport,
+};
+
+/// LLM usage metrics report (read-only wrapper; getters return the wrapped fields as-is).
+#[pyclass(name = "LlmMetricsReport")]
+pub struct PyLlmMetricsReport {
+    pub(crate) inner: LlmMetricsReport,
+}
+
+#[pymethods]
+impl PyLlmMetricsReport {
+    /// Total number of LLM calls.
+    #[getter]
+    fn total_calls(&self) -> u64 {
+        self.inner.total_calls
+    }
+
+    /// Number of successful calls.
+    #[getter]
+    fn successful_calls(&self) -> u64 {
+        self.inner.successful_calls
+    }
+
+    /// Number of failed calls.
+    #[getter]
+    fn failed_calls(&self) -> u64 {
+        self.inner.failed_calls
+    }
+
+    /// Success rate (0.0 - 1.0).
+    #[getter]
+    fn success_rate(&self) -> f64 {
+        self.inner.success_rate
+    }
+
+    /// Total input tokens.
+    #[getter]
+    fn total_input_tokens(&self) -> u64 {
+        self.inner.total_input_tokens
+    }
+
+    /// Total output tokens.
+    #[getter]
+    fn total_output_tokens(&self) -> u64 {
+        self.inner.total_output_tokens
+    }
+
+    /// Total tokens (input + output), read from the report rather than summed here.
+    #[getter]
+    fn total_tokens(&self) -> u64 {
+        self.inner.total_tokens
+    }
+
+    /// Average latency per call in milliseconds.
+    #[getter]
+    fn avg_latency_ms(&self) -> f64 {
+        self.inner.avg_latency_ms
+    }
+
+    /// Total latency in milliseconds.
+    #[getter]
+    fn total_latency_ms(&self) -> u64 {
+        self.inner.total_latency_ms
+    }
+
+    /// Estimated cost in USD.
+    #[getter]
+    fn estimated_cost_usd(&self) -> f64 {
+        self.inner.estimated_cost_usd
+    }
+
+    /// Number of rate limit errors.
+    #[getter]
+    fn rate_limit_errors(&self) -> u64 {
+        self.inner.rate_limit_errors
+    }
+
+    /// Number of timeout errors.
+    #[getter]
+    fn timeout_errors(&self) -> u64 {
+        self.inner.timeout_errors
+    }
+
+    /// Number of fallback triggers.
+    #[getter]
+    fn fallback_triggers(&self) -> u64 {
+        self.inner.fallback_triggers
+    }
+
+    fn __repr__(&self) -> String {
+        format!(
+            "LlmMetricsReport(calls={}, tokens={}, cost=${:.4})",
+            self.inner.total_calls, self.inner.total_tokens, self.inner.estimated_cost_usd,
+        )
+    }
+}
+
+/// Pilot decision metrics report (read-only wrapper; getters return the wrapped fields as-is).
+#[pyclass(name = "PilotMetricsReport")]
+pub struct PyPilotMetricsReport {
+    pub(crate) inner: PilotMetricsReport,
+}
+
+#[pymethods]
+impl PyPilotMetricsReport {
+    /// Total number of Pilot decisions.
+    #[getter]
+    fn total_decisions(&self) -> u64 {
+        self.inner.total_decisions
+    }
+
+    /// Number of start guidance calls.
+    #[getter]
+    fn start_guidance_calls(&self) -> u64 {
+        self.inner.start_guidance_calls
+    }
+
+    /// Number of fork decisions.
+    #[getter]
+    fn fork_decisions(&self) -> u64 {
+        self.inner.fork_decisions
+    }
+
+    /// Number of backtrack calls.
+    #[getter]
+    fn backtrack_calls(&self) -> u64 {
+        self.inner.backtrack_calls
+    }
+
+    /// Number of evaluate calls.
+    #[getter]
+    fn evaluate_calls(&self) -> u64 {
+        self.inner.evaluate_calls
+    }
+
+    /// Decision accuracy based on feedback (0.0 - 1.0).
+    #[getter]
+    fn accuracy(&self) -> f64 {
+        self.inner.accuracy
+    }
+
+    /// Number of correct decisions.
+    #[getter]
+    fn correct_decisions(&self) -> u64 {
+        self.inner.correct_decisions
+    }
+
+    /// Number of incorrect decisions.
+    #[getter]
+    fn incorrect_decisions(&self) -> u64 {
+        self.inner.incorrect_decisions
+    }
+
+    /// Average confidence across all decisions.
+    #[getter]
+    fn avg_confidence(&self) -> f64 {
+        self.inner.avg_confidence
+    }
+
+    /// Number of LLM calls made by Pilot.
+    #[getter]
+    fn llm_calls(&self) -> u64 {
+        self.inner.llm_calls
+    }
+
+    /// Number of interventions.
+    #[getter]
+    fn interventions(&self) -> u64 {
+        self.inner.interventions
+    }
+
+    /// Number of skipped interventions.
+    #[getter]
+    fn skipped_interventions(&self) -> u64 {
+        self.inner.skipped_interventions
+    }
+
+    /// Number of budget exhausted events.
+    #[getter]
+    fn budget_exhausted(&self) -> u64 {
+        self.inner.budget_exhausted
+    }
+
+    /// Number of algorithm fallbacks.
+    #[getter]
+    fn algorithm_fallbacks(&self) -> u64 {
+        self.inner.algorithm_fallbacks
+    }
+
+    fn __repr__(&self) -> String {
+        format!(
+            "PilotMetricsReport(decisions={}, accuracy={:.2}, avg_confidence={:.2})",
+            self.inner.total_decisions, self.inner.accuracy, self.inner.avg_confidence,
+        )
+    }
+}
+
+/// Retrieval operation metrics report (read-only wrapper; getters return the wrapped fields as-is).
+#[pyclass(name = "RetrievalMetricsReport")]
+pub struct PyRetrievalMetricsReport {
+    pub(crate) inner: RetrievalMetricsReport,
+}
+
+#[pymethods]
+impl PyRetrievalMetricsReport {
+    /// Total number of queries.
+    #[getter]
+    fn total_queries(&self) -> u64 {
+        self.inner.total_queries
+    }
+
+    /// Total number of search iterations.
+    #[getter]
+    fn total_iterations(&self) -> u64 {
+        self.inner.total_iterations
+    }
+
+    /// Average iterations per query.
+    #[getter]
+    fn avg_iterations(&self) -> f64 {
+        self.inner.avg_iterations
+    }
+
+    /// Total nodes visited.
+    #[getter]
+    fn nodes_visited(&self) -> u64 {
+        self.inner.nodes_visited
+    }
+
+    /// Total paths found.
+    #[getter]
+    fn paths_found(&self) -> u64 {
+        self.inner.paths_found
+    }
+
+    /// Average path length.
+    #[getter]
+    fn avg_path_length(&self) -> f64 {
+        self.inner.avg_path_length
+    }
+
+    /// Average path score (0.0 - 1.0).
+    #[getter]
+    fn avg_path_score(&self) -> f64 {
+        self.inner.avg_path_score
+    }
+
+    /// Number of high-score paths (>= 0.5).
+    #[getter]
+    fn high_score_paths(&self) -> u64 {
+        self.inner.high_score_paths
+    }
+
+    /// Number of low-score paths (< 0.3).
+    #[getter]
+    fn low_score_paths(&self) -> u64 {
+        self.inner.low_score_paths
+    }
+
+    /// Number of cache hits.
+    #[getter]
+    fn cache_hits(&self) -> u64 {
+        self.inner.cache_hits
+    }
+
+    /// Number of cache misses.
+    #[getter]
+    fn cache_misses(&self) -> u64 {
+        self.inner.cache_misses
+    }
+
+    /// Cache hit rate (0.0 - 1.0).
+    #[getter]
+    fn cache_hit_rate(&self) -> f64 {
+        self.inner.cache_hit_rate
+    }
+
+    /// Total latency in milliseconds.
+    #[getter]
+    fn total_latency_ms(&self) -> u64 {
+        self.inner.total_latency_ms
+    }
+
+    /// Average latency per query in milliseconds.
+    #[getter]
+    fn avg_latency_ms(&self) -> f64 {
+        self.inner.avg_latency_ms
+    }
+
+    /// Number of backtracks.
+    #[getter]
+    fn backtracks(&self) -> u64 {
+        self.inner.backtracks
+    }
+
+    /// Number of sufficiency checks.
+    #[getter]
+    fn sufficiency_checks(&self) -> u64 {
+        self.inner.sufficiency_checks
+    }
+
+    /// Sufficiency rate (0.0 - 1.0).
+    #[getter]
+    fn sufficiency_rate(&self) -> f64 {
+        self.inner.sufficiency_rate
+    }
+
+    fn __repr__(&self) -> String {
+        format!(
+            "RetrievalMetricsReport(queries={}, avg_score={:.2}, cache_hit={:.1}%)",
+            self.inner.total_queries,
+            self.inner.avg_path_score,
+            self.inner.cache_hit_rate * 100.0, // scaled by 100 so the repr shows a percentage
+        )
+    }
+}
+
+/// Complete metrics report combining the LLM, Pilot and Retrieval subsystem metrics.
+#[pyclass(name = "MetricsReport")]
+pub struct PyMetricsReport {
+    pub(crate) inner: MetricsReport,
+}
+
+#[pymethods]
+impl PyMetricsReport {
+    /// LLM metrics (a cloned copy wrapped in a new `LlmMetricsReport` on each access).
+    #[getter]
+    fn llm(&self) -> PyLlmMetricsReport {
+        PyLlmMetricsReport {
+            inner: self.inner.llm.clone(),
+        }
+    }
+
+    /// Pilot metrics (a cloned copy wrapped in a new `PilotMetricsReport` on each access).
+    #[getter]
+    fn pilot(&self) -> PyPilotMetricsReport {
+        PyPilotMetricsReport {
+            inner: self.inner.pilot.clone(),
+        }
+    }
+
+    /// Retrieval metrics (a cloned copy wrapped in a new `RetrievalMetricsReport` on each access).
+    #[getter]
+    fn retrieval(&self) -> PyRetrievalMetricsReport {
+        PyRetrievalMetricsReport {
+            inner: self.inner.retrieval.clone(),
+        }
+    }
+
+    /// Total estimated cost in USD. Exposed as a method (no `#[getter]`): `report.total_cost_usd()`.
+    fn total_cost_usd(&self) -> f64 {
+        self.inner.total_cost_usd()
+    }
+
+    /// Overall success rate (0.0 - 1.0). Exposed as a method: `report.overall_success_rate()`.
+    fn overall_success_rate(&self) -> f64 {
+        self.inner.overall_success_rate()
+    }
+
+    fn __repr__(&self) -> String {
+        format!(
+            "MetricsReport(llm_calls={}, cost=${:.4}, queries={})",
+            self.inner.llm.total_calls,
+            self.inner.total_cost_usd(),
+            self.inner.retrieval.total_queries,
+        )
+    }
+}
diff --git a/python/src/results.rs b/python/src/results.rs
new file mode 100644
index 00000000..fe780a4c
--- /dev/null
+++ b/python/src/results.rs
@@ -0,0 +1,351 @@
+// Copyright (c) 2026 vectorless developers
+// SPDX-License-Identifier: Apache-2.0
+
+//! Query and index result Python wrappers.
+
+use pyo3::prelude::*;
+
+use ::vectorless::client::{FailedItem, IndexItem, IndexResult, QueryResult, QueryResultItem};
+use ::vectorless::metrics::IndexMetrics;
+
+// ============================================================
+// QueryResultItem
+// ============================================================
+
+/// A single document's query result: document ID, retrieved content, score and matched node IDs.
+#[pyclass(name = "QueryResultItem")]
+pub struct PyQueryResultItem {
+    pub(crate) inner: QueryResultItem,
+}
+
+#[pymethods]
+impl PyQueryResultItem {
+    /// The document ID.
+    #[getter]
+    fn doc_id(&self) -> &str {
+        &self.inner.doc_id
+    }
+
+    /// The retrieved content.
+    #[getter]
+    fn content(&self) -> &str {
+        &self.inner.content
+    }
+
+    /// Relevance score (0.0 to 1.0).
+    #[getter]
+    fn score(&self) -> f32 {
+        self.inner.score
+    }
+
+    /// Node IDs that matched (cloned into a new list on every access).
+    #[getter]
+    fn node_ids(&self) -> Vec<String> {
+        self.inner.node_ids.clone()
+    }
+
+    fn __repr__(&self) -> String {
+        format!(
+            "QueryResultItem(doc_id='{}', score={:.2}, content_len={})",
+            self.inner.doc_id,
+            self.inner.score,
+            self.inner.content.len() // UTF-8 byte length, which can exceed Python's len(content)
+        )
+    }
+}
+
+// ============================================================
+// FailedItem
+// ============================================================
+
+/// A failed item in a batch operation: the source that failed and its error message.
+#[pyclass(name = "FailedItem")]
+pub struct PyFailedItem {
+    pub(crate) inner: FailedItem,
+}
+
+#[pymethods]
+impl PyFailedItem {
+    /// Source description.
+    #[getter]
+    fn source(&self) -> &str {
+        &self.inner.source
+    }
+
+    /// Error message.
+    #[getter]
+    fn error(&self) -> &str {
+        &self.inner.error
+    }
+
+    fn __repr__(&self) -> String {
+        format!(
+            "FailedItem(source='{}', error='{}')",
+            self.inner.source, self.inner.error
+        )
+    }
+}
+
+// ============================================================
+// QueryResult
+// ============================================================
+
+/// Result of a document query: per-document result items plus any failed items.
+#[pyclass(name = "QueryResult")]
+pub struct PyQueryResult {
+    pub(crate) inner: QueryResult,
+}
+
+#[pymethods]
+impl PyQueryResult {
+    /// Result items (one per document); each access clones them into new wrapper objects.
+    #[getter]
+    fn items(&self) -> Vec<PyQueryResultItem> {
+        self.inner
+            .items
+            .iter()
+            .map(|i| PyQueryResultItem { inner: i.clone() })
+            .collect()
+    }
+
+    /// Get the first (single-doc) result item, or None when the core `single()` returns nothing.
+    fn single(&self) -> Option<PyQueryResultItem> {
+        self.inner
+            .single()
+            .map(|i| PyQueryResultItem { inner: i.clone() })
+    }
+
+    /// Number of result items.
+    fn __len__(&self) -> usize {
+        self.inner.len()
+    }
+
+    /// Whether any documents failed. Exposed as a method: `result.has_failures()`.
+    fn has_failures(&self) -> bool {
+        self.inner.has_failures()
+    }
+
+    /// Failed items (cloned into new wrapper objects on each access).
+    #[getter]
+    fn failed(&self) -> Vec<PyFailedItem> {
+        self.inner
+            .failed
+            .iter()
+            .map(|f| PyFailedItem { inner: f.clone() })
+            .collect()
+    }
+
+    fn __repr__(&self) -> String {
+        format!(
+            "QueryResult(items={}, failed={})",
+            self.inner.len(),
+            self.inner.failed.len()
+        )
+    }
+}
+
+// ============================================================
+// IndexMetrics
+// ============================================================
+
+/// Indexing pipeline metrics (per-stage timings, summary counts, LLM usage, index sizes).
+#[pyclass(name = "IndexMetrics")]
+pub struct PyIndexMetrics {
+    pub(crate) inner: IndexMetrics,
+}
+
+#[pymethods]
+impl PyIndexMetrics {
+    /// Total indexing time (ms), obtained from the core `total_time_ms()` method, not a field.
+    #[getter]
+    fn total_time_ms(&self) -> u64 {
+        self.inner.total_time_ms()
+    }
+
+    /// Parse stage duration (ms).
+    #[getter]
+    fn parse_time_ms(&self) -> u64 {
+        self.inner.parse_time_ms
+    }
+
+    /// Build stage duration (ms).
+    #[getter]
+    fn build_time_ms(&self) -> u64 {
+        self.inner.build_time_ms
+    }
+
+    /// Enhance (summary) stage duration (ms).
+    #[getter]
+    fn enhance_time_ms(&self) -> u64 {
+        self.inner.enhance_time_ms
+    }
+
+    /// Number of nodes processed.
+    #[getter]
+    fn nodes_processed(&self) -> usize {
+        self.inner.nodes_processed
+    }
+
+    /// Number of summaries successfully generated.
+    #[getter]
+    fn summaries_generated(&self) -> usize {
+        self.inner.summaries_generated
+    }
+
+    /// Number of summaries that failed to generate.
+    #[getter]
+    fn summaries_failed(&self) -> usize {
+        self.inner.summaries_failed
+    }
+
+    /// Number of LLM calls made.
+    #[getter]
+    fn llm_calls(&self) -> usize {
+        self.inner.llm_calls
+    }
+
+    /// Total tokens generated by LLM.
+    #[getter]
+    fn total_tokens_generated(&self) -> usize {
+        self.inner.total_tokens_generated
+    }
+
+    /// Number of topics in reasoning index.
+    #[getter]
+    fn topics_indexed(&self) -> usize {
+        self.inner.topics_indexed
+    }
+
+    /// Number of keywords in reasoning index.
+    #[getter]
+    fn keywords_indexed(&self) -> usize {
+        self.inner.keywords_indexed
+    }
+
+    fn __repr__(&self) -> String {
+        format!(
+            "IndexMetrics(total={}ms, summaries={}, failed={}, llm_calls={})",
+            self.inner.total_time_ms(),
+            self.inner.summaries_generated,
+            self.inner.summaries_failed,
+            self.inner.llm_calls,
+        )
+    }
+}
+
+// ============================================================
+// IndexItem / IndexResult
+// ============================================================
+
+/// A single indexed document item (ID, name, format, optional description/path/pages/metrics).
+#[pyclass(name = "IndexItem")]
+pub struct PyIndexItem {
+    pub(crate) inner: IndexItem,
+}
+
+#[pymethods]
+impl PyIndexItem {
+    #[getter]
+    fn doc_id(&self) -> &str {
+        &self.inner.doc_id
+    }
+
+    #[getter]
+    fn name(&self) -> &str {
+        &self.inner.name
+    }
+
+    #[getter]
+    fn format(&self) -> String {
+        format!("{:?}", self.inner.format).to_lowercase() // lowercased `Debug` rendering of the format
+    }
+
+    #[getter]
+    fn description(&self) -> Option<&str> {
+        self.inner.description.as_deref()
+    }
+
+    #[getter]
+    fn source_path(&self) -> Option<&str> {
+        self.inner.source_path.as_deref()
+    }
+
+    #[getter]
+    fn page_count(&self) -> Option<usize> {
+        self.inner.page_count
+    }
+
+    /// Indexing pipeline metrics (timing, LLM usage, etc.), or None when the item carries none.
+    #[getter]
+    fn metrics(&self) -> Option<PyIndexMetrics> {
+        self.inner
+            .metrics
+            .as_ref()
+            .map(|m| PyIndexMetrics { inner: m.clone() })
+    }
+
+    fn __repr__(&self) -> String {
+        format!(
+            "IndexItem(doc_id='{}', name='{}')",
+            self.inner.doc_id, self.inner.name
+        )
+    }
+}
+
+/// Result of a document indexing operation: the indexed items plus any failed items.
+#[pyclass(name = "IndexResult")]
+pub struct PyIndexResult {
+    pub(crate) inner: IndexResult,
+}
+
+#[pymethods]
+impl PyIndexResult {
+    /// The document ID (single-document convenience); None when the core `doc_id()` yields nothing.
+    #[getter]
+    fn doc_id(&self) -> Option<String> {
+        self.inner.doc_id().map(|s| s.to_string())
+    }
+
+    /// All indexed items (cloned into new wrapper objects on each access).
+    #[getter]
+    fn items(&self) -> Vec<PyIndexItem> {
+        self.inner
+            .items
+            .iter()
+            .map(|i| PyIndexItem { inner: i.clone() })
+            .collect()
+    }
+
+    /// Failed items (cloned into new wrapper objects on each access).
+    #[getter]
+    fn failed(&self) -> Vec<PyFailedItem> {
+        self.inner
+            .failed
+            .iter()
+            .map(|f| PyFailedItem { inner: f.clone() })
+            .collect()
+    }
+
+    /// Whether any items failed. Exposed as a method: `result.has_failures()`.
+    fn has_failures(&self) -> bool {
+        self.inner.has_failures()
+    }
+
+    /// Total number of items (successful + failed). Exposed as a method: `result.total()`.
+    fn total(&self) -> usize {
+        self.inner.total()
+    }
+
+    fn __len__(&self) -> usize { // `len(result)` delegates to the core `IndexResult::len()`
+        self.inner.len()
+    }
+
+    fn __repr__(&self) -> String {
+        format!(
+            "IndexResult(doc_id={:?}, count={}, failed={})",
+            self.inner.doc_id(),
+            self.inner.items.len(),
+            self.inner.failed.len()
+        )
+    }
+}
diff --git a/rust/examples/advanced.rs b/rust/examples/advanced.rs
deleted file mode 100644
index fa14e931..00000000
--- a/rust/examples/advanced.rs
+++ /dev/null
@@ -1,78 +0,0 @@
-// Copyright (c) 2026 vectorless developers
-// SPDX-License-Identifier: Apache-2.0
-
-//! Advanced usage example - Full Configuration.
-//!
-//! This example demonstrates how to use a configuration file
-//! for advanced use cases where you need fine-grained control.
-//!
-//! # Usage
-//!
-//! ```bash
-//! # Using environment variables for LLM config (overrides config file):
-//! LLM_API_KEY=sk-xxx LLM_MODEL=gpt-4o cargo run --example advanced
-//!
-//! # Or with defaults (using config file):
-//! cargo run --example advanced
-//! ```
-
-use vectorless::{EngineBuilder, IndexContext, QueryContext};
-
-#[tokio::main]
-async fn main() -> vectorless::Result<()> {
-    // Initialize tracing for debug output (set RUST_LOG=debug to see more)
-    tracing_subscriber::fmt::init();
-
-    println!("=== Vectorless Advanced Example (Config File) ===\n");
-
-    // Load all settings from the specified config file.
-    // The config file must include api_key and model.
-    // If environment variables are set, they override the config file values.
-    let mut builder = EngineBuilder::new().with_config_path("./config.toml");
-
-    // Override config with env vars if present
-    if let Ok(api_key) = std::env::var("LLM_API_KEY") {
-        builder = builder.with_key(&api_key);
-    }
-    if let Ok(model) = std::env::var("LLM_MODEL") {
-        builder = builder.with_model(&model);
-    }
-    if let Ok(endpoint) = std::env::var("LLM_ENDPOINT") {
-        builder = builder.with_endpoint(&endpoint);
-    }
-
-    let client = builder
-        .build()
-        .await
-        .map_err(|e: vectorless::BuildError| vectorless::Error::Config(e.to_string()))?;
-
-    println!("Client created with config file\n");
-
-    // Index a document
-    let result = client.index(IndexContext::from_path("./README.md")).await?;
-    let doc_id = result.doc_id().unwrap().to_string();
-    println!("Indexed: {}\n", doc_id);
-
-    // Query
-    let result = client
-        .query(
-            QueryContext::new("What features does Vectorless provide?")
-                .with_doc_ids(vec![doc_id.clone()]),
-        )
-        .await?;
-    println!("Query: What features does Vectorless provide?");
-    if let Some(item) = result.single() {
-        println!("Score: {:.2}", item.score);
-        if !item.content.is_empty() {
-            let preview: String = item.content.chars().take(200).collect();
-            println!("Result: {}...\n", preview);
-        }
-    }
-
-    // Cleanup
-    client.remove(&doc_id).await?;
-    println!("Cleaned up");
-
-    println!("\n=== Done ===");
-    Ok(())
-}
diff --git a/rust/src/client/builder.rs b/rust/src/client/builder.rs
index 7fea2913..b0c035cf 100644
--- a/rust/src/client/builder.rs
+++ b/rust/src/client/builder.rs
@@ -5,89 +5,37 @@
 //!
 //! This module provides [`EngineBuilder`] for configuring and building
 //! [`Engine`] instances with sensible defaults.
-//!
-//! # Configuration
-//!
-//! `api_key` and `model` are **required**. `endpoint` is optional
-//! (defaults to the model provider's standard endpoint).
-//!
-//! Configuration sources (later overrides earlier):
-//! 1. Default configuration
-//! 2. Config file (via `with_config_path`)
-//! 3. Builder methods (`with_key`, `with_model`, etc.) — highest priority
-//!
-//! # Examples
-//!
-//! ```rust,no_run
-//! use vectorless::client::EngineBuilder;
-//!
-//! # #[tokio::main]
-//! # async fn main() -> Result<(), vectorless::BuildError> {
-//! let engine = EngineBuilder::new()
-//!     .with_key("sk-...")
-//!     .with_model("gpt-4o")
-//!     .build()
-//!     .await?;
-//! # Ok(())
-//! # }
-//! ```
-//!
-//! ## With Custom Endpoint
-//!
-//! ```rust,no_run
-//! use vectorless::client::EngineBuilder;
-//!
-//! # #[tokio::main]
-//! # async fn main() -> Result<(), vectorless::BuildError> {
-//! let engine = EngineBuilder::new()
-//!     .with_key("sk-...")
-//!     .with_model("deepseek-chat")
-//!     .with_endpoint("https://api.deepseek.com/v1")
-//!     .build()
-//!     .await?;
-//! # Ok(())
-//! # }
-//! ```
-
-use crate::config::{Config, ConfigLoader, RetrievalConfig};
-use crate::memo::MemoStore;
-use crate::retrieval::PipelineRetriever;
-use crate::storage::Workspace;
-
-use super::engine::Engine;
-use crate::events::EventEmitter;
+
+use crate::{
+    client::engine::Engine, config::Config, events::EventEmitter, retrieval::PipelineRetriever,
+    storage::Workspace,
+};
 
 /// Builder for creating a [`Engine`] client.
 ///
-/// `api_key` and `model` are required and must be set via builder methods
-/// or provided through a config file.
+/// `api_key`, `model` and `endpoint` are **required**.
 ///
 /// # Example
 ///
 /// ```rust,no_run
 /// use vectorless::client::EngineBuilder;
 ///
-/// # #[tokio::main]
-/// # async fn main() -> Result<(), vectorless::BuildError> {
-/// let client = EngineBuilder::new()
-///     .with_key("sk-...")
-///     .with_model("gpt-4o")
-///     .build()
-///     .await?;
-/// # Ok(())
-/// # }
+/// #[tokio::main]
+/// async fn main() -> Result<(), vectorless::BuildError> {
+///     let client = EngineBuilder::new()
+///         .with_key("sk-...")
+///         .with_model("gpt-4o")
+///         .with_endpoint("https://api.xxx.com/v1")
+///         .build()
+///         .await?;
+///     Ok(())
+/// }
 /// ```
 #[derive(Debug)]
 pub struct EngineBuilder {
-    /// Configuration file path.
-    config_path: Option<std::path::PathBuf>,
-
-    /// Custom configuration.
+    /// Custom configuration for advanced tuning.
     config: Option<Config>,
 
-    /// Custom retrieval config.
-    retrieval_config: Option<RetrievalConfig>,
-
     /// Event emitter.
     events: Option<EventEmitter>,
 
@@ -99,18 +47,6 @@ pub struct EngineBuilder {
 
     /// LLM endpoint URL (override).
     endpoint: Option<String>,
-
-    /// Top-K for retrieval (override).
-    top_k: Option<usize>,
-
-    /// Fast mode flag.
-    fast_mode: bool,
-
-    /// Precise mode flag.
-    precise_mode: bool,
-
-    /// Memo store for caching LLM decisions.
-    memo_store: Option<MemoStore>,
 }
 
 impl EngineBuilder {
@@ -118,17 +54,11 @@ impl EngineBuilder {
     #[must_use]
     pub fn new() -> Self {
         Self {
-            config_path: None,
             config: None,
-            retrieval_config: None,
             events: None,
             api_key: None,
             model: None,
             endpoint: None,
-            top_k: None,
-            fast_mode: false,
-            precise_mode: false,
-            memo_store: None,
         }
     }
 
@@ -136,31 +66,17 @@ impl EngineBuilder {
     // Basic Configuration
     // ============================================================
 
-    /// Set the configuration file path.
-    ///
-    /// The file must be a valid TOML configuration. No auto-detection is performed.
-    #[must_use]
-    pub fn with_config_path(mut self, path: impl Into<std::path::PathBuf>) -> Self {
-        self.config_path = Some(path.into());
-        self
-    }
-
-    /// Set a custom configuration object.
+    /// Set a custom configuration.
     ///
-    /// This overrides any config file settings.
+    /// When provided, this replaces the default [`Config`] entirely.
+    /// Builder methods (`with_key`, `with_model`, `with_endpoint`)
+    /// will still override the corresponding fields on top of this config.
     #[must_use]
     pub fn with_config(mut self, config: Config) -> Self {
         self.config = Some(config);
         self
     }
 
-    /// Set custom retrieval configuration.
-    #[must_use]
-    pub fn with_retrieval_config(mut self, config: RetrievalConfig) -> Self {
-        self.retrieval_config = Some(config);
-        self
-    }
-
     /// Set the event emitter for callbacks.
     #[must_use]
     pub fn with_events(mut self, events: EventEmitter) -> Self {
@@ -168,40 +84,6 @@ impl EngineBuilder {
         self
     }
 
-    /// Set a memo store for caching LLM decisions.
-    ///
-    /// When enabled, the pilot will cache navigation decisions based on
-    /// context fingerprints, avoiding redundant API calls for similar
-    /// navigation scenarios.
-    ///
-    /// # Example
-    ///
-    /// ```rust,no_run
-    /// use vectorless::client::EngineBuilder;
-    /// use vectorless::memo::MemoStore;
-    /// use chrono::Duration;
-    ///
-    /// # #[tokio::main]
-    /// # async fn main() -> Result<(), vectorless::BuildError> {
-    /// let memo_store = MemoStore::new()
-    ///     .with_ttl(Duration::days(7))
-    ///     .with_model("gpt-4o");
-    ///
-    /// let engine = EngineBuilder::new()
-    ///     .with_key("sk-...")
-    ///     .with_model("gpt-4o")
-    ///     .with_memo_store(memo_store)
-    ///     .build()
-    ///     .await?;
-    /// # Ok(())
-    /// # }
-    /// ```
-    #[must_use]
-    pub fn with_memo_store(mut self, store: MemoStore) -> Self {
-        self.memo_store = Some(store);
-        self
-    }
-
     // ============================================================
     // LLM Configuration
     // ============================================================
@@ -281,45 +163,6 @@ impl EngineBuilder {
     // Retrieval Configuration
     // ============================================================
 
-    /// Set the number of results to return from queries.
-    ///
-    /// Default is 5. Higher values return more context but cost more tokens.
-    #[must_use]
-    pub fn with_top_k(mut self, k: usize) -> Self {
-        self.top_k = Some(k);
-        self
-    }
-
-    // ============================================================
-    // Preset Configurations
-    // ============================================================
-
-    /// Enable fast mode for quicker but less thorough retrieval.
-    ///
-    /// Fast mode uses:
-    /// - Keyword-based retrieval (no LLM calls)
-    /// - Lower beam width / MCTS simulations
-    /// - Lazy summary generation
-    #[must_use]
-    pub fn fast(mut self) -> Self {
-        self.fast_mode = true;
-        self.precise_mode = false;
-        self
-    }
-
-    /// Enable precise mode for higher quality retrieval.
-    ///
-    /// Precise mode uses:
-    /// - MCTS-based retrieval
-    /// - Higher simulation count
-    /// - Full summary generation
-    #[must_use]
-    pub fn precise(mut self) -> Self {
-        self.precise_mode = true;
-        self.fast_mode = false;
-        self
-    }
-
     /// Build the Engine client.
     ///
     /// `api_key` and `model` must be provided via builder methods or config file.
@@ -347,22 +190,8 @@ impl EngineBuilder {
     /// # }
     /// ```
     pub async fn build(self) -> Result<Engine, BuildError> {
-        // Load or create configuration
-        let mut config = if let Some(config) = self.config {
-            config
-        } else if let Some(path) = self.config_path {
-            ConfigLoader::new()
-                .file(&path)
-                .load()
-                .map_err(|e| BuildError::Config(e.to_string()))?
-        } else {
-            Config::default()
-        };
-
-        // Apply builder overrides to retrieval config
-        if let Some(retrieval_config) = self.retrieval_config {
-            config.retrieval = retrieval_config;
-        }
+        // Use the caller-supplied configuration, falling back to `Config::default()`
+        let mut config = self.config.unwrap_or_default();
 
         // Apply individual overrides to LlmPoolConfig (primary) + legacy config (compat)
         if let Some(api_key) = self.api_key {
@@ -392,18 +221,6 @@ impl EngineBuilder {
             config.retrieval.endpoint = endpoint.clone();
             config.summary.endpoint = endpoint;
         }
-        if let Some(top_k) = self.top_k {
-            config.retrieval.top_k = top_k;
-        }
-
-        // Apply preset modes
-        if self.fast_mode {
-            config.retrieval.search.max_iterations = 5;
-        }
-        if self.precise_mode {
-            config.retrieval.search.max_iterations = 100;
-        }
-
         // Validate required settings
         let resolved_key = config
             .llm
@@ -423,6 +240,9 @@ impl EngineBuilder {
         if retrieval_model.is_empty() {
             return Err(BuildError::MissingModel);
         }
+        if config.llm.endpoint.is_none() {
+            return Err(BuildError::MissingEndpoint);
+        }
 
         // Open workspace from config
         let workspace = Workspace::new(&config.storage.workspace_dir)
@@ -456,15 +276,6 @@ impl EngineBuilder {
                 retriever.with_content_config(retrieval_config.content.to_aggregator_config());
         }
 
-        // Add memo store if provided or create default
-        if let Some(memo_store) = self.memo_store {
-            retriever = retriever.with_memo_store(memo_store);
-        } else {
-            // Create default memo store with model from config
-            let memo_store = MemoStore::new().with_model(retrieval_model).with_version(1);
-            retriever = retriever.with_memo_store(memo_store);
-        }
-
         // Build engine
         let events = self.events.unwrap_or_default();
         Engine::with_components(config, workspace, retriever, indexer, events)
@@ -482,10 +293,6 @@ impl Default for EngineBuilder {
 /// Error during client build.
 #[derive(Debug, thiserror::Error)]
 pub enum BuildError {
-    /// Configuration error.
-    #[error("Configuration error: {0}")]
-    Config(String),
-
     /// Workspace error.
     #[error("Workspace error: {0}")]
     Workspace(String),
@@ -498,6 +305,12 @@ pub enum BuildError {
     #[error("Missing model: call .with_model(\"gpt-4o\") or set model in config file")]
     MissingModel,
 
+    /// Missing endpoint URL.
+    #[error(
+        "Missing endpoint: call .with_endpoint(\"https://api.xxx.com/v1\") or set endpoint in config"
+    )]
+    MissingEndpoint,
+
     /// Other error.
     #[error("{0}")]
     Other(String),
@@ -507,13 +320,6 @@ pub enum BuildError {
 mod tests {
     use super::*;
 
-    #[test]
-    fn test_builder_defaults() {
-        let builder = EngineBuilder::new();
-        assert!(!builder.fast_mode);
-        assert!(!builder.precise_mode);
-    }
-
     #[test]
     fn test_builder_with_key() {
         let builder = EngineBuilder::new().with_key("sk-test-key");
@@ -537,27 +343,4 @@ mod tests {
         assert_eq!(builder.model, Some("gpt-4o-mini".to_string()));
         assert_eq!(builder.api_key, Some("sk-test".to_string()));
     }
-
-    #[test]
-    fn test_builder_fast_mode() {
-        let builder = EngineBuilder::new().fast();
-
-        assert!(builder.fast_mode);
-        assert!(!builder.precise_mode);
-    }
-
-    #[test]
-    fn test_builder_precise_mode() {
-        let builder = EngineBuilder::new().precise();
-
-        assert!(builder.precise_mode);
-        assert!(!builder.fast_mode);
-    }
-
-    #[test]
-    fn test_builder_top_k() {
-        let builder = EngineBuilder::new().with_top_k(10);
-
-        assert_eq!(builder.top_k, Some(10));
-    }
 }
diff --git a/rust/src/client/engine.rs b/rust/src/client/engine.rs
index 5c909c36..6cc4e207 100644
--- a/rust/src/client/engine.rs
+++ b/rust/src/client/engine.rs
@@ -19,6 +19,7 @@
 //! let engine = EngineBuilder::new()
 //!     .with_key("sk-...")
 //!     .with_model("gpt-4o")
+//!     .with_endpoint("https://api.openai.com/v1")
 //!     .build()
 //!     .await?;
 //!
@@ -36,28 +37,33 @@
 //! # }
 //! ```
 
-use std::collections::HashMap;
-use std::sync::Arc;
+use std::{collections::HashMap, sync::Arc};
 
 use futures::StreamExt;
 use tracing::info;
 
-use crate::config::Config;
-use crate::error::Result;
-use crate::index::PipelineOptions;
-use crate::index::incremental::{self, IndexAction};
-use crate::metrics::MetricsHub;
-use crate::retrieval::{PipelineRetriever, RetrieveEventReceiver};
-use crate::storage::{PersistedDocument, Workspace};
-use crate::{DocumentTree, Error};
-
-use super::index_context::{IndexContext, IndexSource};
-use super::indexer::IndexerClient;
-use super::query_context::{QueryContext, QueryScope};
-use super::retriever::RetrieverClient;
-use super::types::{DocumentInfo, FailedItem, IndexItem, IndexMode, IndexResult, QueryResult};
-use super::workspace::WorkspaceClient;
-use crate::events::EventEmitter;
+use crate::{
+    DocumentTree, Error,
+    config::Config,
+    error::Result,
+    events::EventEmitter,
+    index::{
+        PipelineOptions,
+        incremental::{self, IndexAction},
+    },
+    metrics::MetricsHub,
+    retrieval::{PipelineRetriever, RetrieveEventReceiver},
+    storage::{PersistedDocument, Workspace},
+};
+
+use super::{
+    index_context::{IndexContext, IndexSource},
+    indexer::IndexerClient,
+    query_context::{QueryContext, QueryScope},
+    retriever::RetrieverClient,
+    types::{DocumentInfo, FailedItem, IndexItem, IndexMode, IndexResult, QueryResult},
+    workspace::WorkspaceClient,
+};
 
 /// The main Engine client.
 ///
diff --git a/rust/src/config/mod.rs b/rust/src/config/mod.rs
index 0a347826..f6d26927 100644
--- a/rust/src/config/mod.rs
+++ b/rust/src/config/mod.rs
@@ -11,9 +11,9 @@ mod merge;
 mod types;
 mod validator;
 
-pub(crate) use loader::ConfigLoader;
+pub use types::Config;
 pub(crate) use types::{
-    CacheConfig, CompressionAlgorithm, ConcurrencyConfig, Config, FallbackBehavior, FallbackConfig,
+    CacheConfig, CompressionAlgorithm, ConcurrencyConfig, FallbackBehavior, FallbackConfig,
     IndexerConfig, LlmClientConfig, LlmConfig, LlmMetricsConfig, LlmPoolConfig, MetricsConfig,
     OnAllFailedBehavior, PilotMetricsConfig, RetrievalConfig, RetrievalMetricsConfig,
     SufficiencyConfig, SummaryConfig,
diff --git a/rust/src/lib.rs b/rust/src/lib.rs
index 7541d900..26dcceae 100644
--- a/rust/src/lib.rs
+++ b/rust/src/lib.rs
@@ -4,11 +4,9 @@
 
 //! # Vectorless
 //!
-//! An ultra-performant reasoning-native document intelligence engine for AI.
-//!
-//! It transforms documents into rich semantic trees and uses LLMs to
-//! intelligently traverse the hierarchy — retrieving the most relevant content
-//! through structural reasoning and deep contextual understanding.
+//! A document engine for AI. It transforms documents into hierarchical semantic
+//! trees and uses the LLM itself to navigate and retrieve — purely LLM-guided,
+//! from indexing to querying. No vector databases, no embeddings, no similarity search.
 //!
 //! ## Quick Start
 //!
@@ -36,7 +34,8 @@
 //! ```
 
 pub mod client;
-mod config;
+pub mod config;
+pub use config::Config;
 pub mod document;
 pub mod error;
 pub mod events;